thys2/blexer2.sc
author Chengsong
Mon, 02 May 2022 00:23:39 +0100
changeset 500 4d9eecfc936a
parent 494 c730d018ebfa
child 514 036600af4c30
permissions -rw-r--r--
sad
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
431
Chengsong
parents:
diff changeset
     1
// A simple lexer inspired by work of Sulzmann & Lu
Chengsong
parents:
diff changeset
     2
//==================================================
Chengsong
parents:
diff changeset
     3
//
Chengsong
parents:
diff changeset
     4
// Call the test cases with 
Chengsong
parents:
diff changeset
     5
//
Chengsong
parents:
diff changeset
     6
//   amm lexer.sc small
Chengsong
parents:
diff changeset
     7
//   amm lexer.sc fib
Chengsong
parents:
diff changeset
     8
//   amm lexer.sc loops
Chengsong
parents:
diff changeset
     9
//   amm lexer.sc email
Chengsong
parents:
diff changeset
    10
//
Chengsong
parents:
diff changeset
    11
//   amm lexer.sc all
Chengsong
parents:
diff changeset
    12
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    13
import scala.util.Try
431
Chengsong
parents:
diff changeset
    14
Chengsong
parents:
diff changeset
    15
// regular expressions including records
Chengsong
parents:
diff changeset
    16
abstract class Rexp 
Chengsong
parents:
diff changeset
    17
case object ZERO extends Rexp
Chengsong
parents:
diff changeset
    18
case object ONE extends Rexp
Chengsong
parents:
diff changeset
    19
case object ANYCHAR extends Rexp
Chengsong
parents:
diff changeset
    20
case class CHAR(c: Char) extends Rexp
Chengsong
parents:
diff changeset
    21
case class ALTS(r1: Rexp, r2: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    22
case class SEQ(r1: Rexp, r2: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    23
case class STAR(r: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    24
case class RECD(x: String, r: Rexp) extends Rexp  
Chengsong
parents:
diff changeset
    25
case class NTIMES(n: Int, r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    26
case class OPTIONAL(r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    27
case class NOT(r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    28
                // records for extracting strings or tokens
Chengsong
parents:
diff changeset
    29
  
Chengsong
parents:
diff changeset
    30
// values  
Chengsong
parents:
diff changeset
    31
abstract class Val
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    32
case object Failure extends Val
431
Chengsong
parents:
diff changeset
    33
case object Empty extends Val
Chengsong
parents:
diff changeset
    34
case class Chr(c: Char) extends Val
Chengsong
parents:
diff changeset
    35
case class Sequ(v1: Val, v2: Val) extends Val
Chengsong
parents:
diff changeset
    36
case class Left(v: Val) extends Val
Chengsong
parents:
diff changeset
    37
case class Right(v: Val) extends Val
Chengsong
parents:
diff changeset
    38
case class Stars(vs: List[Val]) extends Val
Chengsong
parents:
diff changeset
    39
case class Rec(x: String, v: Val) extends Val
Chengsong
parents:
diff changeset
    40
case class Ntime(vs: List[Val]) extends Val
Chengsong
parents:
diff changeset
    41
case class Optionall(v: Val) extends Val
Chengsong
parents:
diff changeset
    42
case class Nots(s: String) extends Val
Chengsong
parents:
diff changeset
    43
Chengsong
parents:
diff changeset
    44
Chengsong
parents:
diff changeset
    45
Chengsong
parents:
diff changeset
    46
abstract class Bit
Chengsong
parents:
diff changeset
    47
case object Z extends Bit
Chengsong
parents:
diff changeset
    48
case object S extends Bit
Chengsong
parents:
diff changeset
    49
Chengsong
parents:
diff changeset
    50
Chengsong
parents:
diff changeset
    51
type Bits = List[Bit]
Chengsong
parents:
diff changeset
    52
Chengsong
parents:
diff changeset
    53
abstract class ARexp 
Chengsong
parents:
diff changeset
    54
case object AZERO extends ARexp
Chengsong
parents:
diff changeset
    55
case class AONE(bs: Bits) extends ARexp
Chengsong
parents:
diff changeset
    56
case class ACHAR(bs: Bits, c: Char) extends ARexp
Chengsong
parents:
diff changeset
    57
case class AALTS(bs: Bits, rs: List[ARexp]) extends ARexp 
Chengsong
parents:
diff changeset
    58
case class ASEQ(bs: Bits, r1: ARexp, r2: ARexp) extends ARexp 
Chengsong
parents:
diff changeset
    59
case class ASTAR(bs: Bits, r: ARexp) extends ARexp 
Chengsong
parents:
diff changeset
    60
case class ANOT(bs: Bits, r: ARexp) extends ARexp
Chengsong
parents:
diff changeset
    61
case class AANYCHAR(bs: Bits) extends ARexp
Chengsong
parents:
diff changeset
    62
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    63
trait Generator[+T] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    64
    self => // an alias for "this"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    65
    def generate(): T
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    66
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    67
    def gen(n: Int) : List[T] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    68
      if (n == 0) Nil else self.generate() :: gen(n - 1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    69
    
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    70
    def map[S](f: T => S): Generator[S] = new Generator[S] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    71
      def generate = f(self.generate())  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    72
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    73
    def flatMap[S](f: T => Generator[S]): Generator[S] = new Generator[S] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    74
      def generate = f(self.generate()).generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    75
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    76
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    77
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    78
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    79
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    80
  // tests a property according to a given random generator
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    81
  def test[T](r: Generator[T], amount: Int = 100)(pred: T => Boolean) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    82
    for (_ <- 0 until amount) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    83
      val value = r.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    84
      assert(pred(value), s"Test failed for: $value")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    85
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    86
    println(s"Test passed $amount times")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    87
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    88
  def test2[T, S](r: Generator[T], s: Generator[S], amount: Int = 100)(pred: (T, S) => Boolean) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    89
    for (_ <- 0 until amount) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    90
      val valueR = r.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    91
      val valueS = s.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    92
      assert(pred(valueR, valueS), s"Test failed for: $valueR, $valueS")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    93
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    94
    println(s"Test passed $amount times")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    95
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    96
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    97
// random integers
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    98
val integers = new Generator[Int] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    99
  val rand = new java.util.Random
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   100
  def generate() = rand.nextInt()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   101
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   102
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   103
// random booleans
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   104
val booleans = integers.map(_ > 0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   105
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   106
// random integers in the range lo and high  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   107
def range(lo: Int, hi: Int): Generator[Int] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   108
  for (x <- integers) yield (lo + x.abs % (hi - lo)).abs
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   109
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   110
// random characters
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   111
def chars_range(lo: Char, hi: Char) = range(lo, hi).map(_.toChar)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   112
val chars = chars_range('a', 'z')
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   113
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   114
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   115
def oneOf[T](xs: T*): Generator[T] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   116
  for (idx <- range(0, xs.length)) yield xs(idx)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   117
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   118
def single[T](x: T) = new Generator[T] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   119
  def generate() = x
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   120
}   
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   121
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   122
def pairs[T, U](t: Generator[T], u: Generator[U]): Generator[(T, U)] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   123
  for (x <- t; y <- u) yield (x, y)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   124
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   125
// lists
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   126
def emptyLists = single(Nil) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   127
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   128
def nonEmptyLists : Generator[List[Int]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   129
  for (head <- integers; tail <- lists) yield head :: tail
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   130
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   131
def lists: Generator[List[Int]] = for {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   132
  kind <- booleans
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   133
  list <- if (kind) emptyLists else nonEmptyLists
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   134
} yield list
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   135
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   136
def char_list(len: Int): Generator[List[Char]] = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   137
  if(len <= 0) single(Nil)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   138
  else{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   139
    for { 
500
Chengsong
parents: 494
diff changeset
   140
      c <- chars_range('a', 'c')
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   141
      tail <- char_list(len - 1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   142
    } yield c :: tail
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   143
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   144
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   145
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   146
def strings(len: Int): Generator[String] = for(cs <- char_list(len)) yield cs.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   147
493
Chengsong
parents: 492
diff changeset
   148
def sampleString(r: Rexp) : List[String] = r match {
Chengsong
parents: 492
diff changeset
   149
  case STAR(r) => stringsFromRexp(r).flatMap(s => List("", s, s ++ s))//only generate 0, 1, 2 reptitions
Chengsong
parents: 492
diff changeset
   150
  case SEQ(r1, r2) => stringsFromRexp(r1).flatMap(s1 => stringsFromRexp(r2).map(s2 => s1 ++ s2) )
Chengsong
parents: 492
diff changeset
   151
  case ALTS(r1, r2) => throw new Error(s" Rexp ${r} not expected: all alternatives are supposed to have been opened up")
Chengsong
parents: 492
diff changeset
   152
  case ONE => "" :: Nil
Chengsong
parents: 492
diff changeset
   153
  case ZERO => Nil
Chengsong
parents: 492
diff changeset
   154
  case CHAR(c) => c.toString :: Nil
Chengsong
parents: 492
diff changeset
   155
Chengsong
parents: 492
diff changeset
   156
}
Chengsong
parents: 492
diff changeset
   157
Chengsong
parents: 492
diff changeset
   158
def stringsFromRexp(r: Rexp) : List[String] = 
Chengsong
parents: 492
diff changeset
   159
  breakIntoTerms(r).flatMap(r => sampleString(r))
Chengsong
parents: 492
diff changeset
   160
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   161
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   162
// (simple) binary trees
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   163
trait Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   164
case class Inner[T](left: Tree[T], right: Tree[T]) extends Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   165
case class Leaf[T](x: T) extends Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   166
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   167
def leafs[T](t: Generator[T]): Generator[Leaf[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   168
  for (x <- t) yield Leaf(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   169
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   170
def inners[T](t: Generator[T]): Generator[Inner[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   171
  for (l <- trees(t); r <- trees(t)) yield Inner(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   172
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   173
def trees[T](t: Generator[T]): Generator[Tree[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   174
  for (kind <- range(0, 2);  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   175
       tree <- if (kind == 0) leafs(t) else inners(t)) yield tree
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   176
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   177
// regular expressions
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   178
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   179
// generates random leaf-regexes; prefers CHAR-regexes
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   180
def leaf_rexp() : Generator[Rexp] =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   181
  for (kind <- range(0, 5);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   182
       c <- chars_range('a', 'd')) yield
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   183
    kind match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   184
      case 0 => ZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   185
      case 1 => ONE
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   186
      case _ => CHAR(c) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   187
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   188
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   189
// generates random inner regexes with maximum depth d
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   190
def inner_rexp(d: Int) : Generator[Rexp] =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   191
  for (kind <- range(0, 3);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   192
       l <- rexp(d); 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   193
       r <- rexp(d))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   194
  yield kind match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   195
    case 0 => ALTS(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   196
    case 1 => SEQ(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   197
    case 2 => STAR(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   198
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   199
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   200
// generates random regexes with maximum depth d;
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   201
// prefers inner regexes in 2/3 of the cases
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   202
def rexp(d: Int = 100): Generator[Rexp] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   203
  for (kind <- range(0, 3);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   204
       r <- if (d <= 0 || kind == 0) leaf_rexp() else inner_rexp(d - 1)) yield r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   205
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   206
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   207
// some test functions for rexps
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   208
def height(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   209
  case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   210
  case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   211
  case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   212
  case ALTS(r1, r2) => 1 + List(height(r1), height(r2)).max
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   213
  case SEQ(r1, r2) =>  1 + List(height(r1), height(r2)).max
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   214
  case STAR(r) => 1 + height(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   215
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   216
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   217
// def size(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   218
//   case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   219
//   case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   220
//   case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   221
//   case ALTS(r1, r2) => 1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   222
//   case SEQ(r1, r2) =>  1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   223
//   case STAR(r) => 1 + size(r) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   224
// }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   225
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   226
// randomly subtracts 1 or 2 from the STAR case
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   227
def size_faulty(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   228
  case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   229
  case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   230
  case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   231
  case ALTS(r1, r2) => 1 + size_faulty(r1) + size_faulty(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   232
  case SEQ(r1, r2) =>  1 + size_faulty(r1) + size_faulty(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   233
  case STAR(r) => 1 + size_faulty(r) - range(0, 2).generate
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   234
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   235
431
Chengsong
parents:
diff changeset
   236
Chengsong
parents:
diff changeset
   237
   
Chengsong
parents:
diff changeset
   238
// some convenience for typing in regular expressions
Chengsong
parents:
diff changeset
   239
Chengsong
parents:
diff changeset
   240
def charlist2rexp(s : List[Char]): Rexp = s match {
Chengsong
parents:
diff changeset
   241
  case Nil => ONE
Chengsong
parents:
diff changeset
   242
  case c::Nil => CHAR(c)
Chengsong
parents:
diff changeset
   243
  case c::s => SEQ(CHAR(c), charlist2rexp(s))
Chengsong
parents:
diff changeset
   244
}
Chengsong
parents:
diff changeset
   245
implicit def string2rexp(s : String) : Rexp = 
Chengsong
parents:
diff changeset
   246
  charlist2rexp(s.toList)
Chengsong
parents:
diff changeset
   247
Chengsong
parents:
diff changeset
   248
implicit def RexpOps(r: Rexp) = new {
Chengsong
parents:
diff changeset
   249
  def | (s: Rexp) = ALTS(r, s)
Chengsong
parents:
diff changeset
   250
  def % = STAR(r)
Chengsong
parents:
diff changeset
   251
  def ~ (s: Rexp) = SEQ(r, s)
Chengsong
parents:
diff changeset
   252
}
Chengsong
parents:
diff changeset
   253
Chengsong
parents:
diff changeset
   254
implicit def stringOps(s: String) = new {
Chengsong
parents:
diff changeset
   255
  def | (r: Rexp) = ALTS(s, r)
Chengsong
parents:
diff changeset
   256
  def | (r: String) = ALTS(s, r)
Chengsong
parents:
diff changeset
   257
  def % = STAR(s)
Chengsong
parents:
diff changeset
   258
  def ~ (r: Rexp) = SEQ(s, r)
Chengsong
parents:
diff changeset
   259
  def ~ (r: String) = SEQ(s, r)
Chengsong
parents:
diff changeset
   260
  def $ (r: Rexp) = RECD(s, r)
Chengsong
parents:
diff changeset
   261
}
Chengsong
parents:
diff changeset
   262
Chengsong
parents:
diff changeset
   263
def nullable(r: Rexp) : Boolean = r match {
Chengsong
parents:
diff changeset
   264
  case ZERO => false
Chengsong
parents:
diff changeset
   265
  case ONE => true
Chengsong
parents:
diff changeset
   266
  case CHAR(_) => false
Chengsong
parents:
diff changeset
   267
  case ANYCHAR => false
Chengsong
parents:
diff changeset
   268
  case ALTS(r1, r2) => nullable(r1) || nullable(r2)
Chengsong
parents:
diff changeset
   269
  case SEQ(r1, r2) => nullable(r1) && nullable(r2)
Chengsong
parents:
diff changeset
   270
  case STAR(_) => true
Chengsong
parents:
diff changeset
   271
  case RECD(_, r1) => nullable(r1)
Chengsong
parents:
diff changeset
   272
  case NTIMES(n, r) => if (n == 0) true else nullable(r)
Chengsong
parents:
diff changeset
   273
  case OPTIONAL(r) => true
Chengsong
parents:
diff changeset
   274
  case NOT(r) => !nullable(r)
Chengsong
parents:
diff changeset
   275
}
Chengsong
parents:
diff changeset
   276
Chengsong
parents:
diff changeset
   277
def der(c: Char, r: Rexp) : Rexp = r match {
Chengsong
parents:
diff changeset
   278
  case ZERO => ZERO
Chengsong
parents:
diff changeset
   279
  case ONE => ZERO
Chengsong
parents:
diff changeset
   280
  case CHAR(d) => if (c == d) ONE else ZERO
Chengsong
parents:
diff changeset
   281
  case ANYCHAR => ONE 
Chengsong
parents:
diff changeset
   282
  case ALTS(r1, r2) => ALTS(der(c, r1), der(c, r2))
Chengsong
parents:
diff changeset
   283
  case SEQ(r1, r2) => 
Chengsong
parents:
diff changeset
   284
    if (nullable(r1)) ALTS(SEQ(der(c, r1), r2), der(c, r2))
Chengsong
parents:
diff changeset
   285
    else SEQ(der(c, r1), r2)
Chengsong
parents:
diff changeset
   286
  case STAR(r) => SEQ(der(c, r), STAR(r))
Chengsong
parents:
diff changeset
   287
  case RECD(_, r1) => der(c, r1)
Chengsong
parents:
diff changeset
   288
  case NTIMES(n, r) => if(n > 0) SEQ(der(c, r), NTIMES(n - 1, r)) else ZERO
Chengsong
parents:
diff changeset
   289
  case OPTIONAL(r) => der(c, r)
Chengsong
parents:
diff changeset
   290
  case NOT(r) =>  NOT(der(c, r))
Chengsong
parents:
diff changeset
   291
}
Chengsong
parents:
diff changeset
   292
Chengsong
parents:
diff changeset
   293
Chengsong
parents:
diff changeset
   294
// extracts a string from a value
Chengsong
parents:
diff changeset
   295
def flatten(v: Val) : String = v match {
Chengsong
parents:
diff changeset
   296
  case Empty => ""
Chengsong
parents:
diff changeset
   297
  case Chr(c) => c.toString
Chengsong
parents:
diff changeset
   298
  case Left(v) => flatten(v)
Chengsong
parents:
diff changeset
   299
  case Right(v) => flatten(v)
Chengsong
parents:
diff changeset
   300
  case Sequ(v1, v2) => flatten(v1) ++ flatten(v2)
Chengsong
parents:
diff changeset
   301
  case Stars(vs) => vs.map(flatten).mkString
Chengsong
parents:
diff changeset
   302
  case Ntime(vs) => vs.map(flatten).mkString
Chengsong
parents:
diff changeset
   303
  case Optionall(v) => flatten(v)
Chengsong
parents:
diff changeset
   304
  case Rec(_, v) => flatten(v)
Chengsong
parents:
diff changeset
   305
}
Chengsong
parents:
diff changeset
   306
Chengsong
parents:
diff changeset
   307
Chengsong
parents:
diff changeset
   308
// extracts an environment from a value;
Chengsong
parents:
diff changeset
   309
// used for tokenising a string
Chengsong
parents:
diff changeset
   310
def env(v: Val) : List[(String, String)] = v match {
Chengsong
parents:
diff changeset
   311
  case Empty => Nil
Chengsong
parents:
diff changeset
   312
  case Chr(c) => Nil
Chengsong
parents:
diff changeset
   313
  case Left(v) => env(v)
Chengsong
parents:
diff changeset
   314
  case Right(v) => env(v)
Chengsong
parents:
diff changeset
   315
  case Sequ(v1, v2) => env(v1) ::: env(v2)
Chengsong
parents:
diff changeset
   316
  case Stars(vs) => vs.flatMap(env)
Chengsong
parents:
diff changeset
   317
  case Ntime(vs) => vs.flatMap(env)
Chengsong
parents:
diff changeset
   318
  case Rec(x, v) => (x, flatten(v))::env(v)
Chengsong
parents:
diff changeset
   319
  case Optionall(v) => env(v)
Chengsong
parents:
diff changeset
   320
  case Nots(s) => ("Negative", s) :: Nil
Chengsong
parents:
diff changeset
   321
}
Chengsong
parents:
diff changeset
   322
Chengsong
parents:
diff changeset
   323
Chengsong
parents:
diff changeset
   324
// The injection and mkeps part of the lexer
Chengsong
parents:
diff changeset
   325
//===========================================
Chengsong
parents:
diff changeset
   326
Chengsong
parents:
diff changeset
   327
def mkeps(r: Rexp) : Val = r match {
Chengsong
parents:
diff changeset
   328
  case ONE => Empty
Chengsong
parents:
diff changeset
   329
  case ALTS(r1, r2) => 
Chengsong
parents:
diff changeset
   330
    if (nullable(r1)) Left(mkeps(r1)) else Right(mkeps(r2))
Chengsong
parents:
diff changeset
   331
  case SEQ(r1, r2) => Sequ(mkeps(r1), mkeps(r2))
Chengsong
parents:
diff changeset
   332
  case STAR(r) => Stars(Nil)
Chengsong
parents:
diff changeset
   333
  case RECD(x, r) => Rec(x, mkeps(r))
Chengsong
parents:
diff changeset
   334
  case NTIMES(n, r) => Ntime(List.fill(n)(mkeps(r)))
Chengsong
parents:
diff changeset
   335
  case OPTIONAL(r) => Optionall(Empty)
Chengsong
parents:
diff changeset
   336
  case NOT(rInner) => if(nullable(rInner)) throw new Exception("error")  
Chengsong
parents:
diff changeset
   337
                         else Nots("")//Nots(s.reverse.toString)
Chengsong
parents:
diff changeset
   338
//   case NOT(ZERO) => Empty
Chengsong
parents:
diff changeset
   339
//   case NOT(CHAR(c)) => Empty
Chengsong
parents:
diff changeset
   340
//   case NOT(SEQ(r1, r2)) => Sequ(mkeps(NOT(r1)), mkeps(NOT(r2)))
Chengsong
parents:
diff changeset
   341
//   case NOT(ALTS(r1, r2)) => if(!nullable(r1)) Left(mkeps(NOT(r1))) else Right(mkeps(NOT(r2)))
Chengsong
parents:
diff changeset
   342
//   case NOT(STAR(r)) => Stars(Nil) 
Chengsong
parents:
diff changeset
   343
Chengsong
parents:
diff changeset
   344
}
Chengsong
parents:
diff changeset
   345
Chengsong
parents:
diff changeset
   346
def inj(r: Rexp, c: Char, v: Val) : Val = (r, v) match {
Chengsong
parents:
diff changeset
   347
  case (STAR(r), Sequ(v1, Stars(vs))) => Stars(inj(r, c, v1)::vs)
Chengsong
parents:
diff changeset
   348
  case (SEQ(r1, r2), Sequ(v1, v2)) => Sequ(inj(r1, c, v1), v2)
Chengsong
parents:
diff changeset
   349
  case (SEQ(r1, r2), Left(Sequ(v1, v2))) => Sequ(inj(r1, c, v1), v2)
Chengsong
parents:
diff changeset
   350
  case (SEQ(r1, r2), Right(v2)) => Sequ(mkeps(r1), inj(r2, c, v2))
Chengsong
parents:
diff changeset
   351
  case (ALTS(r1, r2), Left(v1)) => Left(inj(r1, c, v1))
Chengsong
parents:
diff changeset
   352
  case (ALTS(r1, r2), Right(v2)) => Right(inj(r2, c, v2))
Chengsong
parents:
diff changeset
   353
  case (CHAR(d), Empty) => Chr(c) 
Chengsong
parents:
diff changeset
   354
  case (RECD(x, r1), _) => Rec(x, inj(r1, c, v))
Chengsong
parents:
diff changeset
   355
  case (NTIMES(n, r), Sequ(v1, Ntime(vs))) => Ntime(inj(r, c, v1)::vs)
Chengsong
parents:
diff changeset
   356
  case (OPTIONAL(r), v) => Optionall(inj(r, c, v))
Chengsong
parents:
diff changeset
   357
  case (NOT(r), Nots(s)) => Nots(c.toString ++ s)
Chengsong
parents:
diff changeset
   358
  case (ANYCHAR, Empty) => Chr(c)
Chengsong
parents:
diff changeset
   359
}
Chengsong
parents:
diff changeset
   360
Chengsong
parents:
diff changeset
   361
// some "rectification" functions for simplification
Chengsong
parents:
diff changeset
   362
Chengsong
parents:
diff changeset
   363
Chengsong
parents:
diff changeset
   364
Chengsong
parents:
diff changeset
   365
Chengsong
parents:
diff changeset
   366
// The Lexing Rules for the WHILE Language
Chengsong
parents:
diff changeset
   367
Chengsong
parents:
diff changeset
   368
  // bnullable function: tests whether the aregular 
Chengsong
parents:
diff changeset
   369
  // expression can recognise the empty string
Chengsong
parents:
diff changeset
   370
def bnullable (r: ARexp) : Boolean = r match {
Chengsong
parents:
diff changeset
   371
    case AZERO => false
Chengsong
parents:
diff changeset
   372
    case AONE(_) => true
Chengsong
parents:
diff changeset
   373
    case ACHAR(_,_) => false
Chengsong
parents:
diff changeset
   374
    case AALTS(_, rs) => rs.exists(bnullable)
Chengsong
parents:
diff changeset
   375
    case ASEQ(_, r1, r2) => bnullable(r1) && bnullable(r2)
Chengsong
parents:
diff changeset
   376
    case ASTAR(_, _) => true
Chengsong
parents:
diff changeset
   377
    case ANOT(_, rn) => !bnullable(rn)
Chengsong
parents:
diff changeset
   378
  }
Chengsong
parents:
diff changeset
   379
Chengsong
parents:
diff changeset
   380
def mkepsBC(r: ARexp) : Bits = r match {
Chengsong
parents:
diff changeset
   381
    case AONE(bs) => bs
Chengsong
parents:
diff changeset
   382
    case AALTS(bs, rs) => {
Chengsong
parents:
diff changeset
   383
      val n = rs.indexWhere(bnullable)
Chengsong
parents:
diff changeset
   384
      bs ++ mkepsBC(rs(n))
Chengsong
parents:
diff changeset
   385
    }
Chengsong
parents:
diff changeset
   386
    case ASEQ(bs, r1, r2) => bs ++ mkepsBC(r1) ++ mkepsBC(r2)
Chengsong
parents:
diff changeset
   387
    case ASTAR(bs, r) => bs ++ List(Z)
Chengsong
parents:
diff changeset
   388
    case ANOT(bs, rn) => bs
Chengsong
parents:
diff changeset
   389
  }
Chengsong
parents:
diff changeset
   390
Chengsong
parents:
diff changeset
   391
Chengsong
parents:
diff changeset
   392
def bder(c: Char, r: ARexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   393
    case AZERO => AZERO
Chengsong
parents:
diff changeset
   394
    case AONE(_) => AZERO
Chengsong
parents:
diff changeset
   395
    case ACHAR(bs, f) => if (c == f) AONE(bs) else AZERO
Chengsong
parents:
diff changeset
   396
    case AALTS(bs, rs) => AALTS(bs, rs.map(bder(c, _)))
Chengsong
parents:
diff changeset
   397
    case ASEQ(bs, r1, r2) => 
Chengsong
parents:
diff changeset
   398
      if (bnullable(r1)) AALTS(bs, ASEQ(Nil, bder(c, r1), r2) :: fuse(mkepsBC(r1), bder(c, r2)) :: Nil )
Chengsong
parents:
diff changeset
   399
      else ASEQ(bs, bder(c, r1), r2)
Chengsong
parents:
diff changeset
   400
    case ASTAR(bs, r) => ASEQ(bs, fuse(List(S), bder(c, r)), ASTAR(Nil, r))
Chengsong
parents:
diff changeset
   401
    case ANOT(bs, rn) => ANOT(bs, bder(c, rn))
Chengsong
parents:
diff changeset
   402
    case AANYCHAR(bs) => AONE(bs)
Chengsong
parents:
diff changeset
   403
  } 
Chengsong
parents:
diff changeset
   404
Chengsong
parents:
diff changeset
   405
def fuse(bs: Bits, r: ARexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   406
    case AZERO => AZERO
Chengsong
parents:
diff changeset
   407
    case AONE(cs) => AONE(bs ++ cs)
Chengsong
parents:
diff changeset
   408
    case ACHAR(cs, f) => ACHAR(bs ++ cs, f)
Chengsong
parents:
diff changeset
   409
    case AALTS(cs, rs) => AALTS(bs ++ cs, rs)
Chengsong
parents:
diff changeset
   410
    case ASEQ(cs, r1, r2) => ASEQ(bs ++ cs, r1, r2)
Chengsong
parents:
diff changeset
   411
    case ASTAR(cs, r) => ASTAR(bs ++ cs, r)
Chengsong
parents:
diff changeset
   412
    case ANOT(cs, r) => ANOT(bs ++ cs, r)
Chengsong
parents:
diff changeset
   413
  }
Chengsong
parents:
diff changeset
   414
Chengsong
parents:
diff changeset
   415
Chengsong
parents:
diff changeset
   416
def internalise(r: Rexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   417
    case ZERO => AZERO
Chengsong
parents:
diff changeset
   418
    case ONE => AONE(Nil)
Chengsong
parents:
diff changeset
   419
    case CHAR(c) => ACHAR(Nil, c)
Chengsong
parents:
diff changeset
   420
    //case PRED(f) => APRED(Nil, f)
Chengsong
parents:
diff changeset
   421
    case ALTS(r1, r2) => 
Chengsong
parents:
diff changeset
   422
      AALTS(Nil, List(fuse(List(Z), internalise(r1)), fuse(List(S), internalise(r2))))
Chengsong
parents:
diff changeset
   423
    // case ALTS(r1::rs) => {
Chengsong
parents:
diff changeset
   424
    //   val AALTS(Nil, rs2) = internalise(ALTS(rs))
Chengsong
parents:
diff changeset
   425
    //   AALTS(Nil, fuse(List(Z), internalise(r1)) :: rs2.map(fuse(List(S), _)))
Chengsong
parents:
diff changeset
   426
    // }
Chengsong
parents:
diff changeset
   427
    case SEQ(r1, r2) => ASEQ(Nil, internalise(r1), internalise(r2))
Chengsong
parents:
diff changeset
   428
    case STAR(r) => ASTAR(Nil, internalise(r))
Chengsong
parents:
diff changeset
   429
    case RECD(x, r) => internalise(r)
Chengsong
parents:
diff changeset
   430
    case NOT(r) => ANOT(Nil, internalise(r))
Chengsong
parents:
diff changeset
   431
    case ANYCHAR => AANYCHAR(Nil)
Chengsong
parents:
diff changeset
   432
  }
Chengsong
parents:
diff changeset
   433
Chengsong
parents:
diff changeset
   434
Chengsong
parents:
diff changeset
   435
def bsimp(r: ARexp): ARexp = 
Chengsong
parents:
diff changeset
   436
  {
Chengsong
parents:
diff changeset
   437
    r match {
Chengsong
parents:
diff changeset
   438
      case ASEQ(bs1, r1, r2) => (bsimp(r1), bsimp(r2)) match {
Chengsong
parents:
diff changeset
   439
          case (AZERO, _) => AZERO
Chengsong
parents:
diff changeset
   440
          case (_, AZERO) => AZERO
Chengsong
parents:
diff changeset
   441
          case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
Chengsong
parents:
diff changeset
   442
          case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
Chengsong
parents:
diff changeset
   443
      }
Chengsong
parents:
diff changeset
   444
      case AALTS(bs1, rs) => {
Chengsong
parents:
diff changeset
   445
            val rs_simp = rs.map(bsimp(_))
Chengsong
parents:
diff changeset
   446
            val flat_res = flats(rs_simp)
Chengsong
parents:
diff changeset
   447
            val dist_res = distinctBy(flat_res, erase)//strongDB(flat_res)//distinctBy(flat_res, erase)
Chengsong
parents:
diff changeset
   448
            dist_res match {
Chengsong
parents:
diff changeset
   449
              case Nil => AZERO
Chengsong
parents:
diff changeset
   450
              case s :: Nil => fuse(bs1, s)
Chengsong
parents:
diff changeset
   451
              case rs => AALTS(bs1, rs)  
Chengsong
parents:
diff changeset
   452
            }
Chengsong
parents:
diff changeset
   453
          
Chengsong
parents:
diff changeset
   454
      }
Chengsong
parents:
diff changeset
   455
      case r => r
Chengsong
parents:
diff changeset
   456
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   457
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   458
def strongBsimp(r: ARexp): ARexp =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   459
{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   460
  r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   461
    case ASEQ(bs1, r1, r2) => (strongBsimp(r1), strongBsimp(r2)) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   462
        case (AZERO, _) => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   463
        case (_, AZERO) => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   464
        case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   465
        case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
431
Chengsong
parents:
diff changeset
   466
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   467
    case AALTS(bs1, rs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   468
          val rs_simp = rs.map(strongBsimp(_))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   469
          val flat_res = flats(rs_simp)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   470
          val dist_res = distinctBy4(flat_res)//distinctBy(flat_res, erase)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   471
          dist_res match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   472
            case Nil => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   473
            case s :: Nil => fuse(bs1, s)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   474
            case rs => AALTS(bs1, rs)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   475
          }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   476
        
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   477
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   478
    case r => r
431
Chengsong
parents:
diff changeset
   479
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   480
}
431
Chengsong
parents:
diff changeset
   481
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   482
def strongBsimp5(r: ARexp): ARexp =
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   483
{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   484
  // println("was this called?")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   485
  r match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   486
    case ASEQ(bs1, r1, r2) => (strongBsimp5(r1), strongBsimp5(r2)) match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   487
        case (AZERO, _) => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   488
        case (_, AZERO) => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   489
        case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   490
        case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   491
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   492
    case AALTS(bs1, rs) => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   493
        // println("alts case")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   494
          val rs_simp = rs.map(strongBsimp5(_))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   495
          val flat_res = flats(rs_simp)
500
Chengsong
parents: 494
diff changeset
   496
          var dist_res = distinctBy5(flat_res)//distinctBy(flat_res, erase)
Chengsong
parents: 494
diff changeset
   497
          var dist2_res = distinctBy5(dist_res)
Chengsong
parents: 494
diff changeset
   498
          while(dist_res != dist2_res){
Chengsong
parents: 494
diff changeset
   499
            dist_res = dist2_res
Chengsong
parents: 494
diff changeset
   500
            dist2_res = distinctBy5(dist_res)
Chengsong
parents: 494
diff changeset
   501
          }
Chengsong
parents: 494
diff changeset
   502
          (dist2_res) match {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   503
            case Nil => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   504
            case s :: Nil => fuse(bs1, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   505
            case rs => AALTS(bs1, rs)  
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   506
          }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   507
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   508
    case r => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   509
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   510
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   511
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   512
def bders (s: List[Char], r: ARexp) : ARexp = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   513
  case Nil => r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   514
  case c::s => bders(s, bder(c, r))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   515
}
431
Chengsong
parents:
diff changeset
   516
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   517
def flats(rs: List[ARexp]): List[ARexp] = rs match {
431
Chengsong
parents:
diff changeset
   518
    case Nil => Nil
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   519
    case AZERO :: rs1 => flats(rs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   520
    case AALTS(bs, rs1) :: rs2 => rs1.map(fuse(bs, _)) ::: flats(rs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   521
    case r1 :: rs2 => r1 :: flats(rs2)
431
Chengsong
parents:
diff changeset
   522
  }
Chengsong
parents:
diff changeset
   523
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   524
def distinctBy[B, C](xs: List[B], f: B => C, acc: List[C] = Nil): List[B] = xs match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   525
  case Nil => Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   526
  case (x::xs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   527
    val res = f(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   528
    if (acc.contains(res)) distinctBy(xs, f, acc)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   529
    else x::distinctBy(xs, f, res::acc)
431
Chengsong
parents:
diff changeset
   530
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   531
} 
431
Chengsong
parents:
diff changeset
   532
Chengsong
parents:
diff changeset
   533
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   534
def pruneRexp(r: ARexp, allowableTerms: List[Rexp]) : ARexp = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   535
  r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   536
    case ASEQ(bs, r1, r2) => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   537
      val termsTruncated = allowableTerms.collect(rt => rt match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   538
        case SEQ(r1p, r2p) if(r2p == erase(r2)) => r1p//if(r2p == erase(r2)) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   539
      })
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   540
      val pruned : ARexp = pruneRexp(r1, termsTruncated)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   541
      pruned match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   542
        case AZERO => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   543
        case AONE(bs1) => fuse(bs ++ bs1, r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   544
        case pruned1 => ASEQ(bs, pruned1, r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   545
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   546
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   547
    case AALTS(bs, rs) => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   548
      //allowableTerms.foreach(a => println(shortRexpOutput(a)))        
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   549
      val rsp = rs.map(r => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   550
                    pruneRexp(r, allowableTerms)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   551
                  )
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   552
                  .filter(r => r != AZERO)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   553
      rsp match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   554
        case Nil => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   555
        case r1::Nil => fuse(bs, r1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   556
        case rs1 => AALTS(bs, rs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   557
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   558
    case r => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   559
      if(allowableTerms.contains(erase(r))) r else AZERO //assert(r != AZERO)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   560
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   561
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   562
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   563
def oneSimp(r: Rexp) : Rexp = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   564
  case SEQ(ONE, r) => r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   565
  case SEQ(r1, r2) => SEQ(oneSimp(r1), r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   566
  case r => r//assert r != 0 
432
994403dbbed5 strong!
Chengsong
parents: 431
diff changeset
   567
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   568
}
431
Chengsong
parents:
diff changeset
   569
Chengsong
parents:
diff changeset
   570
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   571
def distinctBy4(xs: List[ARexp], acc: List[Rexp] = Nil) : List[ARexp] = xs match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   572
  case Nil => Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   573
  case x :: xs =>
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   574
    //assert(acc.distinct == acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   575
    val erased = erase(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   576
    if(acc.contains(erased))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   577
      distinctBy4(xs, acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   578
    else{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   579
      val addToAcc =  breakIntoTerms(erased).filter(r => !acc.contains(oneSimp(r)))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   580
      //val xp = pruneRexp(x, addToAcc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   581
      pruneRexp(x, addToAcc) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   582
        case AZERO => distinctBy4(xs, addToAcc.map(oneSimp(_)) ::: acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   583
        case xPrime => xPrime :: distinctBy4(xs, addToAcc.map(oneSimp(_)) ::: acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   584
      }
431
Chengsong
parents:
diff changeset
   585
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   586
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   587
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   588
// fun pAKC_aux :: "arexp list ⇒ arexp ⇒ rexp ⇒ arexp"
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   589
//   where
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   590
// "pAKC_aux rsa r ctx = (if (L (SEQ (erase r) ( ctx) )) ⊆ (L (erase (AALTs [] rsa))) then AZERO else
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   591
//                           case r of (ASEQ bs r1 r2) ⇒ 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   592
//                             bsimp_ASEQ bs (pAKC_aux rsa r1 (SEQ  (erase r2) ( ctx) )) r2   |
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   593
//                                     (AALTs bs rs) ⇒ 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   594
//                             bsimp_AALTs bs (flts (map (λr. pAKC_aux rsa r ( ctx) ) rs) )    |
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   595
//                                     r             ⇒ r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   596
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   597
// def canonicalSeq(rs: List[Rexp], acc: Rexp) = rs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   598
//   case r::Nil => SEQ(r, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   599
//   case Nil => acc
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   600
//   case r1::r2::Nil => SEQ(SEQ(r1, r2), acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   601
// }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   602
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   603
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   604
//the "fake" Language interpretation: just concatenates!
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   605
def L(acc: Rexp, rs: List[Rexp]) : Rexp = rs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   606
  case Nil => acc
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   607
  case r :: rs1 => 
500
Chengsong
parents: 494
diff changeset
   608
    // if(acc == ONE) 
Chengsong
parents: 494
diff changeset
   609
    //   L(r, rs1) 
Chengsong
parents: 494
diff changeset
   610
    // else
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   611
      L(SEQ(acc, r), rs1)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   612
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   613
500
Chengsong
parents: 494
diff changeset
   614
def rprint(r: Rexp) : Unit = println(shortRexpOutput(r))
Chengsong
parents: 494
diff changeset
   615
def rsprint(rs: List[Rexp]) = rs.foreach(r => println(shortRexpOutput(r)))
Chengsong
parents: 494
diff changeset
   616
def aprint(a: ARexp) = println(shortRexpOutput(erase(a)))
Chengsong
parents: 494
diff changeset
   617
def asprint(as: List[ARexp]) = as.foreach(a => println(shortRexpOutput(erase(a))))
Chengsong
parents: 494
diff changeset
   618
Chengsong
parents: 494
diff changeset
   619
def pAKC(acc: List[Rexp], r: ARexp, ctx: List[Rexp]) : ARexp = {
Chengsong
parents: 494
diff changeset
   620
  // println("pakc")
Chengsong
parents: 494
diff changeset
   621
  // println(shortRexpOutput(erase(r)))
Chengsong
parents: 494
diff changeset
   622
  // println("acc")
Chengsong
parents: 494
diff changeset
   623
  // rsprint(acc)
Chengsong
parents: 494
diff changeset
   624
  // println("ctx---------")
Chengsong
parents: 494
diff changeset
   625
  // rsprint(ctx)
Chengsong
parents: 494
diff changeset
   626
  // println("ctx---------end")
Chengsong
parents: 494
diff changeset
   627
  // rsprint(breakIntoTerms(L(erase(r), ctx)).map(oneSimp))
Chengsong
parents: 494
diff changeset
   628
Chengsong
parents: 494
diff changeset
   629
  if (breakIntoTerms(L(erase(r), ctx)).map(oneSimp).forall(acc.contains)) {//acc.flatMap(breakIntoTerms
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   630
    AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   631
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   632
  else{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   633
    r match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   634
      case ASEQ(bs, r1, r2) => 
500
Chengsong
parents: 494
diff changeset
   635
      (pAKC(acc, r1, erase(r2) :: ctx)) match{
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   636
        case AZERO => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   637
          AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   638
        case AONE(bs1) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   639
          fuse(bs1, r2)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   640
        case r1p => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   641
          ASEQ(bs, r1p, r2)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   642
      }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   643
      case AALTS(bs, rs0) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   644
        // println("before pruning")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   645
        // println(s"ctx is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   646
        // ctx.foreach(r => println(shortRexpOutput(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   647
        // println(s"rs0 is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   648
        // rs0.foreach(r => println(shortRexpOutput(erase(r))))
500
Chengsong
parents: 494
diff changeset
   649
        // println(s"acc is ")
Chengsong
parents: 494
diff changeset
   650
        // acc.foreach(r => println(shortRexpOutput(r)))
Chengsong
parents: 494
diff changeset
   651
        rs0.map(r => pAKC(acc, r, ctx)).filter(_ != AZERO) match {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   652
          case Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   653
            // println("after pruning Nil")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   654
            AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   655
          case r :: Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   656
            // println("after pruning singleton")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   657
            // println(shortRexpOutput(erase(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   658
            r 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   659
          case rs0p => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   660
          // println("after pruning non-singleton")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   661
            AALTS(bs, rs0p)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   662
        }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   663
      case r => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   664
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   665
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   666
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   667
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   668
def distinctBy5(xs: List[ARexp], acc: List[Rexp] = Nil) : List[ARexp] = xs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   669
  case Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   670
    Nil
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   671
  case x :: xs => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   672
    val erased = erase(x)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   673
    if(acc.contains(erased)){
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   674
      distinctBy5(xs, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   675
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   676
    else{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   677
      val pruned = pAKC(acc, x, Nil)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   678
      val newTerms = breakIntoTerms(erase(pruned))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   679
      pruned match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   680
        case AZERO => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   681
          distinctBy5(xs, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   682
        case xPrime => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   683
          xPrime :: distinctBy5(xs, newTerms.map(oneSimp) ::: acc)//distinctBy5(xs, addToAcc.map(oneSimp(_)) ::: acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   684
      }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   685
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   686
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   687
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   688
431
Chengsong
parents:
diff changeset
   689
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   690
def breakIntoTerms(r: Rexp) : List[Rexp] = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   691
  case SEQ(r1, r2)  => breakIntoTerms(r1).map(r11 => SEQ(r11, r2))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   692
  case ALTS(r1, r2) => breakIntoTerms(r1) ::: breakIntoTerms(r2)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   693
  case ZERO => Nil
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   694
  case _ => r::Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   695
}
431
Chengsong
parents:
diff changeset
   696
Chengsong
parents:
diff changeset
   697
Chengsong
parents:
diff changeset
   698
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   699
def decode_aux(r: Rexp, bs: Bits) : (Val, Bits) = (r, bs) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   700
  case (ONE, bs) => (Empty, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   701
  case (CHAR(f), bs) => (Chr(f), bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   702
  case (ALTS(r1, r2), Z::bs1) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   703
      val (v, bs2) = decode_aux(r1, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   704
      (Left(v), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   705
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   706
  case (ALTS(r1, r2), S::bs1) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   707
      val (v, bs2) = decode_aux(r2, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   708
      (Right(v), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   709
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   710
  case (SEQ(r1, r2), bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   711
    val (v1, bs1) = decode_aux(r1, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   712
    val (v2, bs2) = decode_aux(r2, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   713
    (Sequ(v1, v2), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   714
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   715
  case (STAR(r1), S::bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   716
    val (v, bs1) = decode_aux(r1, bs)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   717
    //(v)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   718
    val (Stars(vs), bs2) = decode_aux(STAR(r1), bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   719
    (Stars(v::vs), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   720
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   721
  case (STAR(_), Z::bs) => (Stars(Nil), bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   722
  case (RECD(x, r1), bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   723
    val (v, bs1) = decode_aux(r1, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   724
    (Rec(x, v), bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   725
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   726
  case (NOT(r), bs) => (Nots(r.toString), bs)
431
Chengsong
parents:
diff changeset
   727
}
Chengsong
parents:
diff changeset
   728
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   729
def decode(r: Rexp, bs: Bits) = decode_aux(r, bs) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   730
  case (v, Nil) => v
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   731
  case _ => throw new Exception("Not decodable")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   732
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   733
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   734
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   735
431
Chengsong
parents:
diff changeset
   736
def blexing_simp(r: Rexp, s: String) : Val = {
Chengsong
parents:
diff changeset
   737
    val bit_code = blex_simp(internalise(r), s.toList)
Chengsong
parents:
diff changeset
   738
    decode(r, bit_code)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   739
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   740
def simpBlexer(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   741
  Try(blexing_simp(r, s)).getOrElse(Failure)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   742
}
431
Chengsong
parents:
diff changeset
   743
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   744
def strong_blexing_simp(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   745
  decode(r, strong_blex_simp(internalise(r), s.toList))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   746
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   747
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   748
def strong_blexing_simp5(r: Rexp, s: String) : Val = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   749
  decode(r, strong_blex_simp5(internalise(r), s.toList))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   750
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   751
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   752
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   753
def strongBlexer(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   754
  Try(strong_blexing_simp(r, s)).getOrElse(Failure)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   755
}
431
Chengsong
parents:
diff changeset
   756
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   757
def strongBlexer5(r: Rexp, s: String): Val = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   758
  Try(strong_blexing_simp5(r, s)).getOrElse(Failure)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   759
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   760
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   761
def strong_blex_simp(r: ARexp, s: List[Char]) : Bits = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   762
  case Nil => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   763
    if (bnullable(r)) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   764
      //println(asize(r))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   765
      val bits = mkepsBC(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   766
      bits
431
Chengsong
parents:
diff changeset
   767
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   768
    else 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   769
      throw new Exception("Not matched")
431
Chengsong
parents:
diff changeset
   770
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   771
  case c::cs => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   772
    val der_res = bder(c,r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   773
    val simp_res = strongBsimp(der_res)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   774
    strong_blex_simp(simp_res, cs)      
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   775
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   776
}
431
Chengsong
parents:
diff changeset
   777
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   778
def strong_blex_simp5(r: ARexp, s: List[Char]) : Bits = s match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   779
  case Nil => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   780
    if (bnullable(r)) {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   781
      //println(asize(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   782
      val bits = mkepsBC(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   783
      bits
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   784
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   785
    else 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   786
      throw new Exception("Not matched")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   787
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   788
  case c::cs => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   789
    val der_res = bder(c,r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   790
    val simp_res = strongBsimp5(der_res)  
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   791
    strong_blex_simp5(simp_res, cs)      
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   792
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   793
}
431
Chengsong
parents:
diff changeset
   794
Chengsong
parents:
diff changeset
   795
Chengsong
parents:
diff changeset
   796
  def bders_simp(s: List[Char], r: ARexp) : ARexp = s match {
Chengsong
parents:
diff changeset
   797
    case Nil => r
435
Chengsong
parents: 432
diff changeset
   798
    case c::s => 
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   799
      //println(erase(r))
435
Chengsong
parents: 432
diff changeset
   800
      bders_simp(s, bsimp(bder(c, r)))
431
Chengsong
parents:
diff changeset
   801
  }
Chengsong
parents:
diff changeset
   802
  
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   803
  def bdersStrong5(s: List[Char], r: ARexp) : ARexp = s match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   804
    case Nil => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   805
    case c::s => bdersStrong5(s, strongBsimp5(bder(c, r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   806
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   807
431
Chengsong
parents:
diff changeset
   808
  def bdersSimp(s: String, r: Rexp) : ARexp = bders_simp(s.toList, internalise(r))
Chengsong
parents:
diff changeset
   809
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   810
  def bdersStrong(s: List[Char], r: ARexp) : ARexp = s match {
431
Chengsong
parents:
diff changeset
   811
    case Nil => r 
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   812
    case c::s => bdersStrong(s, strongBsimp(bder(c, r)))
431
Chengsong
parents:
diff changeset
   813
  }
Chengsong
parents:
diff changeset
   814
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   815
  def bdersStrongRexp(s: String, r: Rexp) : ARexp = bdersStrong(s.toList, internalise(r))
431
Chengsong
parents:
diff changeset
   816
Chengsong
parents:
diff changeset
   817
  def erase(r:ARexp): Rexp = r match{
Chengsong
parents:
diff changeset
   818
    case AZERO => ZERO
Chengsong
parents:
diff changeset
   819
    case AONE(_) => ONE
Chengsong
parents:
diff changeset
   820
    case ACHAR(bs, c) => CHAR(c)
Chengsong
parents:
diff changeset
   821
    case AALTS(bs, Nil) => ZERO
Chengsong
parents:
diff changeset
   822
    case AALTS(bs, a::Nil) => erase(a)
Chengsong
parents:
diff changeset
   823
    case AALTS(bs, a::as) => ALTS(erase(a), erase(AALTS(bs, as)))
Chengsong
parents:
diff changeset
   824
    case ASEQ(bs, r1, r2) => SEQ (erase(r1), erase(r2))
Chengsong
parents:
diff changeset
   825
    case ASTAR(cs, r)=> STAR(erase(r))
Chengsong
parents:
diff changeset
   826
    case ANOT(bs, r) => NOT(erase(r))
Chengsong
parents:
diff changeset
   827
    case AANYCHAR(bs) => ANYCHAR
Chengsong
parents:
diff changeset
   828
  }
Chengsong
parents:
diff changeset
   829
Chengsong
parents:
diff changeset
   830
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   831
  def allCharSeq(r: Rexp) : Boolean = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   832
    case CHAR(c) => true
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   833
    case SEQ(r1, r2) => allCharSeq(r1) && allCharSeq(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   834
    case _ => false
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   835
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   836
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   837
  def flattenSeq(r: Rexp) : String = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   838
    case CHAR(c) => c.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   839
    case SEQ(r1, r2) => flattenSeq(r1) ++ flattenSeq(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   840
    case _ => throw new Error("flatten unflattenable rexp")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   841
  } 
431
Chengsong
parents:
diff changeset
   842
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   843
  def shortRexpOutput(r: Rexp) : String = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   844
      case CHAR(c) => c.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   845
      case ONE => "1"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   846
      case ZERO => "0"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   847
      case SEQ(r1, r2) if(allCharSeq(r)) => flattenSeq(r)//"[" ++ shortRexpOutput(r1) ++ "~" ++ shortRexpOutput(r2) ++ "]"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   848
      case SEQ(r1, r2) => "[" ++ shortRexpOutput(r1) ++ "~" ++ shortRexpOutput(r2) ++ "]"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   849
      case ALTS(r1, r2) => "(" ++ shortRexpOutput(r1) ++ "+" ++ shortRexpOutput(r2) ++ ")"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   850
      case STAR(STAR(r)) => "(..)*"// ++ shortRexpOutput(r) ++ "]*"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   851
      case STAR(r) => "STAR(" ++ shortRexpOutput(r) ++ ")"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   852
      //case RTOP => "RTOP"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   853
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   854
431
Chengsong
parents:
diff changeset
   855
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   856
  def blex_simp(r: ARexp, s: List[Char]) : Bits = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   857
      case Nil => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   858
        if (bnullable(r)) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   859
          val bits = mkepsBC(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   860
          bits
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   861
        }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   862
        else 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   863
          throw new Exception("Not matched")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   864
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   865
      case c::cs => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   866
        val der_res = bder(c,r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   867
        val simp_res = bsimp(der_res)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   868
        blex_simp(simp_res, cs)      
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   869
      }
431
Chengsong
parents:
diff changeset
   870
  }
Chengsong
parents:
diff changeset
   871
Chengsong
parents:
diff changeset
   872
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   873
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   874
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   875
    def size(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   876
      case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   877
      case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   878
      case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   879
      case ANYCHAR => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   880
      case NOT(r0) => 1 + size(r0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   881
      case SEQ(r1, r2) => 1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   882
      case ALTS(r1, r2) => 1 + List(r1, r2).map(size).sum
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   883
      case STAR(r) => 1 + size(r)
431
Chengsong
parents:
diff changeset
   884
    }
Chengsong
parents:
diff changeset
   885
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   886
    def asize(a: ARexp) = size(erase(a))
431
Chengsong
parents:
diff changeset
   887
Chengsong
parents:
diff changeset
   888
//pder related
Chengsong
parents:
diff changeset
   889
type Mon = (Char, Rexp)
Chengsong
parents:
diff changeset
   890
type Lin = Set[Mon]
Chengsong
parents:
diff changeset
   891
Chengsong
parents:
diff changeset
   892
def dot_prod(rs: Set[Rexp], r: Rexp): Set[Rexp] = r match {
Chengsong
parents:
diff changeset
   893
    case ZERO => Set()
Chengsong
parents:
diff changeset
   894
    case ONE => rs
Chengsong
parents:
diff changeset
   895
    case r => rs.map((re) => if (re == ONE) r else SEQ(re, r)  )   
Chengsong
parents:
diff changeset
   896
  }
Chengsong
parents:
diff changeset
   897
  def cir_prod(l: Lin, t: Rexp): Lin = t match {//remember this Lin is different from the Lin in Antimirov's paper. Here it does not mean the set of all subsets of linear forms that does not contain zero, but rather the type a set of linear forms
Chengsong
parents:
diff changeset
   898
    case ZERO => Set()
Chengsong
parents:
diff changeset
   899
    case ONE => l
Chengsong
parents:
diff changeset
   900
    case t => l.map( m => m._2 match {case ZERO => m case ONE => (m._1, t) case p => (m._1, SEQ(p, t)) }  )
Chengsong
parents:
diff changeset
   901
  }
Chengsong
parents:
diff changeset
   902
  def lf(r: Rexp): Lin = r match {
Chengsong
parents:
diff changeset
   903
    case ZERO => Set()
Chengsong
parents:
diff changeset
   904
    case ONE => Set()
Chengsong
parents:
diff changeset
   905
    case CHAR(f) => {
Chengsong
parents:
diff changeset
   906
      //val Some(c) = alphabet.find(f) 
Chengsong
parents:
diff changeset
   907
      Set((f, ONE))
Chengsong
parents:
diff changeset
   908
    }
Chengsong
parents:
diff changeset
   909
    case ALTS(r1, r2) => {
Chengsong
parents:
diff changeset
   910
      lf(r1 ) ++ lf(r2)
Chengsong
parents:
diff changeset
   911
    }
Chengsong
parents:
diff changeset
   912
    case STAR(r1) => cir_prod(lf(r1), STAR(r1)) //may try infix notation later......
Chengsong
parents:
diff changeset
   913
    case SEQ(r1, r2) =>{
Chengsong
parents:
diff changeset
   914
      if (nullable(r1))
Chengsong
parents:
diff changeset
   915
        cir_prod(lf(r1), r2) ++ lf(r2)
Chengsong
parents:
diff changeset
   916
      else
Chengsong
parents:
diff changeset
   917
        cir_prod(lf(r1), r2) 
Chengsong
parents:
diff changeset
   918
    }
Chengsong
parents:
diff changeset
   919
  }
Chengsong
parents:
diff changeset
   920
  def lfs(r: Set[Rexp]): Lin = {
Chengsong
parents:
diff changeset
   921
    r.foldLeft(Set[Mon]())((acc, r) => acc ++ lf(r))
Chengsong
parents:
diff changeset
   922
  }
Chengsong
parents:
diff changeset
   923
Chengsong
parents:
diff changeset
   924
  def pder(x: Char, t: Rexp): Set[Rexp] = {
Chengsong
parents:
diff changeset
   925
    val lft = lf(t)
Chengsong
parents:
diff changeset
   926
    (lft.filter(mon => if(mon._1 == x) true else false)).map(mon => mon._2)
Chengsong
parents:
diff changeset
   927
  }
Chengsong
parents:
diff changeset
   928
  def pders_single(s: List[Char], t: Rexp) : Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   929
    case x::xs => pders(xs, pder(x, t))
Chengsong
parents:
diff changeset
   930
    case Nil => Set(t)
Chengsong
parents:
diff changeset
   931
  }
Chengsong
parents:
diff changeset
   932
  def pders(s: List[Char], ts: Set[Rexp]) : Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   933
    case x::xs => pders(xs, ts.foldLeft(Set[Rexp]())((acc, t) => acc ++ pder(x, t)))
Chengsong
parents:
diff changeset
   934
    case Nil => ts 
Chengsong
parents:
diff changeset
   935
  }
Chengsong
parents:
diff changeset
   936
  def pderss(ss: List[List[Char]], t: Rexp): Set[Rexp] = ss.foldLeft( Set[Rexp]() )( (acc, s) => pders_single(s, t) ++ acc )
Chengsong
parents:
diff changeset
   937
  def pdera(t: Rexp): Set[Rexp] = lf(t).map(mon => mon._2)
Chengsong
parents:
diff changeset
   938
  //all implementation of partial derivatives that involve set union are potentially buggy
Chengsong
parents:
diff changeset
   939
  //because they don't include the original regular term before they are pdered.
Chengsong
parents:
diff changeset
   940
  //now only pderas is fixed.
Chengsong
parents:
diff changeset
   941
  def pderas(t: Set[Rexp], d: Int): Set[Rexp] = if(d > 0) pderas(lfs(t).map(mon => mon._2), d - 1) ++ t else lfs(t).map(mon => mon._2) ++ t//repeated application of pderas over the newest set of pders.
Chengsong
parents:
diff changeset
   942
  def pderUNIV(r: Rexp) : Set[Rexp] = pderas(Set(r), awidth(r) + 1)
Chengsong
parents:
diff changeset
   943
  def awidth(r: Rexp) : Int = r match {
Chengsong
parents:
diff changeset
   944
    case CHAR(c) => 1
Chengsong
parents:
diff changeset
   945
    case SEQ(r1, r2) => awidth(r1) + awidth(r2)
Chengsong
parents:
diff changeset
   946
    case ALTS(r1, r2) => awidth(r1) + awidth(r2)
Chengsong
parents:
diff changeset
   947
    case ONE => 0
Chengsong
parents:
diff changeset
   948
    case ZERO => 0
Chengsong
parents:
diff changeset
   949
    case STAR(r) => awidth(r)
Chengsong
parents:
diff changeset
   950
  }
Chengsong
parents:
diff changeset
   951
  //def sigma_lf(l: Set[Mon]) : Rexp = ALTS(l.map(mon => SEQ(CHAR(mon._1),mon._2)).toList)
Chengsong
parents:
diff changeset
   952
  //def sigma(rs: Set[Rexp]) : Rexp = ALTS(rs.toList)
Chengsong
parents:
diff changeset
   953
  def o(r: Rexp) = if (nullable(r)) ONE else ZERO
Chengsong
parents:
diff changeset
   954
  //def nlf(t: Rexp) : Rexp = ALTS(List( o(t), sigma_lf(lf(t)) ))
Chengsong
parents:
diff changeset
   955
  def pdp(x: Char, r: Rexp) : Set[Rexp] = r match {
Chengsong
parents:
diff changeset
   956
    case ZERO => Set[Rexp]()
Chengsong
parents:
diff changeset
   957
    case ONE => Set[Rexp]()
Chengsong
parents:
diff changeset
   958
    case CHAR(f) => if(x == f) Set(ONE) else Set[Rexp]()
Chengsong
parents:
diff changeset
   959
    case ALTS(r1, r2) => pdp(x, r1) ++ pdp(x, r2)
Chengsong
parents:
diff changeset
   960
    case STAR(r1) => pdp(x, r).map(a => SEQ(a, STAR(r1)))
Chengsong
parents:
diff changeset
   961
    case SEQ(a0, b) => if(nullable(a0)) pdp(x, a0).map(a => SEQ(a, b)) ++ pdp(x, b) else pdp(x, a0).map(a => SEQ(a, b))
Chengsong
parents:
diff changeset
   962
  }
Chengsong
parents:
diff changeset
   963
  def pdps(s: List[Char], ts: Set[Rexp]): Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   964
    case x::xs => pdps(xs, ts.foldLeft(Set[Rexp]())((acc, t) => acc ++ pder(x, t)))
Chengsong
parents:
diff changeset
   965
    case Nil => ts   
Chengsong
parents:
diff changeset
   966
  }
Chengsong
parents:
diff changeset
   967
  def pdpss(ss: List[List[Char]], t: Rexp): Set[Rexp] = ss.foldLeft( Set[Rexp]())((acc, s) => pdps(s, Set(t)) ++ acc)
Chengsong
parents:
diff changeset
   968
Chengsong
parents:
diff changeset
   969
Chengsong
parents:
diff changeset
   970
Chengsong
parents:
diff changeset
   971
def starPrint(r: Rexp) : Unit = r match {
Chengsong
parents:
diff changeset
   972
        
Chengsong
parents:
diff changeset
   973
          case SEQ(head, rstar) =>
Chengsong
parents:
diff changeset
   974
            println(shortRexpOutput(head) ++ "~STARREG")
Chengsong
parents:
diff changeset
   975
          case STAR(rstar) =>
Chengsong
parents:
diff changeset
   976
            println("STARREG")
Chengsong
parents:
diff changeset
   977
          case ALTS(r1, r2) =>  
Chengsong
parents:
diff changeset
   978
            println("(")
Chengsong
parents:
diff changeset
   979
            starPrint(r1)
Chengsong
parents:
diff changeset
   980
            println("+")
Chengsong
parents:
diff changeset
   981
            starPrint(r2)
Chengsong
parents:
diff changeset
   982
            println(")")
Chengsong
parents:
diff changeset
   983
          case ZERO => println("0")
Chengsong
parents:
diff changeset
   984
        
Chengsong
parents:
diff changeset
   985
      }
Chengsong
parents:
diff changeset
   986
Chengsong
parents:
diff changeset
   987
// @arg(doc = "small tests")
Chengsong
parents:
diff changeset
   988
val STARREG = //((( (STAR("aa")) | STAR("aaa") ).%).%)
Chengsong
parents:
diff changeset
   989
(((STAR("a") | ( STAR("aaa")) | STAR("aaaaa"| ( STAR("aaaaaaa")) | STAR("aaaaaaaaaaa"))).%).%).%
Chengsong
parents:
diff changeset
   990
Chengsong
parents:
diff changeset
   991
// @main
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   992
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   993
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   994
431
Chengsong
parents:
diff changeset
   995
def small() = {
Chengsong
parents:
diff changeset
   996
Chengsong
parents:
diff changeset
   997
Chengsong
parents:
diff changeset
   998
//   println(lexing_simp(NOTREG, prog0))
Chengsong
parents:
diff changeset
   999
//   val v = lex_simp(NOTREG, prog0.toList)
Chengsong
parents:
diff changeset
  1000
//   println(v)
Chengsong
parents:
diff changeset
  1001
Chengsong
parents:
diff changeset
  1002
//   val d =  (lex_simp(NOTREG, prog0.toList))
Chengsong
parents:
diff changeset
  1003
//   println(d)
Chengsong
parents:
diff changeset
  1004
  val pderSTAR = pderUNIV(STARREG)
Chengsong
parents:
diff changeset
  1005
Chengsong
parents:
diff changeset
  1006
  val refSize = pderSTAR.map(size(_)).sum
435
Chengsong
parents: 432
diff changeset
  1007
  // println("different partial derivative terms:")
Chengsong
parents: 432
diff changeset
  1008
  // pderSTAR.foreach(r => r match {
431
Chengsong
parents:
diff changeset
  1009
      
435
Chengsong
parents: 432
diff changeset
  1010
  //       case SEQ(head, rstar) =>
Chengsong
parents: 432
diff changeset
  1011
  //         println(shortRexpOutput(head) ++ "~STARREG")
Chengsong
parents: 432
diff changeset
  1012
  //       case STAR(rstar) =>
Chengsong
parents: 432
diff changeset
  1013
  //         println("STARREG")
431
Chengsong
parents:
diff changeset
  1014
      
435
Chengsong
parents: 432
diff changeset
  1015
  //   }
Chengsong
parents: 432
diff changeset
  1016
  //   )
Chengsong
parents: 432
diff changeset
  1017
  // println("the total number of terms is")
Chengsong
parents: 432
diff changeset
  1018
  // //println(refSize)
Chengsong
parents: 432
diff changeset
  1019
  // println(pderSTAR.size)
431
Chengsong
parents:
diff changeset
  1020
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1021
  // val A : Rexp= ("c" | (ONE | "b") ~ "d") ~((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1022
  // val B : Rexp = ((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1023
  // val C : Rexp = ("d") ~ ((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1024
  // val PRUNE_REG : Rexp = (C | B | A)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1025
  // val APRUNE_REG = internalise(PRUNE_REG)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1026
  // val program_solution = pruneRexp(APRUNE_REG, breakIntoTerms(PRUNE_REG))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1027
  // println("program executes and gives: as disired!")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1028
  // println(shortRexpOutput(erase(program_solution)))
435
Chengsong
parents: 432
diff changeset
  1029
  // val simpedPruneReg = strongBsimp(APRUNE_REG)
Chengsong
parents: 432
diff changeset
  1030
Chengsong
parents: 432
diff changeset
  1031
  // println(shortRexpOutput(erase(simpedPruneReg)))
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1032
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1033
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1034
  for(i <- List(1,2,3,4,10, 100, 400, 841, 900 ) ){// 100, 400, 800, 840, 841, 900
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1035
    val prog0 = "a" * i
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1036
    //println(s"test: $prog0")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1037
    println(s"testing with $i a's" )
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1038
    //val bd = bdersSimp(prog0, STARREG)//DB
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1039
    val sbd = bdersStrongRexp(prog0, STARREG)//strongDB
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1040
    starPrint(erase(sbd))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1041
    val subTerms = breakIntoTerms(erase(sbd))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1042
    //val subTermsLarge = breakIntoTerms(erase(bd))
431
Chengsong
parents:
diff changeset
  1043
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1044
    println(s"subterms of regex with strongDB: ${subTerms.length}")//, standard DB: ${subTermsLarge.length}")
431
Chengsong
parents:
diff changeset
  1045
Chengsong
parents:
diff changeset
  1046
Chengsong
parents:
diff changeset
  1047
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1048
    println("the number of distinct subterms for bsimp with strongDB")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1049
    println(subTerms.distinct.size)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1050
    //println(subTermsLarge.distinct.size)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1051
    if(pderSTAR.size > subTerms.length)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1052
      println(s"which is less than or equal to the number of PDER terms: ${pderSTAR.size}")
431
Chengsong
parents:
diff changeset
  1053
Chengsong
parents:
diff changeset
  1054
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1055
    // println(shortRexpOutput(erase(sbd)))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1056
    // println(shortRexpOutput(erase(bd)))
431
Chengsong
parents:
diff changeset
  1057
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1058
    println("pdersize, original, strongSimp")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1059
    println(refSize, size(STARREG),  asize(sbd))
431
Chengsong
parents:
diff changeset
  1060
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1061
    //val vres = strong_blexing_simp( STARREG, prog0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1062
    //println(vres)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1063
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1064
  // println(vs.length)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1065
  // println(vs)
431
Chengsong
parents:
diff changeset
  1066
   
Chengsong
parents:
diff changeset
  1067
Chengsong
parents:
diff changeset
  1068
  // val prog1 = """read  n; write n"""  
Chengsong
parents:
diff changeset
  1069
  // println(s"test: $prog1")
Chengsong
parents:
diff changeset
  1070
  // println(lexing_simp(WHILE_REGS, prog1))
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1071
  // val display = ("a"| "ab").%
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1072
  // val adisplay = internalise(display)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1073
  // bders_simp( "aaaaa".toList, adisplay)
431
Chengsong
parents:
diff changeset
  1074
}
Chengsong
parents:
diff changeset
  1075
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1076
def generator_test() {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1077
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1078
  // test(rexp(7), 1000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1079
  //   val ss = stringsFromRexp(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1080
  //   val boolList = ss.map(s => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1081
  //     val simpVal = simpBlexer(r, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1082
  //     val strongVal = strongBlexer(r, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1083
  //     // println(simpVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1084
  //     // println(strongVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1085
  //     (simpVal == strongVal) && (simpVal != None) 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1086
  //   })
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1087
  //   !boolList.exists(b => b == false)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1088
  // }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1089
  // test(single(STAR(ALTS(STAR(CHAR('c')),ALTS(CHAR('c'),ZERO)))), 100000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1090
  //   val ss = stringsFromRexp(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1091
  //   val boolList = ss.map(s => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1092
  //     val bdStrong = bdersStrong(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1093
  //     val bdStrong5 = bdersStrong5(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1094
  //     // println(shortRexpOutput(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1095
  //     // println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1096
  //     // println(strongVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1097
  //     // println(strongVal5)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1098
  //     // (strongVal == strongVal5) 
493
Chengsong
parents: 492
diff changeset
  1099
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1100
  //     if(asize(bdStrong5) > asize(bdStrong)){
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1101
  //       println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1102
  //       println(shortRexpOutput(erase(bdStrong5)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1103
  //       println(shortRexpOutput(erase(bdStrong)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1104
  //     }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1105
  //     asize(bdStrong5) <= asize(bdStrong)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1106
  //   })
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1107
  //   !boolList.exists(b => b == false)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1108
  // }
500
Chengsong
parents: 494
diff changeset
  1109
  //*** example where bdStrong5 has a smaller size than bdStrong
Chengsong
parents: 494
diff changeset
  1110
  // test(single(STAR(SEQ(ALTS(SEQ(STAR(CHAR('a')),ALTS(ALTS(ONE,ZERO),SEQ(ONE,ONE))),CHAR('a')),ONE))), 1) { (r: Rexp) => 
Chengsong
parents: 494
diff changeset
  1111
  //*** depth 5 example bdStrong5 larger size than bdStrong
Chengsong
parents: 494
diff changeset
  1112
  // test(single(STAR(SEQ(SEQ(ALTS(CHAR('b'),STAR(CHAR('b'))),CHAR('b')),(ALTS(STAR(CHAR('c')), ONE))))), 1) {(r: Rexp) =>
Chengsong
parents: 494
diff changeset
  1113
 
Chengsong
parents: 494
diff changeset
  1114
 
Chengsong
parents: 494
diff changeset
  1115
 
Chengsong
parents: 494
diff changeset
  1116
  //sanity check from Christian's request
Chengsong
parents: 494
diff changeset
  1117
  // val r = ("a" | "ab") ~ ("bc" | "c")
Chengsong
parents: 494
diff changeset
  1118
  // val a = internalise(r)
Chengsong
parents: 494
diff changeset
  1119
  // val aval = blexing_simp(r, "abc")
Chengsong
parents: 494
diff changeset
  1120
  // println(aval)
Chengsong
parents: 494
diff changeset
  1121
Chengsong
parents: 494
diff changeset
  1122
  //sample counterexample:(depth 7)
Chengsong
parents: 494
diff changeset
  1123
  //STAR(SEQ(ALTS(STAR(STAR(STAR(STAR(CHAR(c))))),ALTS(CHAR(c),CHAR(b))),ALTS(ZERO,SEQ(ALTS(ALTS(STAR(CHAR(c)),SEQ(CHAR(b),CHAR(a))),CHAR(c)),STAR(ALTS(ALTS(ONE,CHAR(a)),STAR(CHAR(c))))))))
Chengsong
parents: 494
diff changeset
  1124
  //(depth5)
Chengsong
parents: 494
diff changeset
  1125
  //STAR(SEQ(ALTS(ALTS(STAR(CHAR(b)),SEQ(ONE,CHAR(b))),SEQ(STAR(CHAR(a)),CHAR(b))),ALTS(ZERO,ALTS(STAR(CHAR(b)),STAR(CHAR(a))))))
Chengsong
parents: 494
diff changeset
  1126
  test(rexp(4), 10000000) { (r: Rexp) => 
Chengsong
parents: 494
diff changeset
  1127
  // ALTS(SEQ(SEQ(ONE,CHAR('a')),STAR(CHAR('a'))),SEQ(ALTS(CHAR('c'),ONE),STAR(ZERO))))))), 1) { (r: Rexp) => 
493
Chengsong
parents: 492
diff changeset
  1128
    val ss = stringsFromRexp(r)
Chengsong
parents: 492
diff changeset
  1129
    val boolList = ss.map(s => {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1130
      val bdStrong = bdersStrong(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1131
      val bdStrong5 = bdersStrong5(s.toList, internalise(r))
500
Chengsong
parents: 494
diff changeset
  1132
      val bdFurther5 = strongBsimp5(bdStrong5)
Chengsong
parents: 494
diff changeset
  1133
      val sizeFurther5 = asize(bdFurther5)
Chengsong
parents: 494
diff changeset
  1134
      val pdersSet = pderUNIV(r)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1135
      val size5 = asize(bdStrong5)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1136
      val size0 = asize(bdStrong)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1137
      // println(s)
500
Chengsong
parents: 494
diff changeset
  1138
      // println("pdersSet size")
Chengsong
parents: 494
diff changeset
  1139
      // println(pdersSet.size)
Chengsong
parents: 494
diff changeset
  1140
      // pdersSet.foreach(r => println(shortRexpOutput(r)))
Chengsong
parents: 494
diff changeset
  1141
      // println("after bdStrong5")
Chengsong
parents: 494
diff changeset
  1142
      
Chengsong
parents: 494
diff changeset
  1143
      // println(shortRexpOutput(erase(bdStrong5)))
Chengsong
parents: 494
diff changeset
  1144
      // println(breakIntoTerms(erase(bdStrong5)).size)
Chengsong
parents: 494
diff changeset
  1145
      
Chengsong
parents: 494
diff changeset
  1146
      // println("after bdStrong")
Chengsong
parents: 494
diff changeset
  1147
      // println(shortRexpOutput(erase(bdStrong)))
Chengsong
parents: 494
diff changeset
  1148
      // println(breakIntoTerms(erase(bdStrong)).size)
Chengsong
parents: 494
diff changeset
  1149
      // println(size5, size0, sizeFurther5)
Chengsong
parents: 494
diff changeset
  1150
      // aprint(strongBsimp5(bdStrong))
Chengsong
parents: 494
diff changeset
  1151
      // println(asize(strongBsimp5(bdStrong5)))
Chengsong
parents: 494
diff changeset
  1152
      // println(s)
Chengsong
parents: 494
diff changeset
  1153
      size5 <= size0 
493
Chengsong
parents: 492
diff changeset
  1154
    })
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1155
    // println(boolList)
500
Chengsong
parents: 494
diff changeset
  1156
    //!boolList.exists(b => b == false)
493
Chengsong
parents: 492
diff changeset
  1157
    !boolList.exists(b => b == false)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1158
  }
493
Chengsong
parents: 492
diff changeset
  1159
Chengsong
parents: 492
diff changeset
  1160
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1161
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1162
// small()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1163
generator_test()
493
Chengsong
parents: 492
diff changeset
  1164
Chengsong
parents: 492
diff changeset
  1165
1
Chengsong
parents: 492
diff changeset
  1166
Chengsong
parents: 492
diff changeset
  1167
SEQ(SEQ(SEQ(ONE,CHAR('b')),STAR(CHAR('b'))),
Chengsong
parents: 492
diff changeset
  1168
SEQ(ALTS(ALTS(ZERO,STAR(CHAR('b'))),
Chengsong
parents: 492
diff changeset
  1169
STAR(ALTS(CHAR('a'),SEQ(SEQ(STAR(ALTS(STAR(CHAR('c')),CHAR('a'))),
Chengsong
parents: 492
diff changeset
  1170
SEQ(CHAR('a'),SEQ(ALTS(CHAR('b'),ZERO),SEQ(ONE,CHAR('b'))))),ONE)))),ONE))
Chengsong
parents: 492
diff changeset
  1171
Chengsong
parents: 492
diff changeset
  1172
Chengsong
parents: 492
diff changeset
  1173
// Sequ(Sequ(Sequ(Empty,Chr(b)),Stars(List(Chr(b), Chr(b)))),Sequ(Right(Stars(List(Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty)), Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty))))),Empty))
Chengsong
parents: 492
diff changeset
  1174
// Sequ(Sequ(Sequ(Empty,Chr(b)),Stars(List(Chr(b), Chr(b)))),Sequ(Right(Stars(List(Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty)), Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty))))),Empty))