thys2/blexer2.sc
author Chengsong
Mon, 25 Apr 2022 17:00:18 +0100
changeset 494 c730d018ebfa
parent 493 1481f465e6ea
child 500 4d9eecfc936a
permissions -rw-r--r--
blexer2
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
431
Chengsong
parents:
diff changeset
     1
// A simple lexer inspired by work of Sulzmann & Lu
Chengsong
parents:
diff changeset
     2
//==================================================
Chengsong
parents:
diff changeset
     3
//
Chengsong
parents:
diff changeset
     4
// Call the test cases with 
Chengsong
parents:
diff changeset
     5
//
Chengsong
parents:
diff changeset
     6
//   amm lexer.sc small
Chengsong
parents:
diff changeset
     7
//   amm lexer.sc fib
Chengsong
parents:
diff changeset
     8
//   amm lexer.sc loops
Chengsong
parents:
diff changeset
     9
//   amm lexer.sc email
Chengsong
parents:
diff changeset
    10
//
Chengsong
parents:
diff changeset
    11
//   amm lexer.sc all
Chengsong
parents:
diff changeset
    12
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    13
import scala.util.Try
431
Chengsong
parents:
diff changeset
    14
Chengsong
parents:
diff changeset
    15
// regular expressions including records
Chengsong
parents:
diff changeset
    16
abstract class Rexp 
Chengsong
parents:
diff changeset
    17
case object ZERO extends Rexp
Chengsong
parents:
diff changeset
    18
case object ONE extends Rexp
Chengsong
parents:
diff changeset
    19
case object ANYCHAR extends Rexp
Chengsong
parents:
diff changeset
    20
case class CHAR(c: Char) extends Rexp
Chengsong
parents:
diff changeset
    21
case class ALTS(r1: Rexp, r2: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    22
case class SEQ(r1: Rexp, r2: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    23
case class STAR(r: Rexp) extends Rexp 
Chengsong
parents:
diff changeset
    24
case class RECD(x: String, r: Rexp) extends Rexp  
Chengsong
parents:
diff changeset
    25
case class NTIMES(n: Int, r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    26
case class OPTIONAL(r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    27
case class NOT(r: Rexp) extends Rexp
Chengsong
parents:
diff changeset
    28
                // records for extracting strings or tokens
Chengsong
parents:
diff changeset
    29
  
Chengsong
parents:
diff changeset
    30
// values  
Chengsong
parents:
diff changeset
    31
abstract class Val
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    32
case object Failure extends Val
431
Chengsong
parents:
diff changeset
    33
case object Empty extends Val
Chengsong
parents:
diff changeset
    34
case class Chr(c: Char) extends Val
Chengsong
parents:
diff changeset
    35
case class Sequ(v1: Val, v2: Val) extends Val
Chengsong
parents:
diff changeset
    36
case class Left(v: Val) extends Val
Chengsong
parents:
diff changeset
    37
case class Right(v: Val) extends Val
Chengsong
parents:
diff changeset
    38
case class Stars(vs: List[Val]) extends Val
Chengsong
parents:
diff changeset
    39
case class Rec(x: String, v: Val) extends Val
Chengsong
parents:
diff changeset
    40
case class Ntime(vs: List[Val]) extends Val
Chengsong
parents:
diff changeset
    41
case class Optionall(v: Val) extends Val
Chengsong
parents:
diff changeset
    42
case class Nots(s: String) extends Val
Chengsong
parents:
diff changeset
    43
Chengsong
parents:
diff changeset
    44
Chengsong
parents:
diff changeset
    45
Chengsong
parents:
diff changeset
    46
abstract class Bit
Chengsong
parents:
diff changeset
    47
case object Z extends Bit
Chengsong
parents:
diff changeset
    48
case object S extends Bit
Chengsong
parents:
diff changeset
    49
Chengsong
parents:
diff changeset
    50
Chengsong
parents:
diff changeset
    51
type Bits = List[Bit]
Chengsong
parents:
diff changeset
    52
Chengsong
parents:
diff changeset
    53
abstract class ARexp 
Chengsong
parents:
diff changeset
    54
case object AZERO extends ARexp
Chengsong
parents:
diff changeset
    55
case class AONE(bs: Bits) extends ARexp
Chengsong
parents:
diff changeset
    56
case class ACHAR(bs: Bits, c: Char) extends ARexp
Chengsong
parents:
diff changeset
    57
case class AALTS(bs: Bits, rs: List[ARexp]) extends ARexp 
Chengsong
parents:
diff changeset
    58
case class ASEQ(bs: Bits, r1: ARexp, r2: ARexp) extends ARexp 
Chengsong
parents:
diff changeset
    59
case class ASTAR(bs: Bits, r: ARexp) extends ARexp 
Chengsong
parents:
diff changeset
    60
case class ANOT(bs: Bits, r: ARexp) extends ARexp
Chengsong
parents:
diff changeset
    61
case class AANYCHAR(bs: Bits) extends ARexp
Chengsong
parents:
diff changeset
    62
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    63
trait Generator[+T] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    64
    self => // an alias for "this"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    65
    def generate(): T
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    66
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    67
    def gen(n: Int) : List[T] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    68
      if (n == 0) Nil else self.generate() :: gen(n - 1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    69
    
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    70
    def map[S](f: T => S): Generator[S] = new Generator[S] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    71
      def generate = f(self.generate())  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    72
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    73
    def flatMap[S](f: T => Generator[S]): Generator[S] = new Generator[S] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    74
      def generate = f(self.generate()).generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    75
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    76
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    77
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    78
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    79
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    80
  // tests a property according to a given random generator
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    81
  def test[T](r: Generator[T], amount: Int = 100)(pred: T => Boolean) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    82
    for (_ <- 0 until amount) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    83
      val value = r.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    84
      assert(pred(value), s"Test failed for: $value")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    85
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    86
    println(s"Test passed $amount times")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    87
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    88
  def test2[T, S](r: Generator[T], s: Generator[S], amount: Int = 100)(pred: (T, S) => Boolean) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    89
    for (_ <- 0 until amount) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    90
      val valueR = r.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    91
      val valueS = s.generate()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    92
      assert(pred(valueR, valueS), s"Test failed for: $valueR, $valueS")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    93
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    94
    println(s"Test passed $amount times")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    95
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    96
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    97
// random integers
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    98
val integers = new Generator[Int] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
    99
  val rand = new java.util.Random
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   100
  def generate() = rand.nextInt()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   101
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   102
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   103
// random booleans
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   104
val booleans = integers.map(_ > 0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   105
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   106
// random integers in the range lo and high  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   107
def range(lo: Int, hi: Int): Generator[Int] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   108
  for (x <- integers) yield (lo + x.abs % (hi - lo)).abs
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   109
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   110
// random characters
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   111
def chars_range(lo: Char, hi: Char) = range(lo, hi).map(_.toChar)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   112
val chars = chars_range('a', 'z')
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   113
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   114
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   115
def oneOf[T](xs: T*): Generator[T] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   116
  for (idx <- range(0, xs.length)) yield xs(idx)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   117
  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   118
def single[T](x: T) = new Generator[T] {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   119
  def generate() = x
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   120
}   
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   121
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   122
def pairs[T, U](t: Generator[T], u: Generator[U]): Generator[(T, U)] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   123
  for (x <- t; y <- u) yield (x, y)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   124
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   125
// lists
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   126
def emptyLists = single(Nil) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   127
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   128
def nonEmptyLists : Generator[List[Int]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   129
  for (head <- integers; tail <- lists) yield head :: tail
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   130
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   131
def lists: Generator[List[Int]] = for {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   132
  kind <- booleans
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   133
  list <- if (kind) emptyLists else nonEmptyLists
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   134
} yield list
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   135
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   136
def char_list(len: Int): Generator[List[Char]] = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   137
  if(len <= 0) single(Nil)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   138
  else{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   139
    for { 
493
Chengsong
parents: 492
diff changeset
   140
      c <- chars_range('a', 'd')
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   141
      tail <- char_list(len - 1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   142
    } yield c :: tail
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   143
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   144
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   145
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   146
def strings(len: Int): Generator[String] = for(cs <- char_list(len)) yield cs.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   147
493
Chengsong
parents: 492
diff changeset
   148
def sampleString(r: Rexp) : List[String] = r match {
Chengsong
parents: 492
diff changeset
   149
  case STAR(r) => stringsFromRexp(r).flatMap(s => List("", s, s ++ s))//only generate 0, 1, 2 reptitions
Chengsong
parents: 492
diff changeset
   150
  case SEQ(r1, r2) => stringsFromRexp(r1).flatMap(s1 => stringsFromRexp(r2).map(s2 => s1 ++ s2) )
Chengsong
parents: 492
diff changeset
   151
  case ALTS(r1, r2) => throw new Error(s" Rexp ${r} not expected: all alternatives are supposed to have been opened up")
Chengsong
parents: 492
diff changeset
   152
  case ONE => "" :: Nil
Chengsong
parents: 492
diff changeset
   153
  case ZERO => Nil
Chengsong
parents: 492
diff changeset
   154
  case CHAR(c) => c.toString :: Nil
Chengsong
parents: 492
diff changeset
   155
Chengsong
parents: 492
diff changeset
   156
}
Chengsong
parents: 492
diff changeset
   157
Chengsong
parents: 492
diff changeset
   158
def stringsFromRexp(r: Rexp) : List[String] = 
Chengsong
parents: 492
diff changeset
   159
  breakIntoTerms(r).flatMap(r => sampleString(r))
Chengsong
parents: 492
diff changeset
   160
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   161
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   162
// (simple) binary trees
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   163
trait Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   164
case class Inner[T](left: Tree[T], right: Tree[T]) extends Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   165
case class Leaf[T](x: T) extends Tree[T]
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   166
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   167
def leafs[T](t: Generator[T]): Generator[Leaf[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   168
  for (x <- t) yield Leaf(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   169
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   170
def inners[T](t: Generator[T]): Generator[Inner[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   171
  for (l <- trees(t); r <- trees(t)) yield Inner(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   172
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   173
def trees[T](t: Generator[T]): Generator[Tree[T]] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   174
  for (kind <- range(0, 2);  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   175
       tree <- if (kind == 0) leafs(t) else inners(t)) yield tree
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   176
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   177
// regular expressions
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   178
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   179
// generates random leaf-regexes; prefers CHAR-regexes
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   180
def leaf_rexp() : Generator[Rexp] =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   181
  for (kind <- range(0, 5);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   182
       c <- chars_range('a', 'd')) yield
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   183
    kind match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   184
      case 0 => ZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   185
      case 1 => ONE
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   186
      case _ => CHAR(c) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   187
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   188
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   189
// generates random inner regexes with maximum depth d
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   190
def inner_rexp(d: Int) : Generator[Rexp] =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   191
  for (kind <- range(0, 3);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   192
       l <- rexp(d); 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   193
       r <- rexp(d))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   194
  yield kind match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   195
    case 0 => ALTS(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   196
    case 1 => SEQ(l, r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   197
    case 2 => STAR(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   198
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   199
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   200
// generates random regexes with maximum depth d;
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   201
// prefers inner regexes in 2/3 of the cases
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   202
def rexp(d: Int = 100): Generator[Rexp] = 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   203
  for (kind <- range(0, 3);
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   204
       r <- if (d <= 0 || kind == 0) leaf_rexp() else inner_rexp(d - 1)) yield r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   205
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   206
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   207
// some test functions for rexps
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   208
def height(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   209
  case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   210
  case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   211
  case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   212
  case ALTS(r1, r2) => 1 + List(height(r1), height(r2)).max
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   213
  case SEQ(r1, r2) =>  1 + List(height(r1), height(r2)).max
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   214
  case STAR(r) => 1 + height(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   215
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   216
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   217
// def size(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   218
//   case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   219
//   case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   220
//   case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   221
//   case ALTS(r1, r2) => 1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   222
//   case SEQ(r1, r2) =>  1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   223
//   case STAR(r) => 1 + size(r) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   224
// }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   225
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   226
// randomly subtracts 1 or 2 from the STAR case
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   227
def size_faulty(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   228
  case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   229
  case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   230
  case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   231
  case ALTS(r1, r2) => 1 + size_faulty(r1) + size_faulty(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   232
  case SEQ(r1, r2) =>  1 + size_faulty(r1) + size_faulty(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   233
  case STAR(r) => 1 + size_faulty(r) - range(0, 2).generate
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   234
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   235
431
Chengsong
parents:
diff changeset
   236
Chengsong
parents:
diff changeset
   237
   
Chengsong
parents:
diff changeset
   238
// some convenience for typing in regular expressions
Chengsong
parents:
diff changeset
   239
Chengsong
parents:
diff changeset
   240
def charlist2rexp(s : List[Char]): Rexp = s match {
Chengsong
parents:
diff changeset
   241
  case Nil => ONE
Chengsong
parents:
diff changeset
   242
  case c::Nil => CHAR(c)
Chengsong
parents:
diff changeset
   243
  case c::s => SEQ(CHAR(c), charlist2rexp(s))
Chengsong
parents:
diff changeset
   244
}
Chengsong
parents:
diff changeset
   245
implicit def string2rexp(s : String) : Rexp = 
Chengsong
parents:
diff changeset
   246
  charlist2rexp(s.toList)
Chengsong
parents:
diff changeset
   247
Chengsong
parents:
diff changeset
   248
implicit def RexpOps(r: Rexp) = new {
Chengsong
parents:
diff changeset
   249
  def | (s: Rexp) = ALTS(r, s)
Chengsong
parents:
diff changeset
   250
  def % = STAR(r)
Chengsong
parents:
diff changeset
   251
  def ~ (s: Rexp) = SEQ(r, s)
Chengsong
parents:
diff changeset
   252
}
Chengsong
parents:
diff changeset
   253
Chengsong
parents:
diff changeset
   254
implicit def stringOps(s: String) = new {
Chengsong
parents:
diff changeset
   255
  def | (r: Rexp) = ALTS(s, r)
Chengsong
parents:
diff changeset
   256
  def | (r: String) = ALTS(s, r)
Chengsong
parents:
diff changeset
   257
  def % = STAR(s)
Chengsong
parents:
diff changeset
   258
  def ~ (r: Rexp) = SEQ(s, r)
Chengsong
parents:
diff changeset
   259
  def ~ (r: String) = SEQ(s, r)
Chengsong
parents:
diff changeset
   260
  def $ (r: Rexp) = RECD(s, r)
Chengsong
parents:
diff changeset
   261
}
Chengsong
parents:
diff changeset
   262
Chengsong
parents:
diff changeset
   263
def nullable(r: Rexp) : Boolean = r match {
Chengsong
parents:
diff changeset
   264
  case ZERO => false
Chengsong
parents:
diff changeset
   265
  case ONE => true
Chengsong
parents:
diff changeset
   266
  case CHAR(_) => false
Chengsong
parents:
diff changeset
   267
  case ANYCHAR => false
Chengsong
parents:
diff changeset
   268
  case ALTS(r1, r2) => nullable(r1) || nullable(r2)
Chengsong
parents:
diff changeset
   269
  case SEQ(r1, r2) => nullable(r1) && nullable(r2)
Chengsong
parents:
diff changeset
   270
  case STAR(_) => true
Chengsong
parents:
diff changeset
   271
  case RECD(_, r1) => nullable(r1)
Chengsong
parents:
diff changeset
   272
  case NTIMES(n, r) => if (n == 0) true else nullable(r)
Chengsong
parents:
diff changeset
   273
  case OPTIONAL(r) => true
Chengsong
parents:
diff changeset
   274
  case NOT(r) => !nullable(r)
Chengsong
parents:
diff changeset
   275
}
Chengsong
parents:
diff changeset
   276
Chengsong
parents:
diff changeset
   277
def der(c: Char, r: Rexp) : Rexp = r match {
Chengsong
parents:
diff changeset
   278
  case ZERO => ZERO
Chengsong
parents:
diff changeset
   279
  case ONE => ZERO
Chengsong
parents:
diff changeset
   280
  case CHAR(d) => if (c == d) ONE else ZERO
Chengsong
parents:
diff changeset
   281
  case ANYCHAR => ONE 
Chengsong
parents:
diff changeset
   282
  case ALTS(r1, r2) => ALTS(der(c, r1), der(c, r2))
Chengsong
parents:
diff changeset
   283
  case SEQ(r1, r2) => 
Chengsong
parents:
diff changeset
   284
    if (nullable(r1)) ALTS(SEQ(der(c, r1), r2), der(c, r2))
Chengsong
parents:
diff changeset
   285
    else SEQ(der(c, r1), r2)
Chengsong
parents:
diff changeset
   286
  case STAR(r) => SEQ(der(c, r), STAR(r))
Chengsong
parents:
diff changeset
   287
  case RECD(_, r1) => der(c, r1)
Chengsong
parents:
diff changeset
   288
  case NTIMES(n, r) => if(n > 0) SEQ(der(c, r), NTIMES(n - 1, r)) else ZERO
Chengsong
parents:
diff changeset
   289
  case OPTIONAL(r) => der(c, r)
Chengsong
parents:
diff changeset
   290
  case NOT(r) =>  NOT(der(c, r))
Chengsong
parents:
diff changeset
   291
}
Chengsong
parents:
diff changeset
   292
Chengsong
parents:
diff changeset
   293
Chengsong
parents:
diff changeset
   294
// extracts a string from a value
Chengsong
parents:
diff changeset
   295
def flatten(v: Val) : String = v match {
Chengsong
parents:
diff changeset
   296
  case Empty => ""
Chengsong
parents:
diff changeset
   297
  case Chr(c) => c.toString
Chengsong
parents:
diff changeset
   298
  case Left(v) => flatten(v)
Chengsong
parents:
diff changeset
   299
  case Right(v) => flatten(v)
Chengsong
parents:
diff changeset
   300
  case Sequ(v1, v2) => flatten(v1) ++ flatten(v2)
Chengsong
parents:
diff changeset
   301
  case Stars(vs) => vs.map(flatten).mkString
Chengsong
parents:
diff changeset
   302
  case Ntime(vs) => vs.map(flatten).mkString
Chengsong
parents:
diff changeset
   303
  case Optionall(v) => flatten(v)
Chengsong
parents:
diff changeset
   304
  case Rec(_, v) => flatten(v)
Chengsong
parents:
diff changeset
   305
}
Chengsong
parents:
diff changeset
   306
Chengsong
parents:
diff changeset
   307
Chengsong
parents:
diff changeset
   308
// extracts an environment from a value;
Chengsong
parents:
diff changeset
   309
// used for tokenising a string
Chengsong
parents:
diff changeset
   310
def env(v: Val) : List[(String, String)] = v match {
Chengsong
parents:
diff changeset
   311
  case Empty => Nil
Chengsong
parents:
diff changeset
   312
  case Chr(c) => Nil
Chengsong
parents:
diff changeset
   313
  case Left(v) => env(v)
Chengsong
parents:
diff changeset
   314
  case Right(v) => env(v)
Chengsong
parents:
diff changeset
   315
  case Sequ(v1, v2) => env(v1) ::: env(v2)
Chengsong
parents:
diff changeset
   316
  case Stars(vs) => vs.flatMap(env)
Chengsong
parents:
diff changeset
   317
  case Ntime(vs) => vs.flatMap(env)
Chengsong
parents:
diff changeset
   318
  case Rec(x, v) => (x, flatten(v))::env(v)
Chengsong
parents:
diff changeset
   319
  case Optionall(v) => env(v)
Chengsong
parents:
diff changeset
   320
  case Nots(s) => ("Negative", s) :: Nil
Chengsong
parents:
diff changeset
   321
}
Chengsong
parents:
diff changeset
   322
Chengsong
parents:
diff changeset
   323
Chengsong
parents:
diff changeset
   324
// The injection and mkeps part of the lexer
Chengsong
parents:
diff changeset
   325
//===========================================
Chengsong
parents:
diff changeset
   326
Chengsong
parents:
diff changeset
   327
def mkeps(r: Rexp) : Val = r match {
Chengsong
parents:
diff changeset
   328
  case ONE => Empty
Chengsong
parents:
diff changeset
   329
  case ALTS(r1, r2) => 
Chengsong
parents:
diff changeset
   330
    if (nullable(r1)) Left(mkeps(r1)) else Right(mkeps(r2))
Chengsong
parents:
diff changeset
   331
  case SEQ(r1, r2) => Sequ(mkeps(r1), mkeps(r2))
Chengsong
parents:
diff changeset
   332
  case STAR(r) => Stars(Nil)
Chengsong
parents:
diff changeset
   333
  case RECD(x, r) => Rec(x, mkeps(r))
Chengsong
parents:
diff changeset
   334
  case NTIMES(n, r) => Ntime(List.fill(n)(mkeps(r)))
Chengsong
parents:
diff changeset
   335
  case OPTIONAL(r) => Optionall(Empty)
Chengsong
parents:
diff changeset
   336
  case NOT(rInner) => if(nullable(rInner)) throw new Exception("error")  
Chengsong
parents:
diff changeset
   337
                         else Nots("")//Nots(s.reverse.toString)
Chengsong
parents:
diff changeset
   338
//   case NOT(ZERO) => Empty
Chengsong
parents:
diff changeset
   339
//   case NOT(CHAR(c)) => Empty
Chengsong
parents:
diff changeset
   340
//   case NOT(SEQ(r1, r2)) => Sequ(mkeps(NOT(r1)), mkeps(NOT(r2)))
Chengsong
parents:
diff changeset
   341
//   case NOT(ALTS(r1, r2)) => if(!nullable(r1)) Left(mkeps(NOT(r1))) else Right(mkeps(NOT(r2)))
Chengsong
parents:
diff changeset
   342
//   case NOT(STAR(r)) => Stars(Nil) 
Chengsong
parents:
diff changeset
   343
Chengsong
parents:
diff changeset
   344
}
Chengsong
parents:
diff changeset
   345
Chengsong
parents:
diff changeset
   346
def inj(r: Rexp, c: Char, v: Val) : Val = (r, v) match {
Chengsong
parents:
diff changeset
   347
  case (STAR(r), Sequ(v1, Stars(vs))) => Stars(inj(r, c, v1)::vs)
Chengsong
parents:
diff changeset
   348
  case (SEQ(r1, r2), Sequ(v1, v2)) => Sequ(inj(r1, c, v1), v2)
Chengsong
parents:
diff changeset
   349
  case (SEQ(r1, r2), Left(Sequ(v1, v2))) => Sequ(inj(r1, c, v1), v2)
Chengsong
parents:
diff changeset
   350
  case (SEQ(r1, r2), Right(v2)) => Sequ(mkeps(r1), inj(r2, c, v2))
Chengsong
parents:
diff changeset
   351
  case (ALTS(r1, r2), Left(v1)) => Left(inj(r1, c, v1))
Chengsong
parents:
diff changeset
   352
  case (ALTS(r1, r2), Right(v2)) => Right(inj(r2, c, v2))
Chengsong
parents:
diff changeset
   353
  case (CHAR(d), Empty) => Chr(c) 
Chengsong
parents:
diff changeset
   354
  case (RECD(x, r1), _) => Rec(x, inj(r1, c, v))
Chengsong
parents:
diff changeset
   355
  case (NTIMES(n, r), Sequ(v1, Ntime(vs))) => Ntime(inj(r, c, v1)::vs)
Chengsong
parents:
diff changeset
   356
  case (OPTIONAL(r), v) => Optionall(inj(r, c, v))
Chengsong
parents:
diff changeset
   357
  case (NOT(r), Nots(s)) => Nots(c.toString ++ s)
Chengsong
parents:
diff changeset
   358
  case (ANYCHAR, Empty) => Chr(c)
Chengsong
parents:
diff changeset
   359
}
Chengsong
parents:
diff changeset
   360
Chengsong
parents:
diff changeset
   361
// some "rectification" functions for simplification
Chengsong
parents:
diff changeset
   362
Chengsong
parents:
diff changeset
   363
Chengsong
parents:
diff changeset
   364
Chengsong
parents:
diff changeset
   365
Chengsong
parents:
diff changeset
   366
// The Lexing Rules for the WHILE Language
Chengsong
parents:
diff changeset
   367
Chengsong
parents:
diff changeset
   368
  // bnullable function: tests whether the aregular 
Chengsong
parents:
diff changeset
   369
  // expression can recognise the empty string
Chengsong
parents:
diff changeset
   370
def bnullable (r: ARexp) : Boolean = r match {
Chengsong
parents:
diff changeset
   371
    case AZERO => false
Chengsong
parents:
diff changeset
   372
    case AONE(_) => true
Chengsong
parents:
diff changeset
   373
    case ACHAR(_,_) => false
Chengsong
parents:
diff changeset
   374
    case AALTS(_, rs) => rs.exists(bnullable)
Chengsong
parents:
diff changeset
   375
    case ASEQ(_, r1, r2) => bnullable(r1) && bnullable(r2)
Chengsong
parents:
diff changeset
   376
    case ASTAR(_, _) => true
Chengsong
parents:
diff changeset
   377
    case ANOT(_, rn) => !bnullable(rn)
Chengsong
parents:
diff changeset
   378
  }
Chengsong
parents:
diff changeset
   379
Chengsong
parents:
diff changeset
   380
def mkepsBC(r: ARexp) : Bits = r match {
Chengsong
parents:
diff changeset
   381
    case AONE(bs) => bs
Chengsong
parents:
diff changeset
   382
    case AALTS(bs, rs) => {
Chengsong
parents:
diff changeset
   383
      val n = rs.indexWhere(bnullable)
Chengsong
parents:
diff changeset
   384
      bs ++ mkepsBC(rs(n))
Chengsong
parents:
diff changeset
   385
    }
Chengsong
parents:
diff changeset
   386
    case ASEQ(bs, r1, r2) => bs ++ mkepsBC(r1) ++ mkepsBC(r2)
Chengsong
parents:
diff changeset
   387
    case ASTAR(bs, r) => bs ++ List(Z)
Chengsong
parents:
diff changeset
   388
    case ANOT(bs, rn) => bs
Chengsong
parents:
diff changeset
   389
  }
Chengsong
parents:
diff changeset
   390
Chengsong
parents:
diff changeset
   391
Chengsong
parents:
diff changeset
   392
def bder(c: Char, r: ARexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   393
    case AZERO => AZERO
Chengsong
parents:
diff changeset
   394
    case AONE(_) => AZERO
Chengsong
parents:
diff changeset
   395
    case ACHAR(bs, f) => if (c == f) AONE(bs) else AZERO
Chengsong
parents:
diff changeset
   396
    case AALTS(bs, rs) => AALTS(bs, rs.map(bder(c, _)))
Chengsong
parents:
diff changeset
   397
    case ASEQ(bs, r1, r2) => 
Chengsong
parents:
diff changeset
   398
      if (bnullable(r1)) AALTS(bs, ASEQ(Nil, bder(c, r1), r2) :: fuse(mkepsBC(r1), bder(c, r2)) :: Nil )
Chengsong
parents:
diff changeset
   399
      else ASEQ(bs, bder(c, r1), r2)
Chengsong
parents:
diff changeset
   400
    case ASTAR(bs, r) => ASEQ(bs, fuse(List(S), bder(c, r)), ASTAR(Nil, r))
Chengsong
parents:
diff changeset
   401
    case ANOT(bs, rn) => ANOT(bs, bder(c, rn))
Chengsong
parents:
diff changeset
   402
    case AANYCHAR(bs) => AONE(bs)
Chengsong
parents:
diff changeset
   403
  } 
Chengsong
parents:
diff changeset
   404
Chengsong
parents:
diff changeset
   405
def fuse(bs: Bits, r: ARexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   406
    case AZERO => AZERO
Chengsong
parents:
diff changeset
   407
    case AONE(cs) => AONE(bs ++ cs)
Chengsong
parents:
diff changeset
   408
    case ACHAR(cs, f) => ACHAR(bs ++ cs, f)
Chengsong
parents:
diff changeset
   409
    case AALTS(cs, rs) => AALTS(bs ++ cs, rs)
Chengsong
parents:
diff changeset
   410
    case ASEQ(cs, r1, r2) => ASEQ(bs ++ cs, r1, r2)
Chengsong
parents:
diff changeset
   411
    case ASTAR(cs, r) => ASTAR(bs ++ cs, r)
Chengsong
parents:
diff changeset
   412
    case ANOT(cs, r) => ANOT(bs ++ cs, r)
Chengsong
parents:
diff changeset
   413
  }
Chengsong
parents:
diff changeset
   414
Chengsong
parents:
diff changeset
   415
Chengsong
parents:
diff changeset
   416
def internalise(r: Rexp) : ARexp = r match {
Chengsong
parents:
diff changeset
   417
    case ZERO => AZERO
Chengsong
parents:
diff changeset
   418
    case ONE => AONE(Nil)
Chengsong
parents:
diff changeset
   419
    case CHAR(c) => ACHAR(Nil, c)
Chengsong
parents:
diff changeset
   420
    //case PRED(f) => APRED(Nil, f)
Chengsong
parents:
diff changeset
   421
    case ALTS(r1, r2) => 
Chengsong
parents:
diff changeset
   422
      AALTS(Nil, List(fuse(List(Z), internalise(r1)), fuse(List(S), internalise(r2))))
Chengsong
parents:
diff changeset
   423
    // case ALTS(r1::rs) => {
Chengsong
parents:
diff changeset
   424
    //   val AALTS(Nil, rs2) = internalise(ALTS(rs))
Chengsong
parents:
diff changeset
   425
    //   AALTS(Nil, fuse(List(Z), internalise(r1)) :: rs2.map(fuse(List(S), _)))
Chengsong
parents:
diff changeset
   426
    // }
Chengsong
parents:
diff changeset
   427
    case SEQ(r1, r2) => ASEQ(Nil, internalise(r1), internalise(r2))
Chengsong
parents:
diff changeset
   428
    case STAR(r) => ASTAR(Nil, internalise(r))
Chengsong
parents:
diff changeset
   429
    case RECD(x, r) => internalise(r)
Chengsong
parents:
diff changeset
   430
    case NOT(r) => ANOT(Nil, internalise(r))
Chengsong
parents:
diff changeset
   431
    case ANYCHAR => AANYCHAR(Nil)
Chengsong
parents:
diff changeset
   432
  }
Chengsong
parents:
diff changeset
   433
Chengsong
parents:
diff changeset
   434
Chengsong
parents:
diff changeset
   435
def bsimp(r: ARexp): ARexp = 
Chengsong
parents:
diff changeset
   436
  {
Chengsong
parents:
diff changeset
   437
    r match {
Chengsong
parents:
diff changeset
   438
      case ASEQ(bs1, r1, r2) => (bsimp(r1), bsimp(r2)) match {
Chengsong
parents:
diff changeset
   439
          case (AZERO, _) => AZERO
Chengsong
parents:
diff changeset
   440
          case (_, AZERO) => AZERO
Chengsong
parents:
diff changeset
   441
          case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
Chengsong
parents:
diff changeset
   442
          case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
Chengsong
parents:
diff changeset
   443
      }
Chengsong
parents:
diff changeset
   444
      case AALTS(bs1, rs) => {
Chengsong
parents:
diff changeset
   445
            val rs_simp = rs.map(bsimp(_))
Chengsong
parents:
diff changeset
   446
            val flat_res = flats(rs_simp)
Chengsong
parents:
diff changeset
   447
            val dist_res = distinctBy(flat_res, erase)//strongDB(flat_res)//distinctBy(flat_res, erase)
Chengsong
parents:
diff changeset
   448
            dist_res match {
Chengsong
parents:
diff changeset
   449
              case Nil => AZERO
Chengsong
parents:
diff changeset
   450
              case s :: Nil => fuse(bs1, s)
Chengsong
parents:
diff changeset
   451
              case rs => AALTS(bs1, rs)  
Chengsong
parents:
diff changeset
   452
            }
Chengsong
parents:
diff changeset
   453
          
Chengsong
parents:
diff changeset
   454
      }
Chengsong
parents:
diff changeset
   455
      case r => r
Chengsong
parents:
diff changeset
   456
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   457
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   458
def strongBsimp(r: ARexp): ARexp =
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   459
{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   460
  r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   461
    case ASEQ(bs1, r1, r2) => (strongBsimp(r1), strongBsimp(r2)) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   462
        case (AZERO, _) => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   463
        case (_, AZERO) => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   464
        case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   465
        case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
431
Chengsong
parents:
diff changeset
   466
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   467
    case AALTS(bs1, rs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   468
          val rs_simp = rs.map(strongBsimp(_))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   469
          val flat_res = flats(rs_simp)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   470
          val dist_res = distinctBy4(flat_res)//distinctBy(flat_res, erase)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   471
          dist_res match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   472
            case Nil => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   473
            case s :: Nil => fuse(bs1, s)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   474
            case rs => AALTS(bs1, rs)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   475
          }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   476
        
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   477
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   478
    case r => r
431
Chengsong
parents:
diff changeset
   479
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   480
}
431
Chengsong
parents:
diff changeset
   481
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   482
def strongBsimp5(r: ARexp): ARexp =
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   483
{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   484
  // println("was this called?")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   485
  r match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   486
    case ASEQ(bs1, r1, r2) => (strongBsimp5(r1), strongBsimp5(r2)) match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   487
        case (AZERO, _) => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   488
        case (_, AZERO) => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   489
        case (AONE(bs2), r2s) => fuse(bs1 ++ bs2, r2s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   490
        case (r1s, r2s) => ASEQ(bs1, r1s, r2s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   491
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   492
    case AALTS(bs1, rs) => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   493
        // println("alts case")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   494
          val rs_simp = rs.map(strongBsimp5(_))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   495
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   496
          val flat_res = flats(rs_simp)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   497
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   498
          val dist_res = distinctBy5(flat_res)//distinctBy(flat_res, erase)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   499
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   500
          dist_res match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   501
            case Nil => AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   502
            case s :: Nil => fuse(bs1, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   503
            case rs => AALTS(bs1, rs)  
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   504
          }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   505
        
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   506
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   507
    case r => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   508
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   509
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   510
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   511
def bders (s: List[Char], r: ARexp) : ARexp = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   512
  case Nil => r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   513
  case c::s => bders(s, bder(c, r))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   514
}
431
Chengsong
parents:
diff changeset
   515
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   516
def flats(rs: List[ARexp]): List[ARexp] = rs match {
431
Chengsong
parents:
diff changeset
   517
    case Nil => Nil
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   518
    case AZERO :: rs1 => flats(rs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   519
    case AALTS(bs, rs1) :: rs2 => rs1.map(fuse(bs, _)) ::: flats(rs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   520
    case r1 :: rs2 => r1 :: flats(rs2)
431
Chengsong
parents:
diff changeset
   521
  }
Chengsong
parents:
diff changeset
   522
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   523
def distinctBy[B, C](xs: List[B], f: B => C, acc: List[C] = Nil): List[B] = xs match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   524
  case Nil => Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   525
  case (x::xs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   526
    val res = f(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   527
    if (acc.contains(res)) distinctBy(xs, f, acc)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   528
    else x::distinctBy(xs, f, res::acc)
431
Chengsong
parents:
diff changeset
   529
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   530
} 
431
Chengsong
parents:
diff changeset
   531
Chengsong
parents:
diff changeset
   532
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   533
def pruneRexp(r: ARexp, allowableTerms: List[Rexp]) : ARexp = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   534
  r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   535
    case ASEQ(bs, r1, r2) => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   536
      val termsTruncated = allowableTerms.collect(rt => rt match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   537
        case SEQ(r1p, r2p) if(r2p == erase(r2)) => r1p//if(r2p == erase(r2)) 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   538
      })
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   539
      val pruned : ARexp = pruneRexp(r1, termsTruncated)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   540
      pruned match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   541
        case AZERO => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   542
        case AONE(bs1) => fuse(bs ++ bs1, r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   543
        case pruned1 => ASEQ(bs, pruned1, r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   544
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   545
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   546
    case AALTS(bs, rs) => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   547
      //allowableTerms.foreach(a => println(shortRexpOutput(a)))        
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   548
      val rsp = rs.map(r => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   549
                    pruneRexp(r, allowableTerms)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   550
                  )
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   551
                  .filter(r => r != AZERO)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   552
      rsp match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   553
        case Nil => AZERO
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   554
        case r1::Nil => fuse(bs, r1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   555
        case rs1 => AALTS(bs, rs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   556
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   557
    case r => 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   558
      if(allowableTerms.contains(erase(r))) r else AZERO //assert(r != AZERO)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   559
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   560
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   561
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   562
def oneSimp(r: Rexp) : Rexp = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   563
  case SEQ(ONE, r) => r
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   564
  case SEQ(r1, r2) => SEQ(oneSimp(r1), r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   565
  case r => r//assert r != 0 
432
994403dbbed5 strong!
Chengsong
parents: 431
diff changeset
   566
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   567
}
431
Chengsong
parents:
diff changeset
   568
Chengsong
parents:
diff changeset
   569
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   570
def distinctBy4(xs: List[ARexp], acc: List[Rexp] = Nil) : List[ARexp] = xs match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   571
  case Nil => Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   572
  case x :: xs =>
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   573
    //assert(acc.distinct == acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   574
    val erased = erase(x)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   575
    if(acc.contains(erased))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   576
      distinctBy4(xs, acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   577
    else{
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   578
      val addToAcc =  breakIntoTerms(erased).filter(r => !acc.contains(oneSimp(r)))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   579
      //val xp = pruneRexp(x, addToAcc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   580
      pruneRexp(x, addToAcc) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   581
        case AZERO => distinctBy4(xs, addToAcc.map(oneSimp(_)) ::: acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   582
        case xPrime => xPrime :: distinctBy4(xs, addToAcc.map(oneSimp(_)) ::: acc)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   583
      }
431
Chengsong
parents:
diff changeset
   584
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   585
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   586
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   587
// fun pAKC_aux :: "arexp list ⇒ arexp ⇒ rexp ⇒ arexp"
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   588
//   where
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   589
// "pAKC_aux rsa r ctx = (if (L (SEQ (erase r) ( ctx) )) ⊆ (L (erase (AALTs [] rsa))) then AZERO else
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   590
//                           case r of (ASEQ bs r1 r2) ⇒ 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   591
//                             bsimp_ASEQ bs (pAKC_aux rsa r1 (SEQ  (erase r2) ( ctx) )) r2   |
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   592
//                                     (AALTs bs rs) ⇒ 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   593
//                             bsimp_AALTs bs (flts (map (λr. pAKC_aux rsa r ( ctx) ) rs) )    |
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   594
//                                     r             ⇒ r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   595
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   596
// def canonicalSeq(rs: List[Rexp], acc: Rexp) = rs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   597
//   case r::Nil => SEQ(r, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   598
//   case Nil => acc
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   599
//   case r1::r2::Nil => SEQ(SEQ(r1, r2), acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   600
// }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   601
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   602
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   603
//the "fake" Language interpretation: just concatenates!
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   604
def L(acc: Rexp, rs: List[Rexp]) : Rexp = rs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   605
  case Nil => acc
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   606
  case r :: rs1 => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   607
    if(acc == ONE) 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   608
      L(r, rs1) 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   609
    else
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   610
      L(SEQ(acc, r), rs1)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   611
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   612
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   613
def pAKC(rs: List[Rexp], r: ARexp, ctx: List[Rexp]) : ARexp = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   614
  if (breakIntoTerms(L(erase(r), ctx)).map(oneSimp).forall(rs.contains)) {//rs.flatMap(breakIntoTerms
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   615
    AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   616
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   617
  else{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   618
    r match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   619
      case ASEQ(bs, r1, r2) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   620
      (pAKC(rs, r1, erase(r2) :: ctx)) match{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   621
        case AZERO => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   622
          AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   623
        case AONE(bs1) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   624
          fuse(bs1, r2)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   625
        case r1p => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   626
          ASEQ(bs, r1p, r2)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   627
      }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   628
      case AALTS(bs, rs0) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   629
        // println("before pruning")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   630
        // println(s"ctx is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   631
        // ctx.foreach(r => println(shortRexpOutput(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   632
        // println(s"rs0 is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   633
        // rs0.foreach(r => println(shortRexpOutput(erase(r))))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   634
        // println(s"rs is ")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   635
        // rs.foreach(r => println(shortRexpOutput(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   636
        rs0.map(r => pAKC(rs, r, ctx)).filter(_ != AZERO) match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   637
          case Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   638
            // println("after pruning Nil")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   639
            AZERO
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   640
          case r :: Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   641
            // println("after pruning singleton")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   642
            // println(shortRexpOutput(erase(r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   643
            r 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   644
          case rs0p => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   645
          // println("after pruning non-singleton")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   646
            AALTS(bs, rs0p)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   647
        }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   648
      case r => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   649
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   650
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   651
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   652
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   653
def distinctBy5(xs: List[ARexp], acc: List[Rexp] = Nil) : List[ARexp] = xs match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   654
  case Nil => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   655
    Nil
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   656
  case x :: xs => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   657
    val erased = erase(x)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   658
    if(acc.contains(erased)){
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   659
      distinctBy5(xs, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   660
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   661
    else{
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   662
      val pruned = pAKC(acc, x, Nil)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   663
      val newTerms = breakIntoTerms(erase(pruned))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   664
      pruned match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   665
        case AZERO => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   666
          distinctBy5(xs, acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   667
        case xPrime => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   668
          xPrime :: distinctBy5(xs, newTerms.map(oneSimp) ::: acc)//distinctBy5(xs, addToAcc.map(oneSimp(_)) ::: acc)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   669
      }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   670
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   671
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   672
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   673
431
Chengsong
parents:
diff changeset
   674
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   675
def breakIntoTerms(r: Rexp) : List[Rexp] = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   676
  case SEQ(r1, r2)  => breakIntoTerms(r1).map(r11 => SEQ(r11, r2))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   677
  case ALTS(r1, r2) => breakIntoTerms(r1) ::: breakIntoTerms(r2)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   678
  case ZERO => Nil
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   679
  case _ => r::Nil
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   680
}
431
Chengsong
parents:
diff changeset
   681
Chengsong
parents:
diff changeset
   682
Chengsong
parents:
diff changeset
   683
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   684
def decode_aux(r: Rexp, bs: Bits) : (Val, Bits) = (r, bs) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   685
  case (ONE, bs) => (Empty, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   686
  case (CHAR(f), bs) => (Chr(f), bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   687
  case (ALTS(r1, r2), Z::bs1) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   688
      val (v, bs2) = decode_aux(r1, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   689
      (Left(v), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   690
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   691
  case (ALTS(r1, r2), S::bs1) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   692
      val (v, bs2) = decode_aux(r2, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   693
      (Right(v), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   694
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   695
  case (SEQ(r1, r2), bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   696
    val (v1, bs1) = decode_aux(r1, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   697
    val (v2, bs2) = decode_aux(r2, bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   698
    (Sequ(v1, v2), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   699
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   700
  case (STAR(r1), S::bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   701
    val (v, bs1) = decode_aux(r1, bs)
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   702
    //(v)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   703
    val (Stars(vs), bs2) = decode_aux(STAR(r1), bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   704
    (Stars(v::vs), bs2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   705
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   706
  case (STAR(_), Z::bs) => (Stars(Nil), bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   707
  case (RECD(x, r1), bs) => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   708
    val (v, bs1) = decode_aux(r1, bs)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   709
    (Rec(x, v), bs1)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   710
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   711
  case (NOT(r), bs) => (Nots(r.toString), bs)
431
Chengsong
parents:
diff changeset
   712
}
Chengsong
parents:
diff changeset
   713
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   714
def decode(r: Rexp, bs: Bits) = decode_aux(r, bs) match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   715
  case (v, Nil) => v
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   716
  case _ => throw new Exception("Not decodable")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   717
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   718
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   719
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   720
431
Chengsong
parents:
diff changeset
   721
def blexing_simp(r: Rexp, s: String) : Val = {
Chengsong
parents:
diff changeset
   722
    val bit_code = blex_simp(internalise(r), s.toList)
Chengsong
parents:
diff changeset
   723
    decode(r, bit_code)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   724
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   725
def simpBlexer(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   726
  Try(blexing_simp(r, s)).getOrElse(Failure)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   727
}
431
Chengsong
parents:
diff changeset
   728
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   729
def strong_blexing_simp(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   730
  decode(r, strong_blex_simp(internalise(r), s.toList))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   731
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   732
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   733
def strong_blexing_simp5(r: Rexp, s: String) : Val = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   734
  decode(r, strong_blex_simp5(internalise(r), s.toList))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   735
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   736
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   737
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   738
def strongBlexer(r: Rexp, s: String) : Val = {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   739
  Try(strong_blexing_simp(r, s)).getOrElse(Failure)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   740
}
431
Chengsong
parents:
diff changeset
   741
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   742
def strongBlexer5(r: Rexp, s: String): Val = {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   743
  Try(strong_blexing_simp5(r, s)).getOrElse(Failure)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   744
}
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   745
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   746
def strong_blex_simp(r: ARexp, s: List[Char]) : Bits = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   747
  case Nil => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   748
    if (bnullable(r)) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   749
      //println(asize(r))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   750
      val bits = mkepsBC(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   751
      bits
431
Chengsong
parents:
diff changeset
   752
    }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   753
    else 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   754
      throw new Exception("Not matched")
431
Chengsong
parents:
diff changeset
   755
  }
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   756
  case c::cs => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   757
    val der_res = bder(c,r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   758
    val simp_res = strongBsimp(der_res)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   759
    strong_blex_simp(simp_res, cs)      
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   760
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   761
}
431
Chengsong
parents:
diff changeset
   762
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   763
def strong_blex_simp5(r: ARexp, s: List[Char]) : Bits = s match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   764
  case Nil => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   765
    if (bnullable(r)) {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   766
      //println(asize(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   767
      val bits = mkepsBC(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   768
      bits
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   769
    }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   770
    else 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   771
      throw new Exception("Not matched")
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   772
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   773
  case c::cs => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   774
    val der_res = bder(c,r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   775
    val simp_res = strongBsimp5(der_res)  
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   776
    strong_blex_simp5(simp_res, cs)      
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   777
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   778
}
431
Chengsong
parents:
diff changeset
   779
Chengsong
parents:
diff changeset
   780
Chengsong
parents:
diff changeset
   781
  def bders_simp(s: List[Char], r: ARexp) : ARexp = s match {
Chengsong
parents:
diff changeset
   782
    case Nil => r
435
Chengsong
parents: 432
diff changeset
   783
    case c::s => 
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   784
      //println(erase(r))
435
Chengsong
parents: 432
diff changeset
   785
      bders_simp(s, bsimp(bder(c, r)))
431
Chengsong
parents:
diff changeset
   786
  }
Chengsong
parents:
diff changeset
   787
  
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   788
  def bdersStrong5(s: List[Char], r: ARexp) : ARexp = s match {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   789
    case Nil => r
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   790
    case c::s => bdersStrong5(s, strongBsimp5(bder(c, r)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   791
  }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
   792
431
Chengsong
parents:
diff changeset
   793
  def bdersSimp(s: String, r: Rexp) : ARexp = bders_simp(s.toList, internalise(r))
Chengsong
parents:
diff changeset
   794
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   795
  def bdersStrong(s: List[Char], r: ARexp) : ARexp = s match {
431
Chengsong
parents:
diff changeset
   796
    case Nil => r 
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   797
    case c::s => bdersStrong(s, strongBsimp(bder(c, r)))
431
Chengsong
parents:
diff changeset
   798
  }
Chengsong
parents:
diff changeset
   799
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   800
  def bdersStrongRexp(s: String, r: Rexp) : ARexp = bdersStrong(s.toList, internalise(r))
431
Chengsong
parents:
diff changeset
   801
Chengsong
parents:
diff changeset
   802
  def erase(r:ARexp): Rexp = r match{
Chengsong
parents:
diff changeset
   803
    case AZERO => ZERO
Chengsong
parents:
diff changeset
   804
    case AONE(_) => ONE
Chengsong
parents:
diff changeset
   805
    case ACHAR(bs, c) => CHAR(c)
Chengsong
parents:
diff changeset
   806
    case AALTS(bs, Nil) => ZERO
Chengsong
parents:
diff changeset
   807
    case AALTS(bs, a::Nil) => erase(a)
Chengsong
parents:
diff changeset
   808
    case AALTS(bs, a::as) => ALTS(erase(a), erase(AALTS(bs, as)))
Chengsong
parents:
diff changeset
   809
    case ASEQ(bs, r1, r2) => SEQ (erase(r1), erase(r2))
Chengsong
parents:
diff changeset
   810
    case ASTAR(cs, r)=> STAR(erase(r))
Chengsong
parents:
diff changeset
   811
    case ANOT(bs, r) => NOT(erase(r))
Chengsong
parents:
diff changeset
   812
    case AANYCHAR(bs) => ANYCHAR
Chengsong
parents:
diff changeset
   813
  }
Chengsong
parents:
diff changeset
   814
Chengsong
parents:
diff changeset
   815
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   816
  def allCharSeq(r: Rexp) : Boolean = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   817
    case CHAR(c) => true
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   818
    case SEQ(r1, r2) => allCharSeq(r1) && allCharSeq(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   819
    case _ => false
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   820
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   821
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   822
  def flattenSeq(r: Rexp) : String = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   823
    case CHAR(c) => c.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   824
    case SEQ(r1, r2) => flattenSeq(r1) ++ flattenSeq(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   825
    case _ => throw new Error("flatten unflattenable rexp")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   826
  } 
431
Chengsong
parents:
diff changeset
   827
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   828
  def shortRexpOutput(r: Rexp) : String = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   829
      case CHAR(c) => c.toString
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   830
      case ONE => "1"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   831
      case ZERO => "0"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   832
      case SEQ(r1, r2) if(allCharSeq(r)) => flattenSeq(r)//"[" ++ shortRexpOutput(r1) ++ "~" ++ shortRexpOutput(r2) ++ "]"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   833
      case SEQ(r1, r2) => "[" ++ shortRexpOutput(r1) ++ "~" ++ shortRexpOutput(r2) ++ "]"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   834
      case ALTS(r1, r2) => "(" ++ shortRexpOutput(r1) ++ "+" ++ shortRexpOutput(r2) ++ ")"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   835
      case STAR(STAR(r)) => "(..)*"// ++ shortRexpOutput(r) ++ "]*"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   836
      case STAR(r) => "STAR(" ++ shortRexpOutput(r) ++ ")"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   837
      //case RTOP => "RTOP"
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   838
    }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   839
431
Chengsong
parents:
diff changeset
   840
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   841
  def blex_simp(r: ARexp, s: List[Char]) : Bits = s match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   842
      case Nil => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   843
        if (bnullable(r)) {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   844
          val bits = mkepsBC(r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   845
          bits
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   846
        }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   847
        else 
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   848
          throw new Exception("Not matched")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   849
      }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   850
      case c::cs => {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   851
        val der_res = bder(c,r)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   852
        val simp_res = bsimp(der_res)  
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   853
        blex_simp(simp_res, cs)      
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   854
      }
431
Chengsong
parents:
diff changeset
   855
  }
Chengsong
parents:
diff changeset
   856
Chengsong
parents:
diff changeset
   857
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   858
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   859
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   860
    def size(r: Rexp) : Int = r match {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   861
      case ZERO => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   862
      case ONE => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   863
      case CHAR(_) => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   864
      case ANYCHAR => 1
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   865
      case NOT(r0) => 1 + size(r0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   866
      case SEQ(r1, r2) => 1 + size(r1) + size(r2)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   867
      case ALTS(r1, r2) => 1 + List(r1, r2).map(size).sum
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   868
      case STAR(r) => 1 + size(r)
431
Chengsong
parents:
diff changeset
   869
    }
Chengsong
parents:
diff changeset
   870
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   871
    def asize(a: ARexp) = size(erase(a))
431
Chengsong
parents:
diff changeset
   872
Chengsong
parents:
diff changeset
   873
//pder related
Chengsong
parents:
diff changeset
   874
type Mon = (Char, Rexp)
Chengsong
parents:
diff changeset
   875
type Lin = Set[Mon]
Chengsong
parents:
diff changeset
   876
Chengsong
parents:
diff changeset
   877
def dot_prod(rs: Set[Rexp], r: Rexp): Set[Rexp] = r match {
Chengsong
parents:
diff changeset
   878
    case ZERO => Set()
Chengsong
parents:
diff changeset
   879
    case ONE => rs
Chengsong
parents:
diff changeset
   880
    case r => rs.map((re) => if (re == ONE) r else SEQ(re, r)  )   
Chengsong
parents:
diff changeset
   881
  }
Chengsong
parents:
diff changeset
   882
  def cir_prod(l: Lin, t: Rexp): Lin = t match {//remember this Lin is different from the Lin in Antimirov's paper. Here it does not mean the set of all subsets of linear forms that does not contain zero, but rather the type a set of linear forms
Chengsong
parents:
diff changeset
   883
    case ZERO => Set()
Chengsong
parents:
diff changeset
   884
    case ONE => l
Chengsong
parents:
diff changeset
   885
    case t => l.map( m => m._2 match {case ZERO => m case ONE => (m._1, t) case p => (m._1, SEQ(p, t)) }  )
Chengsong
parents:
diff changeset
   886
  }
Chengsong
parents:
diff changeset
   887
  def lf(r: Rexp): Lin = r match {
Chengsong
parents:
diff changeset
   888
    case ZERO => Set()
Chengsong
parents:
diff changeset
   889
    case ONE => Set()
Chengsong
parents:
diff changeset
   890
    case CHAR(f) => {
Chengsong
parents:
diff changeset
   891
      //val Some(c) = alphabet.find(f) 
Chengsong
parents:
diff changeset
   892
      Set((f, ONE))
Chengsong
parents:
diff changeset
   893
    }
Chengsong
parents:
diff changeset
   894
    case ALTS(r1, r2) => {
Chengsong
parents:
diff changeset
   895
      lf(r1 ) ++ lf(r2)
Chengsong
parents:
diff changeset
   896
    }
Chengsong
parents:
diff changeset
   897
    case STAR(r1) => cir_prod(lf(r1), STAR(r1)) //may try infix notation later......
Chengsong
parents:
diff changeset
   898
    case SEQ(r1, r2) =>{
Chengsong
parents:
diff changeset
   899
      if (nullable(r1))
Chengsong
parents:
diff changeset
   900
        cir_prod(lf(r1), r2) ++ lf(r2)
Chengsong
parents:
diff changeset
   901
      else
Chengsong
parents:
diff changeset
   902
        cir_prod(lf(r1), r2) 
Chengsong
parents:
diff changeset
   903
    }
Chengsong
parents:
diff changeset
   904
  }
Chengsong
parents:
diff changeset
   905
  def lfs(r: Set[Rexp]): Lin = {
Chengsong
parents:
diff changeset
   906
    r.foldLeft(Set[Mon]())((acc, r) => acc ++ lf(r))
Chengsong
parents:
diff changeset
   907
  }
Chengsong
parents:
diff changeset
   908
Chengsong
parents:
diff changeset
   909
  def pder(x: Char, t: Rexp): Set[Rexp] = {
Chengsong
parents:
diff changeset
   910
    val lft = lf(t)
Chengsong
parents:
diff changeset
   911
    (lft.filter(mon => if(mon._1 == x) true else false)).map(mon => mon._2)
Chengsong
parents:
diff changeset
   912
  }
Chengsong
parents:
diff changeset
   913
  def pders_single(s: List[Char], t: Rexp) : Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   914
    case x::xs => pders(xs, pder(x, t))
Chengsong
parents:
diff changeset
   915
    case Nil => Set(t)
Chengsong
parents:
diff changeset
   916
  }
Chengsong
parents:
diff changeset
   917
  def pders(s: List[Char], ts: Set[Rexp]) : Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   918
    case x::xs => pders(xs, ts.foldLeft(Set[Rexp]())((acc, t) => acc ++ pder(x, t)))
Chengsong
parents:
diff changeset
   919
    case Nil => ts 
Chengsong
parents:
diff changeset
   920
  }
Chengsong
parents:
diff changeset
   921
  def pderss(ss: List[List[Char]], t: Rexp): Set[Rexp] = ss.foldLeft( Set[Rexp]() )( (acc, s) => pders_single(s, t) ++ acc )
Chengsong
parents:
diff changeset
   922
  def pdera(t: Rexp): Set[Rexp] = lf(t).map(mon => mon._2)
Chengsong
parents:
diff changeset
   923
  //all implementation of partial derivatives that involve set union are potentially buggy
Chengsong
parents:
diff changeset
   924
  //because they don't include the original regular term before they are pdered.
Chengsong
parents:
diff changeset
   925
  //now only pderas is fixed.
Chengsong
parents:
diff changeset
   926
  def pderas(t: Set[Rexp], d: Int): Set[Rexp] = if(d > 0) pderas(lfs(t).map(mon => mon._2), d - 1) ++ t else lfs(t).map(mon => mon._2) ++ t//repeated application of pderas over the newest set of pders.
Chengsong
parents:
diff changeset
   927
  def pderUNIV(r: Rexp) : Set[Rexp] = pderas(Set(r), awidth(r) + 1)
Chengsong
parents:
diff changeset
   928
  def awidth(r: Rexp) : Int = r match {
Chengsong
parents:
diff changeset
   929
    case CHAR(c) => 1
Chengsong
parents:
diff changeset
   930
    case SEQ(r1, r2) => awidth(r1) + awidth(r2)
Chengsong
parents:
diff changeset
   931
    case ALTS(r1, r2) => awidth(r1) + awidth(r2)
Chengsong
parents:
diff changeset
   932
    case ONE => 0
Chengsong
parents:
diff changeset
   933
    case ZERO => 0
Chengsong
parents:
diff changeset
   934
    case STAR(r) => awidth(r)
Chengsong
parents:
diff changeset
   935
  }
Chengsong
parents:
diff changeset
   936
  //def sigma_lf(l: Set[Mon]) : Rexp = ALTS(l.map(mon => SEQ(CHAR(mon._1),mon._2)).toList)
Chengsong
parents:
diff changeset
   937
  //def sigma(rs: Set[Rexp]) : Rexp = ALTS(rs.toList)
Chengsong
parents:
diff changeset
   938
  def o(r: Rexp) = if (nullable(r)) ONE else ZERO
Chengsong
parents:
diff changeset
   939
  //def nlf(t: Rexp) : Rexp = ALTS(List( o(t), sigma_lf(lf(t)) ))
Chengsong
parents:
diff changeset
   940
  def pdp(x: Char, r: Rexp) : Set[Rexp] = r match {
Chengsong
parents:
diff changeset
   941
    case ZERO => Set[Rexp]()
Chengsong
parents:
diff changeset
   942
    case ONE => Set[Rexp]()
Chengsong
parents:
diff changeset
   943
    case CHAR(f) => if(x == f) Set(ONE) else Set[Rexp]()
Chengsong
parents:
diff changeset
   944
    case ALTS(r1, r2) => pdp(x, r1) ++ pdp(x, r2)
Chengsong
parents:
diff changeset
   945
    case STAR(r1) => pdp(x, r).map(a => SEQ(a, STAR(r1)))
Chengsong
parents:
diff changeset
   946
    case SEQ(a0, b) => if(nullable(a0)) pdp(x, a0).map(a => SEQ(a, b)) ++ pdp(x, b) else pdp(x, a0).map(a => SEQ(a, b))
Chengsong
parents:
diff changeset
   947
  }
Chengsong
parents:
diff changeset
   948
  def pdps(s: List[Char], ts: Set[Rexp]): Set[Rexp] = s match {
Chengsong
parents:
diff changeset
   949
    case x::xs => pdps(xs, ts.foldLeft(Set[Rexp]())((acc, t) => acc ++ pder(x, t)))
Chengsong
parents:
diff changeset
   950
    case Nil => ts   
Chengsong
parents:
diff changeset
   951
  }
Chengsong
parents:
diff changeset
   952
  def pdpss(ss: List[List[Char]], t: Rexp): Set[Rexp] = ss.foldLeft( Set[Rexp]())((acc, s) => pdps(s, Set(t)) ++ acc)
Chengsong
parents:
diff changeset
   953
Chengsong
parents:
diff changeset
   954
Chengsong
parents:
diff changeset
   955
Chengsong
parents:
diff changeset
   956
def starPrint(r: Rexp) : Unit = r match {
Chengsong
parents:
diff changeset
   957
        
Chengsong
parents:
diff changeset
   958
          case SEQ(head, rstar) =>
Chengsong
parents:
diff changeset
   959
            println(shortRexpOutput(head) ++ "~STARREG")
Chengsong
parents:
diff changeset
   960
          case STAR(rstar) =>
Chengsong
parents:
diff changeset
   961
            println("STARREG")
Chengsong
parents:
diff changeset
   962
          case ALTS(r1, r2) =>  
Chengsong
parents:
diff changeset
   963
            println("(")
Chengsong
parents:
diff changeset
   964
            starPrint(r1)
Chengsong
parents:
diff changeset
   965
            println("+")
Chengsong
parents:
diff changeset
   966
            starPrint(r2)
Chengsong
parents:
diff changeset
   967
            println(")")
Chengsong
parents:
diff changeset
   968
          case ZERO => println("0")
Chengsong
parents:
diff changeset
   969
        
Chengsong
parents:
diff changeset
   970
      }
Chengsong
parents:
diff changeset
   971
Chengsong
parents:
diff changeset
   972
// @arg(doc = "small tests")
Chengsong
parents:
diff changeset
   973
val STARREG = //((( (STAR("aa")) | STAR("aaa") ).%).%)
Chengsong
parents:
diff changeset
   974
(((STAR("a") | ( STAR("aaa")) | STAR("aaaaa"| ( STAR("aaaaaaa")) | STAR("aaaaaaaaaaa"))).%).%).%
Chengsong
parents:
diff changeset
   975
Chengsong
parents:
diff changeset
   976
// @main
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   977
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   978
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
   979
431
Chengsong
parents:
diff changeset
   980
def small() = {
Chengsong
parents:
diff changeset
   981
Chengsong
parents:
diff changeset
   982
Chengsong
parents:
diff changeset
   983
//   println(lexing_simp(NOTREG, prog0))
Chengsong
parents:
diff changeset
   984
//   val v = lex_simp(NOTREG, prog0.toList)
Chengsong
parents:
diff changeset
   985
//   println(v)
Chengsong
parents:
diff changeset
   986
Chengsong
parents:
diff changeset
   987
//   val d =  (lex_simp(NOTREG, prog0.toList))
Chengsong
parents:
diff changeset
   988
//   println(d)
Chengsong
parents:
diff changeset
   989
  val pderSTAR = pderUNIV(STARREG)
Chengsong
parents:
diff changeset
   990
Chengsong
parents:
diff changeset
   991
  val refSize = pderSTAR.map(size(_)).sum
435
Chengsong
parents: 432
diff changeset
   992
  // println("different partial derivative terms:")
Chengsong
parents: 432
diff changeset
   993
  // pderSTAR.foreach(r => r match {
431
Chengsong
parents:
diff changeset
   994
      
435
Chengsong
parents: 432
diff changeset
   995
  //       case SEQ(head, rstar) =>
Chengsong
parents: 432
diff changeset
   996
  //         println(shortRexpOutput(head) ++ "~STARREG")
Chengsong
parents: 432
diff changeset
   997
  //       case STAR(rstar) =>
Chengsong
parents: 432
diff changeset
   998
  //         println("STARREG")
431
Chengsong
parents:
diff changeset
   999
      
435
Chengsong
parents: 432
diff changeset
  1000
  //   }
Chengsong
parents: 432
diff changeset
  1001
  //   )
Chengsong
parents: 432
diff changeset
  1002
  // println("the total number of terms is")
Chengsong
parents: 432
diff changeset
  1003
  // //println(refSize)
Chengsong
parents: 432
diff changeset
  1004
  // println(pderSTAR.size)
431
Chengsong
parents:
diff changeset
  1005
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1006
  // val A : Rexp= ("c" | (ONE | "b") ~ "d") ~((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1007
  // val B : Rexp = ((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1008
  // val C : Rexp = ("d") ~ ((ONE).%)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1009
  // val PRUNE_REG : Rexp = (C | B | A)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1010
  // val APRUNE_REG = internalise(PRUNE_REG)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1011
  // val program_solution = pruneRexp(APRUNE_REG, breakIntoTerms(PRUNE_REG))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1012
  // println("program executes and gives: as disired!")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1013
  // println(shortRexpOutput(erase(program_solution)))
435
Chengsong
parents: 432
diff changeset
  1014
  // val simpedPruneReg = strongBsimp(APRUNE_REG)
Chengsong
parents: 432
diff changeset
  1015
Chengsong
parents: 432
diff changeset
  1016
  // println(shortRexpOutput(erase(simpedPruneReg)))
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1017
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1018
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1019
  for(i <- List(1,2,3,4,10, 100, 400, 841, 900 ) ){// 100, 400, 800, 840, 841, 900
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1020
    val prog0 = "a" * i
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1021
    //println(s"test: $prog0")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1022
    println(s"testing with $i a's" )
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1023
    //val bd = bdersSimp(prog0, STARREG)//DB
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1024
    val sbd = bdersStrongRexp(prog0, STARREG)//strongDB
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1025
    starPrint(erase(sbd))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1026
    val subTerms = breakIntoTerms(erase(sbd))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1027
    //val subTermsLarge = breakIntoTerms(erase(bd))
431
Chengsong
parents:
diff changeset
  1028
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1029
    println(s"subterms of regex with strongDB: ${subTerms.length}")//, standard DB: ${subTermsLarge.length}")
431
Chengsong
parents:
diff changeset
  1030
Chengsong
parents:
diff changeset
  1031
Chengsong
parents:
diff changeset
  1032
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1033
    println("the number of distinct subterms for bsimp with strongDB")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1034
    println(subTerms.distinct.size)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1035
    //println(subTermsLarge.distinct.size)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1036
    if(pderSTAR.size > subTerms.length)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1037
      println(s"which is less than or equal to the number of PDER terms: ${pderSTAR.size}")
431
Chengsong
parents:
diff changeset
  1038
Chengsong
parents:
diff changeset
  1039
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1040
    // println(shortRexpOutput(erase(sbd)))
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1041
    // println(shortRexpOutput(erase(bd)))
431
Chengsong
parents:
diff changeset
  1042
    
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1043
    println("pdersize, original, strongSimp")
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1044
    println(refSize, size(STARREG),  asize(sbd))
431
Chengsong
parents:
diff changeset
  1045
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1046
    //val vres = strong_blexing_simp( STARREG, prog0)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1047
    //println(vres)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1048
  }
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1049
  // println(vs.length)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1050
  // println(vs)
431
Chengsong
parents:
diff changeset
  1051
   
Chengsong
parents:
diff changeset
  1052
Chengsong
parents:
diff changeset
  1053
  // val prog1 = """read  n; write n"""  
Chengsong
parents:
diff changeset
  1054
  // println(s"test: $prog1")
Chengsong
parents:
diff changeset
  1055
  // println(lexing_simp(WHILE_REGS, prog1))
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1056
  // val display = ("a"| "ab").%
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1057
  // val adisplay = internalise(display)
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1058
  // bders_simp( "aaaaa".toList, adisplay)
431
Chengsong
parents:
diff changeset
  1059
}
Chengsong
parents:
diff changeset
  1060
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1061
def generator_test() {
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1062
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1063
  // test(rexp(7), 1000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1064
  //   val ss = stringsFromRexp(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1065
  //   val boolList = ss.map(s => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1066
  //     val simpVal = simpBlexer(r, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1067
  //     val strongVal = strongBlexer(r, s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1068
  //     // println(simpVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1069
  //     // println(strongVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1070
  //     (simpVal == strongVal) && (simpVal != None) 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1071
  //   })
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1072
  //   !boolList.exists(b => b == false)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1073
  // }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1074
  // test(single(STAR(ALTS(STAR(CHAR('c')),ALTS(CHAR('c'),ZERO)))), 100000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1075
  //   val ss = stringsFromRexp(r)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1076
  //   val boolList = ss.map(s => {
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1077
  //     val bdStrong = bdersStrong(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1078
  //     val bdStrong5 = bdersStrong5(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1079
  //     // println(shortRexpOutput(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1080
  //     // println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1081
  //     // println(strongVal)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1082
  //     // println(strongVal5)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1083
  //     // (strongVal == strongVal5) 
493
Chengsong
parents: 492
diff changeset
  1084
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1085
  //     if(asize(bdStrong5) > asize(bdStrong)){
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1086
  //       println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1087
  //       println(shortRexpOutput(erase(bdStrong5)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1088
  //       println(shortRexpOutput(erase(bdStrong)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1089
  //     }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1090
  //     asize(bdStrong5) <= asize(bdStrong)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1091
  //   })
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1092
  //   !boolList.exists(b => b == false)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1093
  // }
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1094
  //test(rexp(3), 10000000) { (r: Rexp) => 
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1095
  test(single(STAR(SEQ(SEQ(ALTS(CHAR('b'),STAR(CHAR('b'))),CHAR('b')),ALTS(ALTS(STAR(CHAR('c')),SEQ(CHAR('a'),CHAR('c'))),ALTS(ZERO,ONE))))), 1) {(r: Rexp) =>
493
Chengsong
parents: 492
diff changeset
  1096
    val ss = stringsFromRexp(r)
Chengsong
parents: 492
diff changeset
  1097
    val boolList = ss.map(s => {
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1098
      val bdStrong = bdersStrong(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1099
      val bdStrong5 = bdersStrong5(s.toList, internalise(r))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1100
      val size5 = asize(bdStrong5)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1101
      val size0 = asize(bdStrong)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1102
      println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1103
      println(shortRexpOutput(erase(bdStrong5)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1104
      println(shortRexpOutput(erase(bdStrong)))
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1105
      println(size5, size0)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1106
      // println(s)
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1107
      size5 <= size0
493
Chengsong
parents: 492
diff changeset
  1108
    })
494
c730d018ebfa blexer2
Chengsong
parents: 493
diff changeset
  1109
    // println(boolList)
493
Chengsong
parents: 492
diff changeset
  1110
    !boolList.exists(b => b == false)
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1111
  }
493
Chengsong
parents: 492
diff changeset
  1112
Chengsong
parents: 492
diff changeset
  1113
492
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1114
}
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1115
// small()
61eff2abb0b6 problem with erase
Chengsong
parents: 435
diff changeset
  1116
generator_test()
493
Chengsong
parents: 492
diff changeset
  1117
Chengsong
parents: 492
diff changeset
  1118
1
Chengsong
parents: 492
diff changeset
  1119
Chengsong
parents: 492
diff changeset
  1120
SEQ(SEQ(SEQ(ONE,CHAR('b')),STAR(CHAR('b'))),
Chengsong
parents: 492
diff changeset
  1121
SEQ(ALTS(ALTS(ZERO,STAR(CHAR('b'))),
Chengsong
parents: 492
diff changeset
  1122
STAR(ALTS(CHAR('a'),SEQ(SEQ(STAR(ALTS(STAR(CHAR('c')),CHAR('a'))),
Chengsong
parents: 492
diff changeset
  1123
SEQ(CHAR('a'),SEQ(ALTS(CHAR('b'),ZERO),SEQ(ONE,CHAR('b'))))),ONE)))),ONE))
Chengsong
parents: 492
diff changeset
  1124
Chengsong
parents: 492
diff changeset
  1125
Chengsong
parents: 492
diff changeset
  1126
// Sequ(Sequ(Sequ(Empty,Chr(b)),Stars(List(Chr(b), Chr(b)))),Sequ(Right(Stars(List(Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty)), Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty))))),Empty))
Chengsong
parents: 492
diff changeset
  1127
// Sequ(Sequ(Sequ(Empty,Chr(b)),Stars(List(Chr(b), Chr(b)))),Sequ(Right(Stars(List(Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty)), Right(Sequ(Sequ(Stars(List(Right(Chr(a)), Right(Chr(a)))),Sequ(Chr(a),Sequ(Left(Chr(b)),Sequ(Empty,Chr(b))))),Empty))))),Empty))