progs/automata/der.sc
author Christian Urban <christian.urban@kcl.ac.uk>
Mon, 22 Nov 2021 11:35:38 +0000
changeset 851 2918388fe4ab
parent 784 3bc2c370c2e3
child 1007 5ebe843c1184
permissions -rw-r--r--
updated
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
784
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
     1
// Another automaton construction
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
     2
//================================
733
4d37ccc8c5be updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 586
diff changeset
     3
4d37ccc8c5be updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 586
diff changeset
     4
import $file.dfa, dfa._ 
487
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
     5
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
     6
// regular expressions
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
     7
abstract class Rexp
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
     8
case object ZERO extends Rexp                    // matches nothing
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
     9
case object ONE extends Rexp                     // matches the empty string
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    10
case class CHAR(c: Char) extends Rexp            // matches a character c
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    11
case class ALT(r1: Rexp, r2: Rexp) extends Rexp  // alternative
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    12
case class SEQ(r1: Rexp, r2: Rexp) extends Rexp  // sequence
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    13
case class STAR(r: Rexp) extends Rexp            // star
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    14
784
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    15
// the nullable function: tests whether the regular 
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    16
// expression can recognise the empty string
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    17
def nullable (r: Rexp) : Boolean = r match {
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    18
  case ZERO => false
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    19
  case ONE => true
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    20
  case CHAR(_) => false
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    21
  case ALT(r1, r2) => nullable(r1) || nullable(r2)
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    22
  case SEQ(r1, r2) => nullable(r1) && nullable(r2)
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    23
  case STAR(_) => true
486
3cc1799daf08 updated
Christian Urban <urbanc@in.tum.de>
parents:
diff changeset
    24
}
487
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    25
784
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    26
// the derivative of a regular expression w.r.t. a character
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    27
def der (c: Char, r: Rexp) : Rexp = r match {
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    28
  case ZERO => ZERO
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    29
  case ONE => ZERO
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    30
  case CHAR(d) => if (c == d) ONE else ZERO
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    31
  case ALT(r1, r2) => ALT(der(c, r1), der(c, r2))
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    32
  case SEQ(r1, r2) => 
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    33
    if (nullable(r1)) ALT(SEQ(der(c, r1), r2), der(c, r2))
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    34
    else SEQ(der(c, r1), r2)
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    35
  case STAR(r1) => SEQ(der(c, r1), STAR(r1))
487
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    36
}
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    37
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    38
784
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    39
def flaw(r: Rexp) : DFA[Rexp, Char] = {
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    40
  DFA(r, 
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    41
      { case (r, c) => der(c, r) }, 
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    42
      nullable(_))
488
057b4603b940 updated
Christian Urban <urbanc@in.tum.de>
parents: 487
diff changeset
    43
}
487
ffbc65112d48 updated
Christian Urban <urbanc@in.tum.de>
parents: 486
diff changeset
    44
784
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    45
val r = STAR(CHAR('a'))
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    46
val pseudo = flaw(r)
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    47
println(pseudo.accepts("".toList))    // true
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    48
println(pseudo.accepts("a".toList))   // true
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    49
println(pseudo.accepts("aa".toList))  // true
3bc2c370c2e3 updated
Christian Urban <christian.urban@kcl.ac.uk>
parents: 779
diff changeset
    50
println(pseudo.accepts("bb".toList))  // false