| author | Christian Urban <christian.urban@kcl.ac.uk> | 
| Sun, 19 Oct 2025 09:51:35 +0200 | |
| changeset 1012 | c01dfa3ff177 | 
| parent 981 | 14e5ae1fb541 | 
| permissions | -rw-r--r-- | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 1 | theory Matcher | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 2 | imports "Main" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 3 | begin | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 4 | |
| 208 
bd5a8a6b3871
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
167diff
changeset | 5 | |
| 882 | 6 | section \<open>Regular Expressions\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 7 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 8 | datatype rexp = | 
| 495 | 9 | ZERO | 
| 10 | | ONE | |
| 882 | 11 | | CH char | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 12 | | SEQ rexp rexp | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 13 | | ALT rexp rexp | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 14 | | STAR rexp | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 15 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 16 | |
| 882 | 17 | section \<open>Sequential Composition of Sets of Strings\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 18 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 19 | definition | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 20 |   Seq :: "string set \<Rightarrow> string set \<Rightarrow> string set" ("_ ;; _" [100,100] 100)
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 21 | where | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 22 |   "A ;; B = {s1 @ s2 | s1 s2. s1 \<in> A \<and> s2 \<in> B}"
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 23 | |
| 882 | 24 | text \<open>Two Simple Properties about Sequential Composition\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 25 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 26 | lemma seq_empty [simp]: | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 27 |   shows "A ;; {[]} = A"
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 28 |   and   "{[]} ;; A = A"
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 29 | by (simp_all add: Seq_def) | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 30 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 31 | lemma seq_null [simp]: | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 32 |   shows "A ;; {} = {}"
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 33 |   and   "{} ;; A = {}"
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 34 | by (simp_all add: Seq_def) | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 35 | |
| 882 | 36 | section \<open>Kleene Star for Sets\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 37 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 38 | inductive_set | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 39 |   Star :: "string set \<Rightarrow> string set" ("_\<star>" [101] 102)
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 40 | for A :: "string set" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 41 | where | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 42 | start[intro]: "[] \<in> A\<star>" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 43 | | step[intro]: "\<lbrakk>s1 \<in> A; s2 \<in> A\<star>\<rbrakk> \<Longrightarrow> s1 @ s2 \<in> A\<star>" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 44 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 45 | |
| 882 | 46 | text \<open>A Standard Property of Star\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 47 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 48 | lemma star_cases: | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 49 |   shows "A\<star> = {[]} \<union> A ;; A\<star>"
 | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 50 | unfolding Seq_def | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 51 | by (auto) (metis Star.simps) | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 52 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 53 | lemma star_decomp: | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 54 | assumes a: "c # x \<in> A\<star>" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 55 | shows "\<exists>a b. x = a @ b \<and> c # a \<in> A \<and> b \<in> A\<star>" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 56 | using a | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 57 | by (induct x\<equiv>"c # x" rule: Star.induct) | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 58 | (auto simp add: append_eq_Cons_conv) | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 59 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 60 | |
| 882 | 61 | section \<open>Meaning of Regular Expressions\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 62 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 63 | fun | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 64 | L :: "rexp \<Rightarrow> string set" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 65 | where | 
| 495 | 66 |   "L (ZERO) = {}"
 | 
| 67 | | "L (ONE) = {[]}"
 | |
| 882 | 68 | | "L (CH c) = {[c]}"
 | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 69 | | "L (SEQ r1 r2) = (L r1) ;; (L r2)" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 70 | | "L (ALT r1 r2) = (L r1) \<union> (L r2)" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 71 | | "L (STAR r) = (L r)\<star>" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 72 | |
| 882 | 73 | section \<open>The Matcher\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 74 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 75 | fun | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 76 | nullable :: "rexp \<Rightarrow> bool" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 77 | where | 
| 495 | 78 | "nullable (ZERO) = False" | 
| 79 | | "nullable (ONE) = True" | |
| 882 | 80 | | "nullable (CH c) = False" | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 81 | | "nullable (ALT r1 r2) = (nullable r1 \<or> nullable r2)" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 82 | | "nullable (SEQ r1 r2) = (nullable r1 \<and> nullable r2)" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 83 | | "nullable (STAR r) = True" | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 84 | |
| 208 
bd5a8a6b3871
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
167diff
changeset | 85 | |
| 882 | 86 | section \<open>Correctness Proof for Nullable\<close> | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 87 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 88 | lemma nullable_correctness: | 
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 89 | shows "nullable r \<longleftrightarrow> [] \<in> (L r)" | 
| 208 
bd5a8a6b3871
added
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: 
167diff
changeset | 90 | apply(induct r) | 
| 495 | 91 | (* ZERO case *) | 
| 92 | apply(simp only: nullable.simps) | |
| 93 | apply(simp only: L.simps) | |
| 94 | apply(simp) | |
| 95 | (* ONE case *) | |
| 96 | apply(simp only: nullable.simps) | |
| 97 | apply(simp only: L.simps) | |
| 98 | apply(simp) | |
| 99 | (* CHAR case *) | |
| 100 | apply(simp only: nullable.simps) | |
| 101 | apply(simp only: L.simps) | |
| 102 | apply(simp) | |
| 103 | prefer 2 | |
| 104 | (* ALT case *) | |
| 105 | apply(simp (no_asm) only: nullable.simps) | |
| 106 | apply(simp only:) | |
| 107 | apply(simp only: L.simps) | |
| 108 | apply(simp) | |
| 109 | (* SEQ case *) | |
| 981 | 110 | apply(simp only: L.simps) | 
| 111 | apply(simp) | |
| 495 | 112 | oops | 
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 113 | |
| 495 | 114 | lemma nullable_correctness: | 
| 115 | shows "nullable r \<longleftrightarrow> [] \<in> (L r)" | |
| 116 | apply(induct r) | |
| 117 | apply(simp_all) | |
| 118 | (* all easy subgoals are proved except the last 2 *) | |
| 119 | (* where the definition of Seq needs to be unfolded. *) | |
| 120 | oops | |
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 121 | |
| 495 | 122 | lemma nullable_correctness: | 
| 123 | shows "nullable r \<longleftrightarrow> [] \<in> (L r)" | |
| 124 | apply(induct r) | |
| 125 | apply(simp_all add: Seq_def) | |
| 126 | (* except the star case every thing is proved *) | |
| 127 | (* we need to use the rule for Star.start *) | |
| 128 | oops | |
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 129 | |
| 495 | 130 | lemma nullable_correctness: | 
| 131 | shows "nullable r \<longleftrightarrow> [] \<in> (L r)" | |
| 132 | apply(induct r) | |
| 133 | apply(simp_all add: Seq_def Star.start) | |
| 134 | done | |
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 135 | |
| 882 | 136 | section \<open>Derivative Operation\<close> | 
| 137 | ||
| 138 | fun der :: "char \<Rightarrow> rexp \<Rightarrow> rexp" | |
| 139 | where | |
| 140 | "der c (ZERO) = ZERO" | |
| 141 | | "der c (ONE) = ZERO" | |
| 142 | | "der c (CH d) = (if c = d then ONE else ZERO)" | |
| 143 | | "der c (ALT r1 r2) = ALT (der c r1) (der c r2)" | |
| 144 | | "der c (SEQ r1 r2) = (if nullable r1 then ALT (SEQ (der c r1) r2) (der c r2) | |
| 145 | else SEQ (der c r1) r2)" | |
| 146 | | "der c (STAR r) = SEQ (der c r) (STAR r)" | |
| 147 | ||
| 148 | fun | |
| 149 | ders :: "string \<Rightarrow> rexp \<Rightarrow> rexp" | |
| 150 | where | |
| 151 | "ders [] r = r" | |
| 152 | | "ders (c # s) r = ders s (der c r)" | |
| 153 | ||
| 154 | fun | |
| 155 | matcher :: "rexp \<Rightarrow> string \<Rightarrow> bool" | |
| 156 | where | |
| 157 | "matcher r s = nullable (ders s r)" | |
| 158 | ||
| 159 | definition | |
| 160 | Der :: "char \<Rightarrow> string set \<Rightarrow> string set" | |
| 161 | where | |
| 162 |   "Der c A \<equiv> {s. [c] @ s \<in> A}"
 | |
| 163 | ||
| 164 | lemma Der_null [simp]: | |
| 165 |   shows "Der c {} = {}"
 | |
| 166 | unfolding Der_def | |
| 167 | by auto | |
| 168 | ||
| 169 | lemma Der_empty [simp]: | |
| 170 |   shows "Der c {[]} = {}"
 | |
| 171 | unfolding Der_def | |
| 172 | by auto | |
| 173 | ||
| 174 | lemma Der_char [simp]: | |
| 175 |   shows "Der c {[d]} = (if c = d then {[]} else {})"
 | |
| 176 | unfolding Der_def | |
| 177 | by auto | |
| 178 | ||
| 179 | lemma Der_union [simp]: | |
| 180 | shows "Der c (A \<union> B) = Der c A \<union> Der c B" | |
| 181 | unfolding Der_def | |
| 182 | by auto | |
| 183 | ||
| 184 | lemma Der_insert_nil [simp]: | |
| 185 | shows "Der c (insert [] A) = Der c A" | |
| 186 | unfolding Der_def | |
| 187 | by auto | |
| 188 | ||
| 189 | lemma Der_seq [simp]: | |
| 190 |   shows "Der c (A ;; B) = (Der c A) ;; B \<union> (if [] \<in> A then Der c B else {})"
 | |
| 191 | unfolding Der_def Seq_def | |
| 192 | by (auto simp add: Cons_eq_append_conv) | |
| 193 | ||
| 194 | lemma Der_star [simp]: | |
| 195 | shows "Der c (A\<star>) = (Der c A) ;; A\<star>" | |
| 196 | proof - | |
| 197 |   have "Der c (A\<star>) = Der c ({[]} \<union> A ;; A\<star>)"
 | |
| 198 | by (simp only: star_cases[symmetric]) | |
| 199 | also have "... = Der c (A ;; A\<star>)" | |
| 200 | by (simp only: Der_union Der_empty) (simp) | |
| 201 |   also have "... = (Der c A) ;; A\<star> \<union> (if [] \<in> A then Der c (A\<star>) else {})"
 | |
| 202 | by simp | |
| 203 | also have "... = (Der c A) ;; A\<star>" | |
| 204 | unfolding Seq_def Der_def | |
| 205 | by (auto dest: star_decomp) | |
| 206 | finally show "Der c (A\<star>) = (Der c A) ;; A\<star>" . | |
| 207 | qed | |
| 208 | ||
| 209 | lemma der_correctness: | |
| 210 | shows "L (der c r) = Der c (L r)" | |
| 211 | apply(induct rule: der.induct) | |
| 212 | apply(auto simp add: nullable_correctness) | |
| 213 | done | |
| 214 | ||
| 215 | ||
| 216 | lemma matcher_correctness: | |
| 217 | shows "matcher r s \<longleftrightarrow> s \<in> L r" | |
| 218 | by (induct s arbitrary: r) | |
| 219 | (simp_all add: nullable_correctness der_correctness Der_def) | |
| 220 | ||
| 221 | ||
| 167 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 222 | |
| 
cfba674a8fdf
added matcher
 Christian Urban <christian dot urban at kcl dot ac dot uk> parents: diff
changeset | 223 | end |