regexp: comparison Myhill.thy

equal deleted inserted replaced

-:a1268fb0deea
+:a59473f0229d
 *)
 section {* Preliminary definitions *}
-text {* Sequential composition of two languages @{text "L1"} and @{text "L2"} *}
+types lang = "string set"
-definition Seq :: "string set \<Rightarrow> string set \<Rightarrow> string set" ("_ ;; _" [100,100] 100)
+text {*
+Sequential composition of two languages @{text "L1"} and @{text "L2"}
+*}
+definition Seq :: "lang \<Rightarrow> lang \<Rightarrow> lang" ("_ ;; _" [100,100] 100)
 where
 "L1 ;; L2 = {s1 @ s2 | s1 s2. s1 \<in> L1 \<and> s2 \<in> L2}"
 text {* Transitive closure of language @{text "L"}. *}
 inductive_set
 by simp
 text {*
 @{text "\<approx>L"} is an equivalent class defined by language @{text "Lang"}.
 *}
 definition
-str_eq_rel ("\<approx>_")
+str_eq_rel ("\<approx>_" [100] 100)
 where
 "\<approx>Lang \<equiv> {(x, y).  (\<forall>z. x @ z \<in> Lang \<longleftrightarrow> y @ z \<in> Lang)}"
 text {*
 Among equivlant clases of @{text "\<approx>Lang"}, the set @{text "finals(Lang)"} singles out
 next
 show "\<Union> (finals Lang) \<subseteq> Lang"
 apply (clarsimp simp:finals_def str_eq_rel_def)
 by (drule_tac x = "[]" in spec, auto)
 qed
 section {* Direction @{text "finite partition \<Rightarrow> regular language"}*}
 text {*
 The relationship between equivalent classes can be described by an
 using f_prop rs_def finals_in_partitions[of "Lang"] by auto
 qed
 finally show ?thesis by blast
 qed
-section {* Direction: @{text "regular language \<Rightarrow>finite partition"} *}
+section {* Direction: @{text "regular language \<Rightarrow> finite partitions"} *}
 subsection {* The scheme for this direction *}
 text {*
 The following convenient notation @{text "x \<approx>Lang y"} means:
 str_eq ("_ \<approx>_ _")
 where
 "x \<approx>Lang y \<equiv> (x, y) \<in> (\<approx>Lang)"
 text {*
-The very basic scheme to show the finiteness of the partion generated by a language @{text "Lang"}
+The very basic scheme to show the finiteness of the partion generated by a
-is by attaching tags to every string. The set of tags are carfully choosen to make it finite.
+language @{text "Lang"} is by attaching tags to every string. The set of
-If it can be proved that strings with the same tag are equivlent with respect @{text "Lang"},
+tags are carefully choosen to make it finite.  If it can be proved that
-then the partition given rise by @{text "Lang"} must be finite. The reason for this is a lemma
+strings with the same tag are equivlent with respect @{text "Lang"}, then
-in standard library (@{text "finite_imageD"}), which says: if the image of an injective
+the partition given rise by @{text "Lang"} must be finite. The reason for
-function on a set @{text "A"} is finite, then @{text "A"} is finite. It can be shown that
+this is a lemma in standard library (@{text "finite_imageD"}), which says:
-the function obtained by llifting @{text "tag"}
+if the image of an injective function on a set @{text "A"} is finite, then
-to the level of equalent classes (i.e. @{text "((op `) tag)"}) is injective
+@{text "A"} is finite. It can be shown that the function obtained by
-(by lemma @{text "tag_image_injI"}) and the image of this function is finite
+lifting @{text "tag"} to the level of equivalence classes (i.e. @{text "((op
-(with the help of lemma @{text "finite_tag_imageI"}). This argument is formalized
+`) tag)"}) is injective (by lemma @{text "tag_image_injI"}) and the image of
-by the following lemma @{text "tag_finite_imageD"}.
+this function is finite (with the help of lemma @{text
-*}
+"finite_tag_imageI"}). This argument is formalized by the following lemma
+@{text "tag_finite_imageD"}.
+{\bf
+Theorems @{text "tag_image_injI"} and @{text
+"finite_tag_imageI"} do not exist. Can this comment be deleted?
+\marginpar{\bf COMMENT}
+}
+*}
 lemma tag_finite_imageD:
-assumes str_inj: "\<And> m n. tag m = tag (n::string) \<Longrightarrow> m \<approx>lang n"
+fixes L1::"lang"
+assumes str_inj: "\<And> m n. tag m = tag n \<Longrightarrow> m \<approx>L1 n"
 and range: "finite (range tag)"
-shows "finite (UNIV // (\<approx>lang))"
+shows "finite (UNIV // \<approx>L1)"
 proof (rule_tac f = "(op `) tag" in finite_imageD)
-show "finite (op ` tag ` UNIV // \<approx>lang)" using range
+show "finite (op ` tag ` UNIV // \<approx>L1)" using range
 apply (rule_tac B = "Pow (tag ` UNIV)" in finite_subset)
 by (auto simp add:image_def Pow_def)
 next
-show "inj_on (op ` tag) (UNIV // \<approx>lang)"
+show "inj_on (op ` tag) (UNIV // \<approx>L1)"
 proof-
 { fix X Y
-assume X_in: "X \<in> UNIV // \<approx>lang"
+assume X_in: "X \<in> UNIV // \<approx>L1"
-and  Y_in: "Y \<in> UNIV // \<approx>lang"
+and  Y_in: "Y \<in> UNIV // \<approx>L1"
 and  tag_eq: "tag ` X = tag ` Y"
 then obtain x y where "x \<in> X" and "y \<in> Y" and "tag x = tag y"
 unfolding quotient_def Image_def str_eq_rel_def str_eq_def image_def
 apply simp by blast
 with X_in Y_in str_inj[of x y]
 qed
 subsection {* Lemmas for basic cases *}
 text {*
-The the final result of this direction is in @{text "easier_direction"}, which
+The the final result of this direction is in @{text "rexp_imp_finite"},
-is an induction on the structure of regular expressions. There is one case
+which is an induction on the structure of regular expressions. There is one
-for each regular expression operator. For basic operators such as @{text "NULL, EMPTY, CHAR c"},
+case for each regular expression operator. For basic operators such as
-the finiteness of their language partition can be established directly with no need
+@{const NULL}, @{const EMPTY}, @{const CHAR}, the finiteness of their
-of taggiing. This section contains several technical lemma for these base cases.
+language partition can be established directly with no need of tagging.
+This section contains several technical lemma for these base cases.
-The inductive cases involve operators @{text "ALT, SEQ"} and @{text "STAR"}.
-Tagging functions need to be defined individually for each of them. There will be one
+The inductive cases involve operators @{const ALT}, @{const SEQ} and @{const
-dedicated section for each of these cases, and each section goes virtually the same way:
+STAR}. Tagging functions need to be defined individually for each of
-gives definition of the tagging function and prove that strings
+them. There will be one dedicated section for each of these cases, and each
-with the same tag are equivalent.
+section goes virtually the same way: gives definition of the tagging
-*}
+function and prove that strings with the same tag are equivalent.
+*}
+subsection {* The case for @{const "NULL"} *}
+lemma quot_null_eq:
+shows "(UNIV // \<approx>{}) = ({UNIV}::lang set)"
+unfolding quotient_def Image_def str_eq_rel_def by auto
+lemma quot_null_finiteI [intro]:
+shows "finite ((UNIV // \<approx>{})::lang set)"
+unfolding quot_null_eq by simp
+subsection {* The case for @{const "EMPTY"} *}
 lemma quot_empty_subset:
 "UNIV // (\<approx>{[]}) \<subseteq> {{[]}, UNIV - {[]}}"
 proof
 fix x
 assume "x \<in> UNIV // \<approx>{[]}"
 then obtain y where h: "x = {z. (y, z) \<in> \<approx>{[]}}"
 unfolding quotient_def Image_def by blast
 show "x \<in> {{[]}, UNIV - {[]}}"
 proof (cases "y = []")
 case True with h
-have "x = {[]}" by (auto simp:str_eq_rel_def)
+have "x = {[]}" by (auto simp: str_eq_rel_def)
 thus ?thesis by simp
 next
 case False with h
-have "x = UNIV - {[]}" by (auto simp:str_eq_rel_def)
+have "x = UNIV - {[]}" by (auto simp: str_eq_rel_def)
 thus ?thesis by simp
 qed
 qed
+lemma quot_empty_finiteI [intro]:
+shows "finite (UNIV // (\<approx>{[]}))"
+by (rule finite_subset[OF quot_empty_subset]) (simp)
+subsection {* The case for @{const "CHAR"} *}
 lemma quot_char_subset:
 "UNIV // (\<approx>{[c]}) \<subseteq> {{[]},{[c]}, UNIV - {[], [c]}}"
 proof
 fix x
 by (auto simp add:str_eq_rel_def)
 } ultimately show ?thesis by blast
 qed
 qed
-subsection {* The case for @{text "SEQ"}*}
+lemma quot_char_finiteI [intro]:
+shows "finite (UNIV // (\<approx>{[c]}))"
+by (rule finite_subset[OF quot_char_subset]) (simp)
+subsection {* The case for @{const "SEQ"}*}
 definition
 "tag_str_SEQ L\<^isub>1 L\<^isub>2 x \<equiv>
 ((\<approx>L\<^isub>1) `` {x}, {(\<approx>L\<^isub>2) `` {x - xa}| xa.  xa \<le> x \<and> xa \<in> L\<^isub>1})"
 qed
 } thus "tag_str_SEQ L\<^isub>1 L\<^isub>2 m = tag_str_SEQ L\<^isub>1 L\<^isub>2 n \<Longrightarrow> m \<approx>(L\<^isub>1 ;; L\<^isub>2) n"
 by (auto simp add: str_eq_def str_eq_rel_def)
 qed
-lemma quot_seq_finiteI:
+lemma quot_seq_finiteI [intro]:
 "\<lbrakk>finite (UNIV // \<approx>L\<^isub>1); finite (UNIV // \<approx>L\<^isub>2)\<rbrakk>
 \<Longrightarrow> finite (UNIV // \<approx>(L\<^isub>1 ;; L\<^isub>2))"
 apply (rule_tac tag = "tag_str_SEQ L\<^isub>1 L\<^isub>2" in tag_finite_imageD)
 by (auto intro:tag_str_SEQ_injI elim:tag_str_seq_range_finite)
-subsection {* The case for @{text "ALT"} *}
+subsection {* The case for @{const "ALT"} *}
 definition
-"tag_str_ALT L\<^isub>1 L\<^isub>2 (x::string) \<equiv> ((\<approx>L\<^isub>1) `` {x}, (\<approx>L\<^isub>2) `` {x})"
+tag_str_ALT :: "lang \<Rightarrow> lang \<Rightarrow> string \<Rightarrow> (lang \<times> lang)"
+where
-lemma quot_union_finiteI:
+"tag_str_ALT L1 L2 = (\<lambda>x. (\<approx>L1 `` {x}, \<approx>L2 `` {x}))"
-assumes finite1: "finite (UNIV // \<approx>(L\<^isub>1::string set))"
-and finite2: "finite (UNIV // \<approx>L\<^isub>2)"
-shows "finite (UNIV // \<approx>(L\<^isub>1 \<union> L\<^isub>2))"
+lemma quot_union_finiteI [intro]:
-proof (rule_tac tag = "tag_str_ALT L\<^isub>1 L\<^isub>2" in tag_finite_imageD)
+fixes L1 L2::"lang"
-show "\<And>m n. tag_str_ALT L\<^isub>1 L\<^isub>2 m = tag_str_ALT L\<^isub>1 L\<^isub>2 n \<Longrightarrow> m \<approx>(L\<^isub>1 \<union> L\<^isub>2) n"
+assumes finite1: "finite (UNIV // \<approx>L1)"
-unfolding tag_str_ALT_def str_eq_def Image_def str_eq_rel_def by auto
+and     finite2: "finite (UNIV // \<approx>L2)"
+shows "finite (UNIV // \<approx>(L1 \<union> L2))"
+proof (rule_tac tag = "tag_str_ALT L1 L2" in tag_finite_imageD)
+show "\<And>x y. tag_str_ALT L1 L2 x = tag_str_ALT L1 L2 y \<Longrightarrow> x \<approx>(L1 \<union> L2) y"
+unfolding tag_str_ALT_def
+unfolding str_eq_def
+unfolding Image_def
+unfolding str_eq_rel_def
+by auto
 next
-show "finite (range (tag_str_ALT L\<^isub>1 L\<^isub>2))" using finite1 finite2
+have *: "finite ((UNIV // \<approx>L1) \<times> (UNIV // \<approx>L2))" using finite1 finite2 by auto
-apply (rule_tac B = "(UNIV // \<approx>L\<^isub>1) \<times> (UNIV // \<approx>L\<^isub>2)" in finite_subset)
+show "finite (range (tag_str_ALT L1 L2))"
-by (auto simp:tag_str_ALT_def Image_def quotient_def)
+unfolding tag_str_ALT_def
-qed
+apply(rule finite_subset[OF _ *])
+unfolding quotient_def
-subsection {*
+by auto
-The case for @{text "STAR"}
+qed
-*}
+subsection {* The case for @{const "STAR"} *}
 text {*
 This turned out to be the trickiest case.
 *} (* I will make some illustrations for it. *)
 qed
 } thus "tag_str_STAR L\<^isub>1 m = tag_str_STAR L\<^isub>1 n \<Longrightarrow> m \<approx>(L\<^isub>1\<star>) n"
 by (auto simp add:str_eq_def str_eq_rel_def)
 qed
-lemma quot_star_finiteI:
+lemma quot_star_finiteI [intro]:
 "finite (UNIV // \<approx>L\<^isub>1) \<Longrightarrow> finite (UNIV // \<approx>(L\<^isub>1\<star>))"
 apply (rule_tac tag = "tag_str_STAR L\<^isub>1" in tag_finite_imageD)
 by (auto intro:tag_str_STAR_injI elim:tag_str_star_range_finite)
-subsection {*
-The main lemma
+subsection {* The main lemma *}
-*}
+lemma rexp_imp_finite:
-lemma easier_directio\<nu>:
+fixes r::"rexp"
-"Lang = L (r::rexp) \<Longrightarrow> finite (UNIV // (\<approx>Lang))"
+shows "finite (UNIV // \<approx>(L r))"
-proof (induct arbitrary:Lang rule:rexp.induct)
+by (induct r) (auto)
-case NULL
-have "UNIV // (\<approx>{}) \<subseteq> {UNIV} "
-by (auto simp:quotient_def str_eq_rel_def str_eq_def)
-with prems show "?case" by (auto intro:finite_subset)
-next
-case EMPTY
-have "UNIV // (\<approx>{[]}) \<subseteq> {{[]}, UNIV - {[]}}"
-by (rule quot_empty_subset)
-with prems show ?case by (auto intro:finite_subset)
-next
-case (CHAR c)
-have "UNIV // (\<approx>{[c]}) \<subseteq> {{[]},{[c]}, UNIV - {[], [c]}}"
-by (rule quot_char_subset)
-with prems show ?case by (auto intro:finite_subset)
-next
-case (SEQ r\<^isub>1 r\<^isub>2)
-have "\<lbrakk>finite (UNIV // \<approx>(L r\<^isub>1)); finite (UNIV // \<approx>(L r\<^isub>2))\<rbrakk>
-\<Longrightarrow> finite (UNIV // \<approx>(L r\<^isub>1 ;; L r\<^isub>2))"
-by (erule quot_seq_finiteI, simp)
-with prems show ?case by simp
-next
-case (ALT r\<^isub>1 r\<^isub>2)
-have "\<lbrakk>finite (UNIV // \<approx>(L r\<^isub>1)); finite (UNIV // \<approx>(L r\<^isub>2))\<rbrakk>
-\<Longrightarrow> finite (UNIV // \<approx>(L r\<^isub>1 \<union> L r\<^isub>2))"
-by (erule quot_union_finiteI, simp)
-with prems show ?case by simp
-next
-case (STAR r)
-have "finite (UNIV // \<approx>(L r))
-\<Longrightarrow> finite (UNIV // \<approx>((L r)\<star>))"
-by (erule quot_star_finiteI)
-with prems show ?case by simp
-qed
 end

changeset 39	a59473f0229d
parent 35	d2ddce8b36fd
child 40	50d00d7dc413