regexp: comparison Myhill.thy

equal deleted inserted replaced

-:28d70591042a
+:bea2466a6084
 string @{text "x"} and @{text "y"} are equivalent with respect to
 language @{text "Lang"}.
 *}
 definition
-str_eq ("_ \<approx>_ _")
+str_eq :: "string \<Rightarrow> lang \<Rightarrow> string \<Rightarrow> bool" ("_ \<approx>_ _")
 where
 "x \<approx>Lang y \<equiv> (x, y) \<in> (\<approx>Lang)"
 text {*
 The basic idea to show the finiteness of the partition induced by relation @{text "\<approx>Lang"}
 qed
 qed
 subsection {* Lemmas for basic cases *}
-text {*
+subsection {* The case for @{const "NULL"} *}
-The the final result of this direction is in @{text "easier_direction"}, which
-is an induction on the structure of regular expressions. There is one case
+lemma quot_null_eq:
-for each regular expression operator. For basic operators such as @{text "NULL, EMPTY, CHAR c"},
+shows "(UNIV // \<approx>{}) = ({UNIV}::lang set)"
-the finiteness of their language partition can be established directly with no need
+unfolding quotient_def Image_def str_eq_rel_def by auto
-of taggiing. This section contains several technical lemma for these base cases.
+lemma quot_null_finiteI [intro]:
-The inductive cases involve operators @{text "ALT, SEQ"} and @{text "STAR"}.
+shows "finite ((UNIV // \<approx>{})::lang set)"
-Tagging functions need to be defined individually for each of them. There will be one
+unfolding quot_null_eq by simp
-dedicated section for each of these cases, and each section goes virtually the same way:
-gives definition of the tagging function and prove that strings
-with the same tag are equivalent.
+subsection {* The case for @{const "EMPTY"} *}
-*}
 lemma quot_empty_subset:
 "UNIV // (\<approx>{[]}) \<subseteq> {{[]}, UNIV - {[]}}"
 proof
 fix x
 assume "x \<in> UNIV // \<approx>{[]}"
 then obtain y where h: "x = {z. (y, z) \<in> \<approx>{[]}}"
 unfolding quotient_def Image_def by blast
 show "x \<in> {{[]}, UNIV - {[]}}"
 proof (cases "y = []")
 case True with h
-have "x = {[]}" by (auto simp:str_eq_rel_def)
+have "x = {[]}" by (auto simp: str_eq_rel_def)
 thus ?thesis by simp
 next
 case False with h
-have "x = UNIV - {[]}" by (auto simp:str_eq_rel_def)
+have "x = UNIV - {[]}" by (auto simp: str_eq_rel_def)
 thus ?thesis by simp
 qed
 qed
+lemma quot_empty_finiteI [intro]:
+shows "finite (UNIV // (\<approx>{[]}))"
+by (rule finite_subset[OF quot_empty_subset]) (simp)
+subsection {* The case for @{const "CHAR"} *}
 lemma quot_char_subset:
 "UNIV // (\<approx>{[c]}) \<subseteq> {{[]},{[c]}, UNIV - {[], [c]}}"
 proof
 fix x
 by (auto simp add:str_eq_rel_def)
 } ultimately show ?thesis by blast
 qed
 qed
+lemma quot_char_finiteI [intro]:
+shows "finite (UNIV // (\<approx>{[c]}))"
+by (rule finite_subset[OF quot_char_subset]) (simp)
 subsection {* The case for @{text "SEQ"}*}
 definition
-"tag_str_SEQ L\<^isub>1 L\<^isub>2 x \<equiv>
+tag_str_SEQ :: "lang \<Rightarrow> lang \<Rightarrow> string \<Rightarrow> (lang \<times> lang set)"
-((\<approx>L\<^isub>1) `` {x}, {(\<approx>L\<^isub>2) `` {x - xa}| xa.  xa \<le> x \<and> xa \<in> L\<^isub>1})"
+where
+"tag_str_SEQ L1 L2 = (\<lambda>x. (\<approx>L1 `` {x}, {(\<approx>L2 `` {x - xa}) | xa.  xa \<le> x \<and> xa \<in> L1}))"
-lemma tag_str_seq_range_finite:
-"\<lbrakk>finite (UNIV // \<approx>L\<^isub>1); finite (UNIV // \<approx>L\<^isub>2)\<rbrakk>
-\<Longrightarrow> finite (range (tag_str_SEQ L\<^isub>1 L\<^isub>2))"
-apply (rule_tac B = "(UNIV // \<approx>L\<^isub>1) \<times> (Pow (UNIV // \<approx>L\<^isub>2))" in finite_subset)
-by (auto simp:tag_str_SEQ_def Image_def quotient_def split:if_splits)
 lemma append_seq_elim:
 assumes "x @ y \<in> L\<^isub>1 ;; L\<^isub>2"
 shows "(\<exists> xa \<le> x. xa \<in> L\<^isub>1 \<and> (x - xa) @ y \<in> L\<^isub>2) \<or>
 (\<exists> ya \<le> y. (x @ ya) \<in> L\<^isub>1 \<and> (y - ya) \<in> L\<^isub>2)"
 qed
 } thus "tag_str_SEQ L\<^isub>1 L\<^isub>2 m = tag_str_SEQ L\<^isub>1 L\<^isub>2 n \<Longrightarrow> m \<approx>(L\<^isub>1 ;; L\<^isub>2) n"
 by (auto simp add: str_eq_def str_eq_rel_def)
 qed
-lemma quot_seq_finiteI:
+lemma quot_seq_finiteI [intro]:
-"\<lbrakk>finite (UNIV // \<approx>L\<^isub>1); finite (UNIV // \<approx>L\<^isub>2)\<rbrakk>
+fixes L1 L2::"lang"
-\<Longrightarrow> finite (UNIV // \<approx>(L\<^isub>1 ;; L\<^isub>2))"
+assumes fin1: "finite (UNIV // \<approx>L1)"
-apply (rule_tac tag = "tag_str_SEQ L\<^isub>1 L\<^isub>2" in tag_finite_imageD)
+and     fin2: "finite (UNIV // \<approx>L2)"
-by (auto intro:tag_str_SEQ_injI elim:tag_str_seq_range_finite)
+shows "finite (UNIV // \<approx>(L1 ;; L2))"
+proof (rule_tac tag = "tag_str_SEQ L1 L2" in tag_finite_imageD)
-subsection {* The case for @{text "ALT"} *}
+show "\<And>x y. tag_str_SEQ L1 L2 x = tag_str_SEQ L1 L2 y \<Longrightarrow> x \<approx>(L1 ;; L2) y"
+by (rule tag_str_SEQ_injI)
+next
+have *: "finite ((UNIV // \<approx>L1) \<times> (Pow (UNIV // \<approx>L2)))"
+using fin1 fin2 by auto
+show "finite (range (tag_str_SEQ L1 L2))"
+unfolding tag_str_SEQ_def
+apply(rule finite_subset[OF _ *])
+unfolding quotient_def
+by auto
+qed
+subsection {* The case for @{const ALT} *}
 definition
-"tag_str_ALT L\<^isub>1 L\<^isub>2 (x::string) \<equiv> ((\<approx>L\<^isub>1) `` {x}, (\<approx>L\<^isub>2) `` {x})"
+tag_str_ALT :: "lang \<Rightarrow> lang \<Rightarrow> string \<Rightarrow> (lang \<times> lang)"
+where
-lemma quot_union_finiteI:
+"tag_str_ALT L1 L2 = (\<lambda>x. (\<approx>L1 `` {x}, \<approx>L2 `` {x}))"
-assumes finite1: "finite (UNIV // \<approx>(L\<^isub>1::string set))"
-and finite2: "finite (UNIV // \<approx>L\<^isub>2)"
-shows "finite (UNIV // \<approx>(L\<^isub>1 \<union> L\<^isub>2))"
+lemma quot_union_finiteI [intro]:
-proof (rule_tac tag = "tag_str_ALT L\<^isub>1 L\<^isub>2" in tag_finite_imageD)
+fixes L1 L2::"lang"
-show "\<And>m n. tag_str_ALT L\<^isub>1 L\<^isub>2 m = tag_str_ALT L\<^isub>1 L\<^isub>2 n \<Longrightarrow> m \<approx>(L\<^isub>1 \<union> L\<^isub>2) n"
+assumes finite1: "finite (UNIV // \<approx>L1)"
-unfolding tag_str_ALT_def str_eq_def Image_def str_eq_rel_def by auto
+and     finite2: "finite (UNIV // \<approx>L2)"
+shows "finite (UNIV // \<approx>(L1 \<union> L2))"
+proof (rule_tac tag = "tag_str_ALT L1 L2" in tag_finite_imageD)
+show "\<And>x y. tag_str_ALT L1 L2 x = tag_str_ALT L1 L2 y \<Longrightarrow> x \<approx>(L1 \<union> L2) y"
+unfolding tag_str_ALT_def
+unfolding str_eq_def
+unfolding Image_def
+unfolding str_eq_rel_def
+by auto
 next
-show "finite (range (tag_str_ALT L\<^isub>1 L\<^isub>2))" using finite1 finite2
+have *: "finite ((UNIV // \<approx>L1) \<times> (UNIV // \<approx>L2))"
-apply (rule_tac B = "(UNIV // \<approx>L\<^isub>1) \<times> (UNIV // \<approx>L\<^isub>2)" in finite_subset)
+using finite1 finite2 by auto
-by (auto simp:tag_str_ALT_def Image_def quotient_def)
+show "finite (range (tag_str_ALT L1 L2))"
-qed
+unfolding tag_str_ALT_def
+apply(rule finite_subset[OF _ *])
-subsection {*
+unfolding quotient_def
-The case for @{text "STAR"}
+by auto
-*}
+qed
+subsection {* The case for @{const "STAR"} *}
 text {*
 This turned out to be the trickiest case.
 Any string @{text "x"} in language @{text "L\<^isub>1\<star>"}
 can be split into a prefix @{text "xa \<in> L\<^isub>1\<star>"} and a suffix @{text "x - xa \<in> L\<^isub>1"}.
 For one such @{text "x"}, there can be many such splits. The tagging of @{text "x"} is then
 defined by collecting the @{text "L\<^isub>1"}-state of the suffixes from every possible split.
 *}
-(* I will make some illustrations for it. *)
 definition
-"tag_str_STAR L\<^isub>1 x \<equiv> {(\<approx>L\<^isub>1) `` {x - xa} | xa. xa < x \<and> xa \<in> L\<^isub>1\<star>}"
+tag_str_STAR :: "lang \<Rightarrow> string \<Rightarrow> lang set"
+where
+"tag_str_STAR L1 = (\<lambda>x. {\<approx>L1 `` {x - xa} | xa. xa < x \<and> xa \<in> L1\<star>})"
 text {* A technical lemma. *}
 lemma finite_set_has_max: "\<lbrakk>finite A; A \<noteq> {}\<rbrakk> \<Longrightarrow>
 (\<exists> max \<in> A. \<forall> a \<in> A. f a <= (f max :: nat))"
 proof (induct rule:finite.induct)
 lemma finite_strict_prefix_set: "finite {xa. xa < (x::string)}"
 apply (induct x rule:rev_induct, simp)
 apply (subgoal_tac "{xa. xa < xs @ [x]} = {xa. xa < xs} \<union> {xs}")
 by (auto simp:strict_prefix_def)
-text {*
-The following lemma @{text "tag_str_star_range_finite"} establishes the range finiteness
-of the tagging function.
-*}
-lemma tag_str_star_range_finite:
-"finite (UNIV // \<approx>L\<^isub>1) \<Longrightarrow> finite (range (tag_str_STAR L\<^isub>1))"
-apply (rule_tac B = "Pow (UNIV // \<approx>L\<^isub>1)" in finite_subset)
-by (auto simp:tag_str_STAR_def Image_def
-quotient_def split:if_splits)
 text {*
 The following lemma @{text "tag_str_STAR_injI"} establishes the injectivity of
 the tagging function for case @{text "STAR"}.
 *}
 from this [OF _ eq_tag] and this [OF _ eq_tag [THEN sym]]
 -- {* The thesis is proved as a trivial consequence: *}
 show  ?thesis by (unfold str_eq_def str_eq_rel_def, blast)
 qed
-lemma quot_star_finiteI:
+lemma quot_star_finiteI [intro]:
-"finite (UNIV // \<approx>L\<^isub>1) \<Longrightarrow> finite (UNIV // \<approx>(L\<^isub>1\<star>))"
+fixes L1::"lang"
-apply (rule_tac tag = "tag_str_STAR L\<^isub>1" in tag_finite_imageD)
+assumes finite1: "finite (UNIV // \<approx>L1)"
-by (auto intro:tag_str_STAR_injI elim:tag_str_star_range_finite)
+shows "finite (UNIV // \<approx>(L1\<star>))"
+proof (rule_tac tag = "tag_str_STAR L1" in tag_finite_imageD)
-subsection {*
+show "\<And>x y. tag_str_STAR L1 x = tag_str_STAR L1 y \<Longrightarrow> x \<approx>(L1\<star>) y"
-The main lemma
+by (rule tag_str_STAR_injI)
-*}
-lemma easier_direction:
-"Lang = L (r::rexp) \<Longrightarrow> finite (UNIV // (\<approx>Lang))"
-proof (induct arbitrary:Lang rule:rexp.induct)
-case NULL
-have "UNIV // (\<approx>{}) \<subseteq> {UNIV} "
-by (auto simp:quotient_def str_eq_rel_def str_eq_def)
-with prems show "?case" by (auto intro:finite_subset)
 next
-case EMPTY
+have *: "finite (Pow (UNIV // \<approx>L1))"
-have "UNIV // (\<approx>{[]}) \<subseteq> {{[]}, UNIV - {[]}}"
+using finite1 by auto
-by (rule quot_empty_subset)
+show "finite (range (tag_str_STAR L1))"
-with prems show ?case by (auto intro:finite_subset)
+unfolding tag_str_STAR_def
-next
+apply(rule finite_subset[OF _ *])
-case (CHAR c)
+unfolding quotient_def
-have "UNIV // (\<approx>{[c]}) \<subseteq> {{[]},{[c]}, UNIV - {[], [c]}}"
+by auto
-by (rule quot_char_subset)
+qed
-with prems show ?case by (auto intro:finite_subset)
-next
-case (SEQ r\<^isub>1 r\<^isub>2)
+lemma rexp_imp_finite:
-have "\<lbrakk>finite (UNIV // \<approx>(L r\<^isub>1)); finite (UNIV // \<approx>(L r\<^isub>2))\<rbrakk>
+fixes r::"rexp"
-\<Longrightarrow> finite (UNIV // \<approx>(L r\<^isub>1 ;; L r\<^isub>2))"
+shows "finite (UNIV // \<approx>(L r))"
-by (erule quot_seq_finiteI, simp)
+by (induct r) (auto)
-with prems show ?case by simp
-next
-case (ALT r\<^isub>1 r\<^isub>2)
-have "\<lbrakk>finite (UNIV // \<approx>(L r\<^isub>1)); finite (UNIV // \<approx>(L r\<^isub>2))\<rbrakk>
-\<Longrightarrow> finite (UNIV // \<approx>(L r\<^isub>1 \<union> L r\<^isub>2))"
-by (erule quot_union_finiteI, simp)
-with prems show ?case by simp
-next
-case (STAR r)
-have "finite (UNIV // \<approx>(L r))
-\<Longrightarrow> finite (UNIV // \<approx>((L r)\<star>))"
-by (erule quot_star_finiteI)
-with prems show ?case by simp
-qed
 end
 (*
 lemma refined_quotient_union_eq:

changeset 47	bea2466a6084
parent 45	7aa6c20e6d31
child 48	61d9684a557a