diff --git a/thys/Frequency_Moments/Frequency_Moment_0.thy b/thys/Frequency_Moments/Frequency_Moment_0.thy
--- a/thys/Frequency_Moments/Frequency_Moment_0.thy
+++ b/thys/Frequency_Moments/Frequency_Moment_0.thy
@@ -1,1314 +1,1314 @@
 section \<open>Frequency Moment $0$\label{sec:f0}\<close>
 
 theory Frequency_Moment_0
   imports
     Frequency_Moments_Preliminary_Results
     Median_Method.Median 
     K_Smallest 
     Universal_Hash_Families.Carter_Wegman_Hash_Family
     Frequency_Moments
     Landau_Ext 
     Product_PMF_Ext
-    Universal_Hash_Families.Field
+    Universal_Hash_Families.Universal_Hash_Families_More_Finite_Fields
 begin
 
 text \<open>This section contains a formalization of a new algorithm for the zero-th frequency moment
 inspired by ideas described in \<^cite>\<open>"baryossef2002"\<close>.
 It is a KMV-type ($k$-minimum value) algorithm with a rounding method and matches the space complexity 
 of the best algorithm described in \<^cite>\<open>"baryossef2002"\<close>.
 
 In addition to the Isabelle proof here, there is also an informal hand-written proof in
 Appendix~\ref{sec:f0_proof}.\<close>
 
 (* Algorithm state as a 6-tuple.  f0_init, f0_update and f0_result below bind its
    components, in this order, to the names (s, t, p, r, h, sketch). *)
 type_synonym f0_state = "nat \<times> nat \<times> nat \<times> nat \<times> (nat \<Rightarrow> nat list) \<times> (nat \<Rightarrow> float set)"
 
 (* Shorthand: ring.hash specialised to the ring mod_ring p. *)
 definition hash where "hash p = ring.hash (mod_ring p)"
 
 (* Initial state distribution.  Note the argument order: delta, then epsilon, then n.
    - s is derived from epsilon, t and r are derived from delta,
    - p is prime_above (max n 19),
    - h is drawn from a product distribution over the indices {..<s}; each component is
      uniform on bounded_degree_polynomials (mod_ring p) 2,
    - every sketch (indices {0..<s}) starts out as the empty set. *)
 fun f0_init :: "rat \<Rightarrow> rat \<Rightarrow> nat \<Rightarrow> f0_state pmf" where
   "f0_init \<delta> \<epsilon> n =
     do {
       let s = nat \<lceil>-18 * ln (real_of_rat \<epsilon>)\<rceil>;
       let t = nat \<lceil>80 / (real_of_rat \<delta>)\<^sup>2\<rceil>;
       let p = prime_above (max n 19);
       let r = nat (4 * \<lceil>log 2 (1 / real_of_rat \<delta>)\<rceil> + 23); 
       h \<leftarrow> prod_pmf {..<s} (\<lambda>_. pmf_of_set (bounded_degree_polynomials (mod_ring p) 2));
       return_pmf (s, t, p, r, h, (\<lambda>_ \<in> {0..<s}. {}))
     }"
 
 (* Processes one stream element x.  The update is deterministic (a return_pmf): for every
    index i < s, the hash of x under h i is truncated with truncate_down r, converted with
    float_of, inserted into sketch i, and the result is passed through "least t".
    NOTE(review): "least" is not defined in this file; presumably it keeps the t smallest
    elements of a set -- confirm against its definition. *)
 fun f0_update :: "nat \<Rightarrow> f0_state \<Rightarrow> f0_state pmf" where
   "f0_update x (s, t, p, r, h, sketch) = 
     return_pmf (s, t, p, r, h, \<lambda>i \<in> {..<s}.
       least t (insert (float_of (truncate_down r (hash p x (h i)))) (sketch i)))"
 
 (* Final estimate: the median over the s indices of a per-sketch estimate.  For a sketch
    with fewer than t elements the estimate is its cardinality; otherwise it is
    t * p divided by the largest element of the sketch. *)
 fun f0_result :: "f0_state \<Rightarrow> rat pmf" where
   "f0_result (s, t, p, r, h, sketch) = return_pmf (median s (\<lambda>i \<in> {..<s}.
       (if card (sketch i) < t then of_nat (card (sketch i)) else
         rat_of_nat t* rat_of_nat p / rat_of_float (Max (sketch i)))
     ))"
 
 (* Real-valued expression in (n, epsilon, delta); note the tuple order differs from the
    argument order of f0_init.  s, r and t are the same quantities that f0_init computes.
    NOTE(review): presumably this is the bound on the bit length of encode_f0_state that is
    established later in the theory -- the corresponding lemma is not visible here. *)
 fun f0_space_usage :: "(nat \<times> rat \<times> rat) \<Rightarrow> real" where
   "f0_space_usage (n, \<epsilon>, \<delta>) = (
     let s = nat \<lceil>-18 * ln (real_of_rat \<epsilon>)\<rceil> in 
     let r = nat (4 * \<lceil>log 2 (1 / real_of_rat \<delta>)\<rceil> + 23) in
     let t = nat \<lceil>80 / (real_of_rat \<delta>)\<^sup>2 \<rceil> in
     6 +
     2 * log 2 (real s + 1) +
     2 * log 2 (real t + 1) +
     2 * log 2 (real n + 21) +
     2 * log 2 (real r + 1) +
     real s * (5 + 2 * log 2 (21 + real n) +
     real t * (13 + 4 * r + 2 * log 2 (log 2 (real n + 13)))))"
 
 (* Binary encoder for f0_state, assembled from encoding combinators defined elsewhere.
    The first and third components are encoded with the dependent combinator because the
    later encoders refer to them (bound as s and p): the last two components are encoded as
    functions on the index list [0..<s], with values encoded by P_e p 2 and S_e F_e
    respectively.  The second and fourth components use the plain product combinator. *)
 definition encode_f0_state :: "f0_state \<Rightarrow> bool list option" where
   "encode_f0_state = 
     N\<^sub>e \<Join>\<^sub>e (\<lambda>s. 
     N\<^sub>e \<times>\<^sub>e (
     N\<^sub>e \<Join>\<^sub>e (\<lambda>p. 
     N\<^sub>e \<times>\<^sub>e ( 
     ([0..<s] \<rightarrow>\<^sub>e (P\<^sub>e p 2)) \<times>\<^sub>e
     ([0..<s] \<rightarrow>\<^sub>e (S\<^sub>e F\<^sub>e))))))"
 
 (* The encoder is injective on its domain.  Proof: encode_f0_state is an encoding
    (is_encoding), obtained compositionally from the encoding lemmas of its building
    blocks; encoding_imp_inj then gives injectivity. *)
 lemma "inj_on encode_f0_state (dom encode_f0_state)"
 proof -
   have "is_encoding encode_f0_state" 
     unfolding encode_f0_state_def
     by (intro dependent_encoding exp_golomb_encoding poly_encoding fun_encoding set_encoding float_encoding)
   thus ?thesis  by (rule encoding_imp_inj)
 qed
 
 (* Common setting for the lemmas that follow:
    - epsilon and delta are rationals strictly between 0 and 1,
    - as is the input stream, all of whose elements are below n,
    - result is the output distribution: start from f0_init delta epsilon n, apply f0_update
      for each stream element in order (fold), and finish with f0_result. *)
 context
   fixes \<epsilon> \<delta> :: rat
   fixes n :: nat
   fixes as :: "nat list"
   fixes result
   assumes \<epsilon>_range: "\<epsilon> \<in> {0<..<1}"
   assumes \<delta>_range: "\<delta> \<in> {0<..<1}"
   assumes as_range: "set as \<subseteq> {..<n}"
   defines "result \<equiv> fold (\<lambda>a state. state \<bind> f0_update a) as (f0_init \<delta> \<epsilon> n) \<bind> f0_result"
 begin  
 
 (* t: same expression as the let-bound t in f0_init; it is positive because delta > 0. *)
 private definition t where "t = nat \<lceil>80 / (real_of_rat \<delta>)\<^sup>2\<rceil>"
 private lemma t_gt_0: "t > 0" using \<delta>_range by (simp add:t_def)
 
 (* s: corresponds to the let-bound s in f0_init (written there as -18 * ln ..., here as
    -(18 * ln ...)); it is positive because epsilon lies strictly between 0 and 1. *)
 private definition s where "s = nat \<lceil>-(18 * ln (real_of_rat \<epsilon>))\<rceil>"
 private lemma s_gt_0: "s > 0" using \<epsilon>_range by (simp add:s_def)
 
 (* p: same expression as the let-bound p in f0_init. *)
 private definition p where "p = prime_above (max n 19)"
 
 (* p is prime (directly from prime_above_prime). *)
 private lemma p_prime:"Factorial_Ring.prime p"
   using p_def prime_above_prime by presburger
 
 (* Lower bound on p.  The proof actually establishes p >= 19 (from the lower bound of
    prime_above applied to max n 19) and then weakens it to the stated p >= 18. *)
 private lemma p_ge_18: "p \<ge> 18"
 proof -
   have "p \<ge> 19" 
     by (metis p_def prime_above_lower_bound max.bounded_iff)
   thus ?thesis by simp
 qed
 
 (* Convenience corollaries of p_ge_18. *)
 private lemma p_gt_0: "p > 0" using p_ge_18 by simp
 private lemma p_gt_1: "p > 1" using p_ge_18 by simp
 
 (* The universe size n is at most p: n <= max n 19 <= prime_above (max n 19) = p. *)
 private lemma n_le_p: "n \<le> p"
 proof -
   have "n \<le> max n 19" by simp
   also have "... \<le> p"
     unfolding p_def by (rule prime_above_lower_bound)
   finally show ?thesis by simp
 qed
 
 (* Upper bound on p in terms of n.  Despite the lemma name, the statement is
    p <= 2*n + 40, obtained from prime_above_upper_bound and a case split on n >= 19. *)
 private lemma p_le_n: "p \<le> 2*n + 40"
 proof -
   have "p \<le> 2 * (max n 19) + 2"
     by (subst p_def, rule prime_above_upper_bound)
   also have "... \<le> 2 * n + 40"
     by (cases "n \<ge> 19", auto)
   finally show ?thesis by simp
 qed
 
 (* Every stream element is below p: it is below n (as_range) and n <= p (n_le_p). *)
 private lemma as_lt_p: "\<And>x. x \<in> set as \<Longrightarrow> x < p" 
   using as_range atLeastLessThan_iff
   by (intro order_less_le_trans[OF _ n_le_p]) blast
 
 (* Set-inclusion form of as_lt_p. *)
 private lemma as_subset_p: "set as \<subseteq> {..<p}"
    using as_lt_p  by (simp add: subset_iff)
 
 (* r: same expression as the let-bound r in f0_init; it is the first argument given to
    truncate_down wherever hash values are truncated in this theory. *)
 private definition r where "r = nat (4 * \<lceil>log 2 (1 / real_of_rat \<delta>)\<rceil> + 23)"
 
 (* r dominates the un-rounded expression 4 * log 2 (1/delta) + 23.  The proof first shows
    that the integer expression under "nat" is non-negative, so that converting it to a
    natural number loses nothing. *)
 private lemma r_bound: "4 * log 2 (1 / real_of_rat \<delta>) + 23 \<le> r"
 proof -
   have "0 \<le> log 2 (1 / real_of_rat \<delta>)" using \<delta>_range by simp 
   hence "0 \<le> \<lceil>log 2 (1 / real_of_rat \<delta>)\<rceil>" by simp
   hence "0 \<le> 4 * \<lceil>log 2 (1 / real_of_rat \<delta>)\<rceil> + 23"
     by (intro add_nonneg_nonneg mult_nonneg_nonneg, auto)
   thus ?thesis by (simp add:r_def)
 qed
 
 (* r is at least 23: the logarithmic term in r_bound is non-negative for delta in (0,1). *)
 private lemma r_ge_23: "r \<ge> 23"
 proof -
   have "(23::real) = 0 + 23" by simp
   also have "... \<le> 4 * log 2 (1 / real_of_rat \<delta>) + 23" 
     using \<delta>_range by (intro add_mono mult_nonneg_nonneg, auto) 
   also have "... \<le> r" using r_bound by simp
   finally show "23 \<le> r" by simp
 qed
 
 (* 2 powr (-r) is strictly below 1 (stated as 0 < 1 - 2 powr (-r); note that the
    inequality is strict although the lemma name says "le").  Follows from r >= 23 by
    comparing with 2 powr 0 = 1. *)
 private lemma two_pow_r_le_1: "0 < 1 - 2 powr - real r"
 proof -
   have a: "2 powr (0::real) = 1"
     by simp
   show ?thesis using r_ge_23 
     by (simp, subst a[symmetric], intro powr_less_mono, auto)
 qed
 
 (* Instantiates the locale carter_wegman_hash_family with the ring mod_ring p and the
    parameter 2.  The rewrite clause replaces ring.hash (mod_ring p) by the constant
    Frequency_Moment_0.hash p defined above.  The locale assumptions are discharged via
    carter_wegman_hash_familyI, using that p is prime. *)
 interpretation carter_wegman_hash_family "mod_ring p" 2
   rewrites "ring.hash (mod_ring p) = Frequency_Moment_0.hash p"
   using carter_wegman_hash_familyI[OF mod_ring_is_field mod_ring_finite]
   using hash_def p_prime by auto
 
 (* tr_hash x w: the hash value of x under w, truncated with truncate_down r. *)
 private definition tr_hash where "tr_hash x \<omega> = truncate_down r (hash x \<omega>)"
 
 (* sketch_rv w: "least t" applied to the float-converted truncated hash values of all
    stream elements; f0_alg_sketch below shows this is the sketch the algorithm holds. *)
 private definition sketch_rv where
   "sketch_rv \<omega> = least t ((\<lambda>x. float_of (tr_hash x \<omega>)) ` set as)"
 
 (* estimate S: the per-sketch estimate, the same expression as in f0_result. *)
 private definition estimate 
    where "estimate S = (if card S < t then of_nat (card S) else of_nat t * of_nat p / rat_of_float (Max S))"
 
 (* Primed variants: the same two notions without the float_of / rat conversions, i.e.
    stated directly over the real-valued truncated hashes. *)
 private definition sketch_rv' where "sketch_rv' \<omega> = least t ((\<lambda>x. tr_hash x \<omega>) ` set as)"
 private definition estimate' where "estimate' S = (if card S < t then real (card S) else real t * real p / Max S)"
 
 (* Product distribution over the indices {..<s}; each component is uniform on "space". *)
 private definition \<Omega>\<^sub>0 where "\<Omega>\<^sub>0 = prod_pmf {..<s} (\<lambda>_. pmf_of_set space)"
 
 (* Characterises the state distribution after the whole stream has been processed: it is
    the image of the product distribution defined above under the map that pairs the
    sampled hash functions x with the sketches sketch_rv (x i), for i < s.
    Proof by induction on the stream from the right (rev_induct), so that the induction
    step corresponds to processing one more element at the end. *)
 private lemma f0_alg_sketch:
   defines "sketch \<equiv> fold (\<lambda>a state. state \<bind> f0_update a) as (f0_init \<delta> \<epsilon> n)"
   shows "sketch = map_pmf (\<lambda>x. (s,t,p,r, x, \<lambda>i \<in> {..<s}. sketch_rv (x i))) \<Omega>\<^sub>0" 
   unfolding sketch_rv_def 
 proof (subst sketch_def, induction as rule:rev_induct)
   case Nil
   (* Empty stream: the claim reduces to the definition of f0_init. *)
   then show ?case
     by (simp add:s_def p_def[symmetric] map_pmf_def t_def r_def Let_def least_def restrict_def space_def \<Omega>\<^sub>0_def)
 next
   case (snoc x xs)
   let ?sketch = "\<lambda>\<omega> xs. least t ((\<lambda>a. float_of (tr_hash a \<omega>)) ` set xs)"
   (* Rewrite the state after xs with the induction hypothesis, then apply one update. *)
   have "fold (\<lambda>a state. state \<bind> f0_update a) (xs @ [x]) (f0_init \<delta> \<epsilon> n) =
      (map_pmf (\<lambda>\<omega>. (s, t, p, r, \<omega>, \<lambda>i \<in> {..<s}. ?sketch (\<omega> i) xs)) \<Omega>\<^sub>0) \<bind> f0_update x"
     by (simp add: restrict_def snoc del:f0_init.simps)
   also have "... = \<Omega>\<^sub>0 \<bind> (\<lambda>\<omega>. f0_update x (s, t, p, r, \<omega>, \<lambda>i\<in>{..<s}. ?sketch (\<omega> i) xs)) "
     by (simp add:map_pmf_def bind_assoc_pmf bind_return_pmf del:f0_update.simps)
   (* least_insert merges the newly inserted element into the existing sketch. *)
   also have "... = map_pmf (\<lambda>\<omega>. (s, t, p, r, \<omega>, \<lambda>i\<in>{..<s}. ?sketch (\<omega> i) (xs@[x]))) \<Omega>\<^sub>0"
     by (simp add:least_insert map_pmf_def tr_hash_def cong:restrict_cong)
   finally show ?case by blast
 qed
 
 (* Counting lemma: for q >= 0, the set A of natural numbers k different from x with
    |x - k| <= q is finite and has at most 2 * q elements.
    The cardinality bound embeds A into the integer interval from ceiling (x - q) to
    floor (x + q) with the point x removed, and counts that interval. *)
 private lemma card_nat_in_ball:
   fixes x :: nat
   fixes q :: real
   assumes "q \<ge> 0"
   defines "A \<equiv> {k. abs (real x - real k) \<le> q \<and> k \<noteq> x}"
   shows "real (card A) \<le> 2 * q" and "finite A"
 proof -
   (* x itself lies in the integer interval, so removing it lowers the count by one. *)
   have a: "of_nat x \<in> {\<lceil>real x-q\<rceil>..\<lfloor>real x+q\<rfloor>}"
     using assms 
     by (simp add: ceiling_le_iff)
 
   have "card A = card (int ` A)"
     by (rule card_image[symmetric], simp)
   also have "... \<le> card ({\<lceil>real x-q\<rceil>..\<lfloor>real x+q\<rfloor>} - {of_nat x})"
     by (intro card_mono image_subsetI, simp_all add:A_def abs_le_iff, linarith)
   also have "... = card {\<lceil>real x-q\<rceil>..\<lfloor>real x+q\<rfloor>} - 1"
     by (rule card_Diff_singleton, rule a)
   also have "... = int (card {\<lceil>real x-q\<rceil>..\<lfloor>real x+q\<rfloor>}) - int 1"
     by (intro of_nat_diff)
      (metis a card_0_eq empty_iff finite_atLeastAtMost_int less_one linorder_not_le)
   also have "... \<le> \<lfloor>q+real x\<rfloor>+1 -\<lceil>real x-q\<rceil> - 1"
     using assms by (simp, linarith)
   also have "... \<le> 2*q"
     by linarith
   finally show "card A \<le> 2 * q"
     by simp
 
   (* Finiteness: A is contained in an initial segment of the naturals. *)
   have "A \<subseteq> {..x + nat \<lceil>q\<rceil>}"
     by (rule subsetI, simp add:A_def abs_le_iff, linarith)
   thus "finite A"
     by (rule finite_subset, simp)
 qed
 
 (* The sampled polynomial has degree below 1 with probability at most 1 / p.
    The event is identified with bounded_degree_polynomials (mod_ring p) 1, and the ratio
    of its cardinality to that of "space" is computed to be 1 / p. *)
 private lemma prob_degree_lt_1:
    "prob {\<omega>. degree \<omega> < 1} \<le> 1/real p" 
 proof -
   have "space \<inter> {\<omega>. length \<omega> \<le> Suc 0} = bounded_degree_polynomials (mod_ring p) 1"
     by (auto simp:set_eq_iff bounded_degree_polynomials_def space_def)
   moreover have "field_size = p" by (simp add:mod_ring_def)
   hence "real (card (bounded_degree_polynomials (mod_ring p) (Suc 0))) / real (card space) = 1 / real p"
     by (simp add:space_def bounded_degree_polynomials_card power2_eq_square)
   ultimately show ?thesis
     by (simp add:M_def measure_pmf_of_set)
 qed
 
 (* Collision bound for truncated hashes.  For c >= 1 it bounds the probability that two
    distinct stream elements x, y have the same truncated hash value and that this value
    is at most c.  The bound has two summands: ?r1 (proportional to
    (card (set as))^2 * c^2 * 2 powr (-r) / p^2) covers the polynomials of degree >= 1,
    and ?r2 = 1 / p covers the polynomials of degree < 1.
    Structure of the proof:
      a - for degree >= 1 the untruncated hashes of distinct x, y < p differ,
      b - the bound for one fixed pair x < y, by counting value pairs (u, v) that
          truncate to the same value (using c and card_nat_in_ball),
      then a union bound over all pairs, and finally the split by degree. *)
 private lemma collision_prob:
   assumes "c \<ge> 1"
   shows "prob {\<omega>. \<exists>x \<in> set as. \<exists>y \<in> set as. x \<noteq> y \<and> tr_hash x \<omega> \<le> c \<and> tr_hash x \<omega> = tr_hash y \<omega>} \<le> 
     (5/2) * (real (card (set as)))\<^sup>2 * c\<^sup>2 * 2 powr -(real r) / (real p)\<^sup>2 + 1/real p" (is "prob {\<omega>. ?l \<omega>} \<le> ?r1 + ?r2")
 proof -
   (* Slack factor: fact c below shows that a natural number whose truncation is at most c
      is itself at most rho * c. *)
   define \<rho> :: real where "\<rho> = 9/8"
 
   have rho_c_ge_0: "\<rho> * c \<ge> 0" unfolding \<rho>_def using assms by simp 
 
   have c_ge_0: "c\<ge>0" using assms by simp
   
   have "degree \<omega> \<ge> 1 \<Longrightarrow> \<omega> \<in> space \<Longrightarrow> degree \<omega> = 1" for \<omega>
     by (simp add:bounded_degree_polynomials_def space_def) 
      (metis One_nat_def Suc_1 le_less_Suc_eq less_imp_diff_less list.size(3) pos2)
 
   (* a: for polynomials of degree >= 1 in space, distinct inputs below p hash differently. *)
   hence a: "\<And>\<omega> x y. x < p \<Longrightarrow> y < p \<Longrightarrow>  x \<noteq> y \<Longrightarrow> degree \<omega> \<ge> 1 \<Longrightarrow> \<omega> \<in> space \<Longrightarrow>  hash x \<omega> \<noteq> hash y \<omega>" 
     using inj_onD[OF inj_if_degree_1]  mod_ring_carr by blast 
 
   (* b: the collision bound for a single fixed pair x < y of stream elements. *)
   have b: "prob {\<omega>. degree \<omega> \<ge> 1 \<and> tr_hash x \<omega> \<le> c \<and> tr_hash x \<omega> = tr_hash y \<omega>} \<le> 5 * c\<^sup>2 * 2 powr (-real r) /(real p)\<^sup>2"
     if b_assms: "x \<in> set as"  "y \<in> set as"  "x < y" for x y
   proof -
     (* c: if u and v truncate to the same value and that value is at most c, then u is at
        most rho * c and u, v differ by at most rho * c * 2 powr (-r). *)
     have c: "real u \<le> \<rho> * c \<and> \<bar>real u - real v\<bar> \<le> \<rho> * c * 2 powr (-real r)"
       if c_assms:"truncate_down r (real u) \<le> c" "truncate_down r (real u) = truncate_down r (real v)" for u v
     proof -
       have "9 * 2 powr - real r \<le> 9 * 2 powr (- real 23)" 
         using r_ge_23 by (intro mult_left_mono powr_mono, auto)
 
       also have "... \<le> 1" by simp
 
       finally have "9 * 2 powr - real r \<le> 1" by simp
 
       hence "1 \<le> \<rho> * (1 - 2 powr (- real r))" 
         by (simp add:\<rho>_def)
 
       hence d: "(c*1) / (1 - 2 powr (-real r)) \<le> c * \<rho>" 
         using assms two_pow_r_le_1 by (simp add: pos_divide_le_eq)
 
       have "\<And>x. truncate_down r (real x) \<le> c \<Longrightarrow> real x * (1 - 2 powr - real r) \<le> c * 1" 
         using  truncate_down_pos[OF of_nat_0_le_iff] order_trans by (simp, blast)
 
       hence "\<And>x. truncate_down r (real x) \<le>  c  \<Longrightarrow> real x \<le> c * \<rho>"
         using two_pow_r_le_1 by (intro order_trans[OF _ d], simp add: pos_le_divide_eq) 
 
       hence e: "real u \<le> c * \<rho>" "real v \<le> c * \<rho>" 
         using c_assms by auto
 
       have " \<bar>real u - real v\<bar> \<le> (max \<bar>real u\<bar> \<bar>real v\<bar>) * 2 powr (-real r)"
         using c_assms by (intro truncate_down_eq, simp)
 
       also have "... \<le> (c * \<rho>) * 2 powr (-real r)"
         using e by (intro mult_right_mono, auto)
 
       finally have "\<bar>real u - real v\<bar> \<le> \<rho> * c * 2 powr (-real r)"
         by (simp add:algebra_simps)
 
       thus ?thesis using e by (simp add:algebra_simps)
     qed
 
     (* Cover the event by the union, over pairs of distinct values (u, v) below p with
        equal truncation at most c, of the events "hash x = u and hash y = v". *)
     have "prob {\<omega>. degree \<omega> \<ge> 1 \<and> tr_hash x \<omega> \<le> c \<and> tr_hash x \<omega> = tr_hash y \<omega>} \<le>
       prob (\<Union> i \<in> {(u,v) \<in> {..<p} \<times> {..<p}. u \<noteq> v \<and> truncate_down r u \<le> c \<and> truncate_down r u = truncate_down r v}.
       {\<omega>.  hash x \<omega> = fst i \<and> hash y \<omega> = snd i})"
       using a by (intro pmf_mono[OF M_def], simp add:tr_hash_def) 
        (metis hash_range mod_ring_carr b_assms as_subset_p lessThan_iff nat_neq_iff subset_eq) 
 
     (* Union bound over the value pairs. *)
     also have "... \<le> (\<Sum> i\<in> {(u,v) \<in> {..<p} \<times> {..<p}. u \<noteq> v \<and>
       truncate_down r u \<le> c \<and> truncate_down r u = truncate_down r v}. 
       prob {\<omega>. hash x \<omega> = fst i \<and> hash  y \<omega> = snd i})"
       by (intro measure_UNION_le finite_cartesian_product finite_subset[where B="{0..<p} \<times> {0..<p}"])
        (auto simp add:M_def)
 
     also have "... \<le> (\<Sum> i\<in> {(u,v) \<in> {..<p} \<times> {..<p}. u \<noteq> v \<and>
       truncate_down r u \<le> c \<and> truncate_down r u = truncate_down r v}. 
       prob {\<omega>. (\<forall>u \<in> {x,y}. hash u \<omega> = (if u = x then (fst i) else (snd i)))})" 
       by (intro sum_mono  pmf_mono[OF M_def]) force
 
     (* Each value pair is hit with probability at most 1 / p^2 (hash_prob). *)
     also have "... \<le> (\<Sum> i\<in> {(u,v) \<in> {..<p} \<times> {..<p}. u \<noteq> v \<and>
       truncate_down r u \<le> c \<and> truncate_down r u = truncate_down r v}. 1/(real p)\<^sup>2)"
       using assms as_subset_p b_assms
       by (intro sum_mono, subst hash_prob)  (auto simp add: mod_ring_def power2_eq_square)
 
     (* What remains is to count the value pairs; from here on the chain bounds that
        cardinality. *)
     also have "... = 1/(real p)\<^sup>2 * 
       card {(u,v) \<in> {0..<p} \<times> {0..<p}. u \<noteq> v \<and> truncate_down r u \<le> c \<and> truncate_down r u = truncate_down r v}"
       by simp
 
     (* Replace the truncation conditions by the arithmetic conditions from fact c. *)
     also have "... \<le> 1/(real p)\<^sup>2 * 
       card {(u,v) \<in> {..<p} \<times> {..<p}. u \<noteq> v \<and> real u \<le> \<rho> * c \<and> abs (real u - real v) \<le> \<rho> * c * 2 powr (-real r)}"
       using c
       by (intro mult_mono of_nat_mono card_mono finite_cartesian_product finite_subset[where B="{..<p}\<times>{..<p}"])
         auto
 
     (* Group the pairs by their first component u'. *)
     also have "... \<le> 1/(real p)\<^sup>2 * card (\<Union>u' \<in> {u. u < p \<and> real u \<le> \<rho> * c}.
         {(u::nat,v::nat). u = u' \<and> abs (real u - real v) \<le> \<rho> * c * 2 powr (-real r) \<and> v < p \<and> v \<noteq> u'})"
       by (intro mult_left_mono of_nat_mono card_mono finite_cartesian_product finite_subset[where B="{..<p}\<times>{..<p}"])
        auto
 
     also have "... \<le> 1/(real p)\<^sup>2 * (\<Sum> u' \<in> {u. u < p \<and> real u \<le> \<rho> * c}.
       card  {(u,v). u = u' \<and> abs (real u - real v) \<le> \<rho> * c * 2 powr (-real r) \<and> v < p \<and> v \<noteq> u'})"
       by (intro mult_left_mono of_nat_mono card_UN_le, auto)
 
     also have "... = 1/(real p)\<^sup>2 * (\<Sum> u' \<in> {u. u < p \<and>  real u \<le> \<rho> * c}.
       card ((\<lambda>x. (u' ,x)) ` {v. abs (real u' - real v) \<le> \<rho> * c * 2 powr (-real r) \<and> v < p \<and> v \<noteq> u'}))"
       by (intro arg_cong2[where f="(*)"] arg_cong[where f="real"] sum.cong arg_cong[where f="card"])
        (auto simp add:set_eq_iff)
 
     also have "... \<le> 1/(real p)\<^sup>2 * (\<Sum> u' \<in> {u. u < p \<and> real u \<le> \<rho> * c}.
       card {v. abs (real u' - real v) \<le> \<rho> * c * 2 powr (-real r) \<and> v < p \<and> v \<noteq> u'})"
       by (intro mult_left_mono of_nat_mono sum_mono card_image_le, auto)
 
     (* Drop the constraint v < p so that the inner set has the shape of card_nat_in_ball. *)
     also have "... \<le> 1/(real p)\<^sup>2 * (\<Sum> u' \<in> {u. u < p \<and> real u \<le> \<rho> * c}.
       card {v. abs (real u' - real v) \<le> \<rho> * c * 2 powr (-real r) \<and> v \<noteq> u'})"
       by (intro mult_left_mono sum_mono of_nat_mono card_mono card_nat_in_ball subsetI)  auto
 
     also have "... \<le> 1/(real p)\<^sup>2 * (\<Sum> u' \<in> {u. u < p \<and> real u \<le> \<rho> * c}.
       real (card {v. abs (real u' - real v) \<le> \<rho> * c * 2 powr (-real r) \<and> v \<noteq> u'}))"
       by simp
 
     also have "... \<le> 1/(real p)\<^sup>2 * (\<Sum> u' \<in> {u. u < p \<and> real u \<le> \<rho> * c}. 2 * (\<rho> * c * 2 powr (-real r)))"
       by (intro mult_left_mono sum_mono card_nat_in_ball(1), auto)
 
     also have "... =  1/(real p)\<^sup>2 * (real (card {u. u < p \<and> real u \<le> \<rho> * c}) * (2 * (\<rho> * c * 2 powr (-real r))))"
       by simp
 
     (* Bound the number of admissible first components u by 1 + rho * c. *)
     also have "... \<le>  1/(real p)\<^sup>2 * (real (card {u. u \<le> nat (\<lfloor>\<rho> * c \<rfloor>)}) * (2 * (\<rho> * c * 2 powr (-real r))))"
       using rho_c_ge_0 le_nat_floor
       by (intro mult_left_mono mult_right_mono of_nat_mono card_mono subsetI) auto
 
     also have "... \<le>  1/(real p)\<^sup>2 * ((1+\<rho> * c) * (2 * (\<rho> * c * 2 powr (-real r))))"
       using rho_c_ge_0 by (intro mult_left_mono mult_right_mono, auto)
 
     (* Uses c >= 1 to absorb the additive 1 into the factor c. *)
     also have "... \<le>  1/(real p)\<^sup>2 * (((1+\<rho>) * c) * (2 * (\<rho> * c * 2 powr (-real r))))" 
       using assms by (intro mult_mono, auto simp add:distrib_left distrib_right \<rho>_def)
 
     also have "... = (\<rho> * (2 + \<rho> * 2)) * c\<^sup>2 * 2 powr (-real r) /(real p)\<^sup>2"
       by (simp add:ac_simps power2_eq_square) 
 
     (* With rho = 9/8 the constant rho * (2 + rho * 2) is at most 5. *)
     also have "... \<le> 5 * c\<^sup>2 *  2 powr (-real r) /(real p)\<^sup>2"
       by (intro divide_right_mono mult_right_mono) (auto simp add:\<rho>_def)
 
     finally show ?thesis by simp
   qed
 
   (* Union bound over the ordered pairs x < y of stream elements, using b for each pair. *)
   have "prob {\<omega>. ?l \<omega> \<and> degree \<omega> \<ge> 1} \<le> 
     prob (\<Union> i \<in> {(x,y) \<in> (set as) \<times> (set as). x < y}. {\<omega>. degree \<omega> \<ge> 1 \<and> tr_hash (fst i) \<omega> \<le> c \<and>
     tr_hash (fst i) \<omega> = tr_hash (snd i) \<omega>})"
     by (rule pmf_mono[OF M_def], simp, metis linorder_neqE_nat)
 
   also have "... \<le> (\<Sum> i \<in> {(x,y) \<in> (set as) \<times> (set as). x < y}. prob 
     {\<omega>. degree \<omega> \<ge> 1 \<and> tr_hash  (fst i) \<omega> \<le> c \<and> tr_hash (fst i) \<omega> = tr_hash (snd i) \<omega>})"
     unfolding M_def
     by (intro measure_UNION_le finite_cartesian_product finite_subset[where B="(set as) \<times> (set as)"])
       auto
 
   also have "... \<le> (\<Sum> i \<in> {(x,y) \<in> (set as) \<times> (set as). x < y}. 5  * c\<^sup>2 * 2 powr (-real r) /(real p)\<^sup>2)"
     using b by (intro sum_mono, simp add:case_prod_beta)
 
   also have "... =  ((5/2) * c\<^sup>2  * 2 powr (-real r) /(real p)\<^sup>2) * (2 * card  {(x,y) \<in> (set as) \<times> (set as). x < y})"
     by simp
 
   (* card_ordered_pairs: twice the number of ordered pairs is k * (k - 1) for k = card (set as). *)
   also have "... =  ((5/2) * c\<^sup>2  * 2 powr (-real r) /(real p)\<^sup>2) * (card (set as) * (card (set as) - 1))"
     by (subst card_ordered_pairs, auto) 
 
   also have "... \<le> ((5/2) * c\<^sup>2 * 2 powr (-real r) /(real p)\<^sup>2) * (real (card (set as)))\<^sup>2"
     by (intro mult_left_mono) (auto simp add:power2_eq_square mult_left_mono)
 
   also have "... = (5/2) * (real (card (set as)))\<^sup>2 * c\<^sup>2 * 2 powr (-real r) /(real p)\<^sup>2"
     by (simp add:algebra_simps)
 
   finally have f:"prob {\<omega>. ?l \<omega> \<and> degree \<omega> \<ge> 1} \<le> ?r1" by simp
 
   (* Split by degree: the degree < 1 part is bounded by prob_degree_lt_1. *)
   have "prob {\<omega>. ?l \<omega>} \<le> prob {\<omega>. ?l \<omega> \<and> degree \<omega> \<ge> 1} + prob {\<omega>. degree \<omega> < 1}"
     by (rule pmf_add[OF M_def], auto)
   also have "... \<le> ?r1 + ?r2"
     by (intro add_mono f prob_degree_lt_1)
   finally show ?thesis by simp
 qed
 
 (* A 0/1-valued indicator equals its own square (stated for real numbers). *)
 private lemma of_bool_square: "(of_bool x)\<^sup>2 = ((of_bool x)::real)"
   by (cases x, auto)
 
 (* Q y w: the number of distinct stream elements whose (untruncated) hash value under w
    is strictly below the integer y. *)
 private definition Q where "Q y \<omega> = card {x \<in> set as. int (hash x \<omega>) < y}"
 
 (* m: the number of distinct stream elements. *)
 private definition m where "m = card (set as)"
 
 (* Expectation and variance of Q a for an integer threshold a with 0 <= a <= p:
    exp_Q: the expectation equals m * a / p,
    var_Q: the variance is at most m * a / p.
    Q a is written as a sum of indicators, one per distinct stream element; the expectation
    follows by linearity, the variance from the independence of any two of the indicators. *)
 private lemma
   assumes "a \<ge> 0"
   assumes "a \<le> int p"
   shows exp_Q: "expectation (\<lambda>\<omega>. real (Q a \<omega>)) = real m * (of_int a) / p"
   and var_Q: "variance (\<lambda>\<omega>. real (Q a \<omega>)) \<le> real m * (of_int a) / p"
 proof -
   (* Expectation of a single indicator: the probability that hash x falls below a. *)
   have exp_single: "expectation (\<lambda>\<omega>. of_bool (int (hash x \<omega>) < a)) = real_of_int a /real p"
     if a:"x \<in> set as" for x
   proof -
     have x_le_p: "x < p" using a as_lt_p by simp
     have "expectation (\<lambda>\<omega>. of_bool (int (hash x \<omega>) < a)) = expectation (indicat_real {\<omega>. int (Frequency_Moment_0.hash p x \<omega>) < a})"
       by (intro arg_cong2[where f="integral\<^sup>L"] ext, simp_all)
     also have "... = prob {\<omega>. hash x \<omega> \<in> {k. int k < a}}"
       by (simp add:M_def)
     also have "... = card ({k. int k < a} \<inter> {..<p}) / real p"
       by (subst prob_range, simp_all add: x_le_p mod_ring_def)
     also have "... = card {..<nat a} / real p"
       using assms by (intro arg_cong2[where f="(/)"] arg_cong[where f="real"] arg_cong[where f="card"])
        (auto simp add:set_eq_iff) 
     also have "... =  real_of_int a/real p"
       using assms by simp
     finally show "expectation (\<lambda>\<omega>. of_bool (int (hash x \<omega>) < a)) = real_of_int a /real p"
       by simp
   qed
 
   (* Expectation: linearity over the sum of indicators. *)
   have "expectation(\<lambda>\<omega>. real (Q a \<omega>)) = expectation (\<lambda>\<omega>. (\<Sum>x \<in> set as. of_bool (int (hash x \<omega>) < a)))"
     by (simp add:Q_def Int_def)
   also have "... =  (\<Sum>x \<in> set as. expectation (\<lambda>\<omega>. of_bool (int (hash x \<omega>) < a)))"
     by (rule Bochner_Integration.integral_sum, simp)
   also have "... = (\<Sum> x \<in> set as. a /real p)"
     by (rule sum.cong, simp, subst exp_single, simp, simp)
   also have "... = real m *  real_of_int a / real p"
     by (simp add:m_def)
   finally show "expectation (\<lambda>\<omega>. real (Q a \<omega>)) = real m * real_of_int a / p" by simp
 
   (* Any two of the indicators are independent (from k_wise_indep of the hash family). *)
   have indep: "J \<subseteq> set as \<Longrightarrow> card J = 2 \<Longrightarrow> indep_vars (\<lambda>_. borel) (\<lambda>i x. of_bool (int (hash i x) < a)) J" for J
     using as_subset_p mod_ring_carr
     by (intro indep_vars_compose2[where Y="\<lambda>i x. of_bool (int x < a)" and M'="\<lambda>_. discrete"]
         k_wise_indep_vars_subset[OF k_wise_indep] finite_subset[OF _ finite_set]) auto
 
   have rv: "\<And>x. x \<in> set as \<Longrightarrow> random_variable borel (\<lambda>\<omega>. of_bool (int (hash x \<omega>) < a))"
      by (simp add:M_def)
 
   (* Variance: with pairwise independence the variance of the sum is the sum of the
      variances; each indicator's variance is bounded by its expectation. *)
   have "variance (\<lambda>\<omega>. real (Q a \<omega>)) = variance (\<lambda>\<omega>. (\<Sum>x \<in> set as. of_bool (int (hash x \<omega>) < a)))"
     by (simp add:Q_def Int_def)
   also have "... = (\<Sum>x \<in> set as. variance (\<lambda>\<omega>. of_bool (int (hash x \<omega>) < a)))"
     by (intro var_sum_pairwise_indep_2 indep rv) auto
   also have "... \<le> (\<Sum> x \<in> set as. a / real p)"
     by (rule sum_mono, simp add: variance_eq of_bool_square, simp add: exp_single)
   also have "... = real m * real_of_int a /real p"
     by (simp add:m_def)
   finally show "variance (\<lambda>\<omega>. real (Q a \<omega>)) \<le> real m * real_of_int a / p"
     by simp
 qed
 
 (* Upper bound on t: rounding up adds at most 1, and 1 <= 1 / delta^2 since delta < 1. *)
 private lemma t_bound: "t \<le> 81 / (real_of_rat \<delta>)\<^sup>2"
 proof -
   have "t \<le> 80 / (real_of_rat \<delta>)\<^sup>2 + 1" using t_def t_gt_0 by linarith
   also have "... \<le> 80 / (real_of_rat \<delta>)\<^sup>2 + 1 /  (real_of_rat \<delta>)\<^sup>2"
     using \<delta>_range by (intro add_mono, simp, simp add:power_le_one)
   also have "... = 81 / (real_of_rat \<delta>)\<^sup>2" by simp
   finally show ?thesis by simp
 qed
 
 (* Joint bound on t and r: 18 * 40 * t^2 * 2 powr (-r) <= 1 (the proof writes 18 * 40 as
    720).  t is bounded via t_bound and r via r_bound; the powers of delta then cancel,
    leaving the numeric inequality 720 * 81^2 * 2 powr (-23) <= 1. *)
 private lemma t_r_bound:
   "18 * 40 * (real t)\<^sup>2 * 2 powr (-real r) \<le> 1"
 proof -
   have "720 * (real t)\<^sup>2 * 2 powr (-real r) \<le> 720 * (81 / (real_of_rat \<delta>)\<^sup>2)\<^sup>2 * 2 powr (-4 * log 2 (1 / real_of_rat \<delta>) - 23)"
     using r_bound t_bound by (intro mult_left_mono mult_mono power_mono powr_mono, auto)
 
   also have "... \<le> 720 * (81 / (real_of_rat \<delta>)\<^sup>2)\<^sup>2 * (2 powr (-4 * log 2 (1 / real_of_rat \<delta>)) * 2 powr (-23))"
     using \<delta>_range by (intro mult_left_mono mult_mono power_mono add_mono)
      (simp_all add:power_le_one powr_diff)
 
   also have "... = 720 * (81\<^sup>2 / (real_of_rat \<delta>)^4) * (2 powr (log 2 ((real_of_rat \<delta>)^4))  * 2 powr (-23))"
     using \<delta>_range by (intro arg_cong2[where f="(*)"])
       (simp_all add:power2_eq_square power4_eq_xxxx log_divide log_powr[symmetric])
 
   also have "... = 720 * 81\<^sup>2 * 2 powr (-23)" using \<delta>_range by simp
 
   also have "... \<le> 1" by simp
 
   finally show ?thesis by simp
 qed
 
 (* m, the number of distinct stream elements, coincides with F 0 as (unfolding F_def). *)
 private lemma m_eq_F_0: "real m = of_rat (F 0 as)"
   by (simp add:m_def F_def)
 
 private lemma estimate'_bounds:
   "prob {\<omega>. of_rat \<delta> * real_of_rat (F 0 as) < \<bar>estimate' (sketch_rv' \<omega>) - of_rat (F 0 as)\<bar>} \<le> 1/3"
 proof (cases "card (set as) \<ge> t")
   case True
   define \<delta>' where "\<delta>' = 3 * real_of_rat \<delta> / 4"
   define u where "u = \<lceil>real t * p / (m * (1+\<delta>'))\<rceil>"
   define v where "v = \<lfloor>real t * p / (m * (1-\<delta>'))\<rfloor>"
 
   define has_no_collision where 
     "has_no_collision = (\<lambda>\<omega>. \<forall>x\<in> set as. \<forall>y \<in> set as. (tr_hash x \<omega> = tr_hash y \<omega> \<longrightarrow> x = y) \<or> tr_hash x \<omega> > v)"
 
   have "2 powr (-real r) \<le> 2 powr (-(4 * log 2 (1 / real_of_rat \<delta>) + 23))"
     using r_bound by (intro powr_mono, linarith, simp)
   also have "... = 2 powr (-4 * log 2 (1 /real_of_rat \<delta>) -23)"
     by (rule arg_cong2[where f="(powr)"], auto simp add:algebra_simps)
   also have "... \<le> 2 powr ( -1 * log 2 (1 /real_of_rat \<delta>) -4)"
     using \<delta>_range by (intro powr_mono diff_mono, auto)
   also have "... = 2 powr ( -1 * log 2 (1 /real_of_rat \<delta>)) /  16"
     by (simp add: powr_diff)
   also have "... = real_of_rat \<delta> / 16"
     using \<delta>_range by (simp add:log_divide)
   also have "... < real_of_rat \<delta> / 8"
     using \<delta>_range by (subst pos_divide_less_eq, auto)
   finally have r_le_\<delta>: "2 powr (-real r) < real_of_rat \<delta> / 8"
     by simp
 
   have \<delta>'_gt_0: "\<delta>' > 0" using \<delta>_range by (simp add:\<delta>'_def)
   have "\<delta>' < 3/4" using \<delta>_range by (simp add:\<delta>'_def)+
   also have "... < 1" by simp
   finally have \<delta>'_lt_1: "\<delta>' < 1" by simp
 
   have "t \<le> 81 / (real_of_rat \<delta>)\<^sup>2"
     using t_bound by simp
   also have "... = (81*9/16) / (\<delta>')\<^sup>2"
     by (simp add:\<delta>'_def power2_eq_square)
   also have "... \<le> 46 / \<delta>'\<^sup>2"
     by (intro divide_right_mono, simp, simp)
   finally have t_le_\<delta>': "t \<le> 46/ \<delta>'\<^sup>2" by simp
 
   have "80 \<le> (real_of_rat \<delta>)\<^sup>2 * (80 / (real_of_rat \<delta>)\<^sup>2)" using \<delta>_range by simp
   also have "... \<le> (real_of_rat \<delta>)\<^sup>2 * t"
     by (intro mult_left_mono, simp add:t_def of_nat_ceiling, simp)
   finally have "80 \<le> (real_of_rat \<delta>)\<^sup>2 * t" by simp
   hence t_ge_\<delta>': "45 \<le> t * \<delta>' * \<delta>'" by (simp add:\<delta>'_def power2_eq_square)
 
   have "m \<le> card {..<n}" unfolding m_def using as_range by (intro card_mono, auto)
   also have "... \<le> p" using n_le_p by simp
   finally have m_le_p: "m \<le> p" by simp
 
   hence t_le_m: "t \<le> card (set as)" using True by simp
   have m_ge_0: "real m > 0" using m_def True t_gt_0 by simp
 
   have "v \<le> real t * real p / (real m * (1 - \<delta>'))" by (simp add:v_def)
 
   also have "... \<le> real t * real p / (real m * (1/4))"
     using \<delta>'_lt_1 m_ge_0 \<delta>_range
     by (intro divide_left_mono mult_left_mono mult_nonneg_nonneg mult_pos_pos, simp_all add:\<delta>'_def)
 
   finally have v_ubound: "v \<le> 4 * real t * real p / real m" by (simp add:algebra_simps)
 
   have a_ge_1: "u \<ge> 1" using \<delta>'_gt_0 p_gt_0 m_ge_0 t_gt_0
     by (auto intro!:mult_pos_pos divide_pos_pos simp add:u_def) 
   hence a_ge_0: "u \<ge> 0" by simp
   have "real m * (1 - \<delta>') < real m" using \<delta>'_gt_0 m_ge_0 by simp
   also have "... \<le> 1 * real p" using m_le_p by simp
   also have "... \<le> real t * real p" using t_gt_0 by (intro mult_right_mono, auto)
   finally have " real m * (1 - \<delta>') < real t * real p" by simp
   hence v_gt_0: "v > 0" using mult_pos_pos m_ge_0 \<delta>'_lt_1 by (simp add:v_def)
   hence v_ge_1: "real_of_int v \<ge> 1" by linarith
 
   have "real t \<le> real m" using True m_def by linarith
   also have "... < (1 + \<delta>') * real m" using \<delta>'_gt_0 m_ge_0 by force
   finally have a_le_p_aux: "real t < (1 + \<delta>') * real m"  by simp
 
   have "u \<le> real t * real p / (real m * (1 + \<delta>'))+1" by (simp add:u_def)
   also have "... < real p + 1" 
     using m_ge_0 \<delta>'_gt_0 a_le_p_aux  a_le_p_aux p_gt_0
     by (simp add: pos_divide_less_eq ac_simps) 
   finally have "u \<le> real p" 
     by (metis int_less_real_le not_less of_int_le_iff of_int_of_nat_eq)
   hence u_le_p: "u \<le> int p" by linarith
 
   have "prob {\<omega>. Q u \<omega> \<ge> t} \<le> prob {\<omega> \<in> Sigma_Algebra.space M. abs (real (Q u \<omega>) - 
     expectation (\<lambda>\<omega>. real (Q u \<omega>))) \<ge> 3 * sqrt (m * real_of_int u / p)}"
   proof (rule pmf_mono[OF M_def])
     fix \<omega>
     assume "\<omega> \<in> {\<omega>. t \<le> Q u \<omega>}"
     hence t_le: "t \<le> Q u \<omega>" by simp
     have "real m * real_of_int u / real p \<le> real m * (real t * real p / (real m * (1 + \<delta>'))+1) / real p"
       using m_ge_0 p_gt_0 by (intro divide_right_mono mult_left_mono, simp_all add: u_def)
     also have "... = real m * real t * real p / (real m * (1+\<delta>') * real p) + real m / real p"
       by (simp add:distrib_left add_divide_distrib)
     also have "... = real t / (1+\<delta>') + real m / real p"
       using p_gt_0 m_ge_0 by simp
     also have "... \<le> real t / (1+\<delta>') + 1"
       using m_le_p p_gt_0 by (intro add_mono, auto)
     finally have "real m * real_of_int u / real p \<le> real t / (1 + \<delta>') + 1"
       by simp
 
     hence "3 * sqrt (real m * of_int u / real p) + real m * of_int u / real p \<le> 
       3 * sqrt (t / (1+\<delta>')+1)+(t/(1+\<delta>')+1)"
       by (intro add_mono mult_left_mono real_sqrt_le_mono, auto)
     also have "... \<le> 3 * sqrt (real t+1) + ((t * (1 - \<delta>' / (1+\<delta>'))) + 1)"
       using \<delta>'_gt_0 t_gt_0 by (intro add_mono mult_left_mono real_sqrt_le_mono)
         (simp_all add: pos_divide_le_eq left_diff_distrib)
     also have "... = 3 * sqrt (real t+1) + (t - \<delta>' * t / (1+\<delta>')) + 1" by (simp add:algebra_simps)
     also have "... \<le> 3 * sqrt (46 / \<delta>'\<^sup>2 + 1 / \<delta>'\<^sup>2) + (t - \<delta>' * t/2) + 1 / \<delta>'"
       using \<delta>'_gt_0 t_gt_0 \<delta>'_lt_1 add_pos_pos  t_le_\<delta>'
       by (intro add_mono mult_left_mono real_sqrt_le_mono add_mono)
        (simp_all add: power_le_one pos_le_divide_eq)
     also have "... \<le> (21 / \<delta>' + (t - 45 / (2*\<delta>'))) + 1 / \<delta>'" 
       using \<delta>'_gt_0 t_ge_\<delta>' by (intro add_mono)
          (simp_all add:real_sqrt_divide divide_le_cancel real_le_lsqrt pos_divide_le_eq ac_simps)
     also have "... \<le> t" using \<delta>'_gt_0 by simp
     also have "... \<le> Q u \<omega>" using t_le by simp
     finally have "3 * sqrt (real m * of_int u / real p) + real m * of_int u / real p \<le> Q u \<omega>"
       by simp
     hence " 3 * sqrt (real m * real_of_int u / real p) \<le> \<bar>real (Q u \<omega>) - expectation (\<lambda>\<omega>. real (Q u \<omega>))\<bar>"
       using a_ge_0 u_le_p  True by (simp add:exp_Q abs_ge_iff)
 
     thus "\<omega> \<in> {\<omega> \<in> Sigma_Algebra.space M. 3 * sqrt (real m * real_of_int u / real p) \<le> 
       \<bar>real (Q u \<omega>) - expectation (\<lambda>\<omega>. real (Q u \<omega>))\<bar>}"
       by (simp add: M_def)
   qed
   also have "... \<le> variance  (\<lambda>\<omega>. real (Q u \<omega>)) / (3 * sqrt (real m * of_int u / real p))\<^sup>2"
     using a_ge_1 p_gt_0 m_ge_0 
     by (intro Chebyshev_inequality, simp add:M_def, auto) 
 
   also have "... \<le> (real m * real_of_int u / real p) / (3 * sqrt (real m * of_int u / real p))\<^sup>2"
     using a_ge_0 u_le_p by (intro divide_right_mono var_Q, auto)
 
   also have "... \<le> 1/9" using a_ge_0 by simp
 
   finally have case_1: "prob {\<omega>. Q u \<omega> \<ge> t} \<le> 1/9" by simp
 
   have case_2: "prob {\<omega>. Q v \<omega> < t} \<le> 1/9"
   proof (cases "v \<le> p")
     case True
     have "prob {\<omega>. Q v \<omega> < t} \<le> prob {\<omega> \<in> Sigma_Algebra.space M. abs (real (Q v \<omega>) - expectation (\<lambda>\<omega>. real (Q v \<omega>))) 
       \<ge> 3 * sqrt (m * real_of_int v / p)}"
     proof (rule pmf_mono[OF M_def])
       fix \<omega>
       assume "\<omega> \<in> set_pmf (pmf_of_set space)"
       have "(real t + 3 * sqrt (real t / (1 - \<delta>') )) * (1 - \<delta>') = real t - \<delta>' * t + 3 * ((1-\<delta>') * sqrt( real t / (1-\<delta>') ))"
         by (simp add:algebra_simps)
 
       also have "... = real t - \<delta>' * t + 3 * sqrt (  (1-\<delta>')\<^sup>2 * (real t /  (1-\<delta>')))"
         using \<delta>'_lt_1 by (subst real_sqrt_mult, simp)
 
       also have "... = real t - \<delta>' * t + 3 * sqrt ( real t * (1- \<delta>'))"
         by (simp add:power2_eq_square distrib_left)
 
       also have "... \<le> real t - 45/ \<delta>' + 3 * sqrt ( real t )"
         using \<delta>'_gt_0 t_ge_\<delta>' \<delta>'_lt_1 by (intro add_mono mult_left_mono real_sqrt_le_mono)
          (simp_all add:pos_divide_le_eq ac_simps left_diff_distrib power_le_one)
 
        also have "... \<le> real t - 45/ \<delta>' + 3 * sqrt ( 46 / \<delta>'\<^sup>2)"
          using  t_le_\<delta>' \<delta>'_lt_1 \<delta>'_gt_0
          by (intro add_mono mult_left_mono real_sqrt_le_mono, simp_all add:pos_divide_le_eq power_le_one)
 
       also have "... = real t + (3 * sqrt(46) - 45)/ \<delta>'"
         using \<delta>'_gt_0 by (simp add:real_sqrt_divide diff_divide_distrib)
 
       also have "... \<le> t"
         using \<delta>'_gt_0 by (simp add:pos_divide_le_eq real_le_lsqrt)
 
       finally have aux: "(real t + 3 * sqrt (real t / (1 - \<delta>'))) * (1 - \<delta>') \<le> real t "
         by simp
 
       assume "\<omega> \<in> {\<omega>. Q v \<omega> < t}"
       hence "Q v \<omega> < t" by simp
 
       hence "real (Q v \<omega>) + 3 * sqrt (real m * real_of_int v / real p) 
         \<le> real t - 1 + 3 * sqrt (real m * real_of_int v / real p)"
         using m_le_p p_gt_0 by (intro add_mono, auto simp add: algebra_simps add_divide_distrib)
 
       also have "... \<le> (real t-1) + 3 * sqrt (real m * (real t * real p / (real m * (1- \<delta>'))) / real p)"
         by (intro add_mono mult_left_mono real_sqrt_le_mono divide_right_mono)
          (auto simp add:v_def)
 
       also have "... \<le> real t + 3 * sqrt(real t / (1-\<delta>')) - 1"
         using m_ge_0 p_gt_0 by simp
 
       also have "... \<le> real t / (1-\<delta>')-1" 
         using \<delta>'_lt_1 aux by (simp add: pos_le_divide_eq)   
       also have "... \<le> real m * (real t * real p / (real m * (1-\<delta>'))) / real p - 1"
         using p_gt_0 m_ge_0 by simp
       also have "... \<le> real m * (real t * real p / (real m * (1-\<delta>'))) / real p - real m / real p"
           using m_le_p p_gt_0
           by (intro diff_mono, auto)
       also have "... = real m * (real t * real p / (real m * (1-\<delta>'))-1) / real p" 
           by (simp add: left_diff_distrib right_diff_distrib diff_divide_distrib)
       also have "... \<le>  real m * real_of_int v / real p"      
         by (intro divide_right_mono mult_left_mono, simp_all add:v_def)
 
       finally have "real (Q v \<omega>) + 3 * sqrt (real m * real_of_int v / real p) 
         \<le> real m * real_of_int v / real p" by simp
 
       hence " 3 * sqrt (real m * real_of_int v / real p) \<le> \<bar>real (Q v \<omega>) -expectation (\<lambda>\<omega>. real (Q v \<omega>))\<bar>"  
         using v_gt_0 True by (simp add: exp_Q abs_ge_iff)
 
       thus "\<omega> \<in> {\<omega>\<in> Sigma_Algebra.space M. 3 * sqrt (real m * real_of_int v / real p) \<le> 
         \<bar>real (Q v \<omega>) - expectation (\<lambda>\<omega>. real (Q v \<omega>))\<bar>}" 
         by (simp add:M_def)
     qed
     also have "... \<le> variance (\<lambda>\<omega>. real (Q v \<omega>)) / (3 * sqrt (real m * real_of_int v / real p))\<^sup>2" 
       using v_gt_0 p_gt_0 m_ge_0 
       by (intro Chebyshev_inequality, simp add:M_def, auto)
 
     also have "... \<le> (real m * real_of_int v / real p) / (3 * sqrt (real m * real_of_int v / real p))\<^sup>2"
       using  v_gt_0 True  by (intro divide_right_mono var_Q, auto)
 
     also have "... = 1/9"
       using p_gt_0 v_gt_0 m_ge_0 by (simp add:power2_eq_square)
 
     finally show ?thesis by simp
   next
     case False
     have "prob {\<omega>. Q v \<omega> < t} \<le> prob {\<omega>. False}"
     proof (rule pmf_mono[OF M_def])
       fix \<omega>
       assume a:"\<omega> \<in> {\<omega>. Q v \<omega> < t}"
       assume "\<omega> \<in> set_pmf (pmf_of_set space)"
       hence b:"\<And>x. x < p \<Longrightarrow> hash x \<omega> < p" 
         using hash_range mod_ring_carr by (simp add:M_def measure_pmf_inverse) 
       have "t \<le> card (set as)" using True by simp
       also have "... \<le> Q v \<omega>"
         unfolding Q_def  using b False as_lt_p by (intro card_mono subsetI, simp, force) 
       also have "... < t" using a by simp
       finally have "False" by auto
       thus "\<omega> \<in> {\<omega>. False}" by simp
     qed
     also have "... = 0" by auto
     finally show ?thesis by simp
   qed
 
   have "prob {\<omega>. \<not>has_no_collision \<omega>} \<le>
     prob {\<omega>. \<exists>x \<in> set as. \<exists>y \<in> set as. x \<noteq> y \<and> tr_hash x \<omega> \<le> real_of_int v \<and> tr_hash x \<omega> = tr_hash y \<omega>}"
     by (rule pmf_mono[OF M_def]) (simp add:has_no_collision_def M_def, force) 
 
   also have "... \<le> (5/2) * (real (card (set as)))\<^sup>2 * (real_of_int v)\<^sup>2 * 2 powr - real r / (real p)\<^sup>2 + 1 / real p"
     using collision_prob v_ge_1 by blast
 
   also have "... \<le> (5/2) * (real m)\<^sup>2 * (real_of_int v)\<^sup>2 * 2 powr - real r / (real p)\<^sup>2 + 1 / real p"
     by (intro divide_right_mono add_mono mult_right_mono mult_mono power_mono, simp_all add:m_def)
 
   also have "... \<le> (5/2) * (real m)\<^sup>2 * (4 * real t * real p / real m)\<^sup>2 * (2 powr - real r) / (real p)\<^sup>2 + 1 / real p"
     using v_def v_ge_1 v_ubound
     by (intro add_mono divide_right_mono  mult_right_mono  mult_left_mono, auto)
 
   also have "... = 40 * (real t)\<^sup>2 * (2 powr -real r) + 1 / real p"
     using p_gt_0 m_ge_0 t_gt_0 by (simp add:algebra_simps power2_eq_square)
 
   also have "... \<le> 1/18 + 1/18"
     using t_r_bound p_ge_18 by (intro add_mono, simp_all add: pos_le_divide_eq)
 
   also have "... = 1/9" by simp
 
   finally have case_3: "prob {\<omega>. \<not>has_no_collision \<omega>} \<le> 1/9" by simp
 
   have "prob {\<omega>. real_of_rat \<delta> * of_rat (F 0 as) < \<bar>estimate' (sketch_rv' \<omega>) - of_rat (F 0 as)\<bar>} \<le> 
     prob {\<omega>. Q u \<omega> \<ge> t \<or> Q v \<omega> < t \<or> \<not>(has_no_collision \<omega>)}"
   proof (rule pmf_mono[OF M_def], rule ccontr)
     fix \<omega>
     assume "\<omega> \<in> set_pmf (pmf_of_set space)"
     assume "\<omega> \<in> {\<omega>. real_of_rat \<delta> * real_of_rat (F 0 as) < \<bar>estimate' (sketch_rv' \<omega>) - real_of_rat (F 0 as)\<bar>}"
     hence est: "real_of_rat \<delta> * real_of_rat (F 0 as) < \<bar>estimate' (sketch_rv' \<omega>) - real_of_rat (F 0 as)\<bar>" by simp
     assume "\<omega> \<notin> {\<omega>. t \<le> Q u \<omega> \<or> Q v \<omega> < t \<or> \<not> has_no_collision \<omega>}"
     hence "\<not>( t \<le> Q u \<omega> \<or> Q v \<omega> < t \<or> \<not> has_no_collision \<omega>)" by simp
     hence lb: "Q u \<omega> < t" and ub: "Q v \<omega> \<ge> t" and no_col: "has_no_collision \<omega>" by simp+
 
     define y where "y =  nth_mset (t-1) {#int (hash x \<omega>). x \<in># mset_set (set as)#}"
     define y' where "y' = nth_mset (t-1) {#tr_hash x \<omega>. x \<in># mset_set (set as)#}"
 
     have rank_t_lb: "u \<le> y"
       unfolding y_def using True t_gt_0 lb
       by (intro nth_mset_bound_left, simp_all add:count_less_def swap_filter_image Q_def)
   
     have rank_t_ub: "y \<le> v - 1"
       unfolding y_def using True t_gt_0 ub
       by (intro nth_mset_bound_right, simp_all add:Q_def swap_filter_image count_le_def)
 
     have y_ge_0: "real_of_int y \<ge> 0" using rank_t_lb a_ge_0 by linarith
 
     have "mono (\<lambda>x. truncate_down r (real_of_int x))" 
       by (metis truncate_down_mono mono_def of_int_le_iff)
     hence y'_eq: "y' = truncate_down r y"
       unfolding y_def y'_def  using True t_gt_0
       by (subst nth_mset_commute_mono[where f="(\<lambda>x. truncate_down r (of_int x))"]) 
         (simp_all add: multiset.map_comp comp_def tr_hash_def)
 
     have "real_of_int u * (1 - 2 powr -real r) \<le> real_of_int y * (1 - 2 powr (-real r))"
       using rank_t_lb of_int_le_iff two_pow_r_le_1
       by (intro mult_right_mono, auto)
     also have "... \<le> y'"
       using y'_eq truncate_down_pos[OF y_ge_0] by simp
     finally have rank_t_lb': "u * (1 - 2 powr -real r) \<le> y'" by simp
 
     have "y' \<le> real_of_int y"
       by (subst y'_eq, rule truncate_down_le, simp)
     also have "... \<le> real_of_int (v-1)"
       using rank_t_ub of_int_le_iff by blast
     finally have rank_t_ub': "y' \<le> v-1"
       by simp
 
     have "0 < u * (1-2 powr -real r)"
       using a_ge_1 two_pow_r_le_1 by (intro mult_pos_pos, auto)
     hence y'_pos: "y' > 0" using rank_t_lb' by linarith
 
     have no_col': "\<And>x. x \<le> y' \<Longrightarrow> count {#tr_hash x \<omega>. x \<in># mset_set (set as)#} x \<le> 1"
       using  rank_t_ub' no_col 
       by (simp add:vimage_def card_le_Suc0_iff_eq count_image_mset has_no_collision_def) force
 
     have h_1: "Max (sketch_rv' \<omega>) = y'"
       using True t_gt_0 no_col'
       by (simp add:sketch_rv'_def y'_def nth_mset_max)
 
     have "card (sketch_rv' \<omega>) = card (least ((t-1)+1) (set_mset {#tr_hash x \<omega>. x \<in># mset_set (set as)#}))"
       using t_gt_0 by (simp add:sketch_rv'_def)
     also have "... = (t-1) +1"
       using True t_gt_0 no_col' by (intro nth_mset_max(2), simp_all add:y'_def)
     also have "... = t" using t_gt_0 by simp
     finally have "card (sketch_rv' \<omega>) = t" by simp
     hence h_3: "estimate' (sketch_rv' \<omega>) = real t * real p / y'"
       using h_1 by (simp add:estimate'_def)
 
     have "(real t) * real p \<le>  (1 + \<delta>') * real m * ((real t) * real p / (real m * (1 + \<delta>')))" 
       using \<delta>'_lt_1 m_def True t_gt_0 \<delta>'_gt_0 by auto
     also have "... \<le> (1+\<delta>') * m * u"
       using \<delta>'_gt_0 by (intro mult_left_mono, simp_all add:u_def)
     also have "... < ((1 + real_of_rat \<delta>)*(1-real_of_rat \<delta>/8)) * m * u"
       using True m_def t_gt_0 a_ge_1 \<delta>_range
       by (intro mult_strict_right_mono, auto simp add:\<delta>'_def right_diff_distrib)
     also have "... \<le> ((1 + real_of_rat \<delta>)*(1-2 powr (-r))) * m * u"
       using r_le_\<delta> \<delta>_range a_ge_0 by (intro mult_right_mono mult_left_mono, auto)
     also have "... = (1 + real_of_rat \<delta>) * m * (u * (1-2 powr -real r))" 
       by simp
     also have "... \<le> (1 + real_of_rat \<delta>) * m * y'"
       using \<delta>_range by (intro mult_left_mono rank_t_lb', simp)
     finally have "real t * real p < (1 + real_of_rat \<delta>) * m * y'" by simp
     hence f_1: "estimate' (sketch_rv' \<omega>) < (1 + real_of_rat \<delta>) * m"
       using y'_pos by (simp add: h_3 pos_divide_less_eq)
 
     have "(1 - real_of_rat \<delta>) * m * y' \<le> (1 - real_of_rat \<delta>) * m * v" 
       using \<delta>_range rank_t_ub' y'_pos by (intro mult_mono rank_t_ub', simp_all)
     also have "... = (1-real_of_rat \<delta>) * (real m * v)"
       by simp
     also have "... < (1-\<delta>') * (real m * v)" 
       using \<delta>_range m_ge_0 v_ge_1
       by (intro mult_strict_right_mono mult_pos_pos, simp_all add:\<delta>'_def)
     also have "... \<le> (1-\<delta>') * (real m * (real t * real p / (real m * (1-\<delta>'))))"
       using \<delta>'_gt_0 \<delta>'_lt_1 by (intro mult_left_mono, auto simp add:v_def)
     also have "... = real t * real p"
       using \<delta>'_gt_0 \<delta>'_lt_1 t_gt_0 p_gt_0 m_ge_0 by auto
     finally have "(1 - real_of_rat \<delta>) * m * y' < real t * real p" by simp
     hence f_2: "estimate' (sketch_rv' \<omega>) > (1 - real_of_rat \<delta>) * m"
       using y'_pos by (simp add: h_3 pos_less_divide_eq)
 
     have "abs (estimate' (sketch_rv' \<omega>) - real_of_rat (F 0 as)) < real_of_rat \<delta> * (real_of_rat (F 0 as))"
       using f_1 f_2 by (simp add:abs_less_iff algebra_simps m_eq_F_0)
     thus "False" using est by linarith
   qed
   also have "... \<le> 1/9 + (1/9 + 1/9)"
     by (intro pmf_add_2[OF M_def] case_1 case_2 case_3)
   also have "... = 1/3" by simp
   finally show ?thesis by simp
 next
   case False
   have "prob {\<omega>. real_of_rat \<delta> * of_rat (F 0 as) < \<bar>estimate' (sketch_rv' \<omega>) - of_rat (F 0 as)\<bar>} \<le>
     prob {\<omega>. \<exists>x \<in> set as. \<exists>y \<in> set as. x \<noteq> y \<and> tr_hash x \<omega> \<le> real p \<and> tr_hash x \<omega> = tr_hash y \<omega>}" 
   proof (rule pmf_mono[OF M_def])
     fix \<omega>
     assume a:"\<omega> \<in> {\<omega>. real_of_rat \<delta> * real_of_rat (F 0 as) < \<bar>estimate' (sketch_rv' \<omega>) - real_of_rat (F 0 as)\<bar>}"
     assume b:"\<omega> \<in> set_pmf (pmf_of_set space)" 
     have c: "card (set as) < t" using False by auto
     hence "card ((\<lambda>x. tr_hash x \<omega>) ` set as) < t"
       using card_image_le order_le_less_trans by blast
     hence d:"card (sketch_rv' \<omega>) = card ((\<lambda>x. tr_hash x \<omega>) ` (set as))"
       by (simp add:sketch_rv'_def card_least)
     have "card (sketch_rv' \<omega>) < t"
       by (metis List.finite_set  c d card_image_le  order_le_less_trans)
     hence "estimate' (sketch_rv' \<omega>) = card (sketch_rv' \<omega>)" by (simp add:estimate'_def)
     hence "card (sketch_rv' \<omega>) \<noteq> real_of_rat (F 0 as)"
       using a \<delta>_range by simp 
         (metis abs_zero cancel_comm_monoid_add_class.diff_cancel of_nat_less_0_iff pos_prod_lt zero_less_of_rat_iff)
     hence "card (sketch_rv' \<omega>) \<noteq> card (set as)"
       using m_def m_eq_F_0 by linarith
     hence "\<not>inj_on (\<lambda>x. tr_hash x \<omega>) (set as)"
       using card_image d by auto
     moreover have "tr_hash x \<omega> \<le> real p" if a:"x \<in> set as" for x
     proof -
       have "hash x \<omega> < p" 
         using hash_range as_lt_p a b by (simp add:mod_ring_carr M_def)
       thus "tr_hash x \<omega> \<le> real p" using truncate_down_le by (simp add:tr_hash_def)
     qed
    ultimately show "\<omega> \<in> {\<omega>. \<exists>x \<in> set as. \<exists>y \<in> set as. x \<noteq> y \<and> tr_hash x \<omega> \<le> real p \<and> tr_hash x \<omega> = tr_hash y \<omega>}"
      by (simp add:inj_on_def, blast)
   qed
   also have "... \<le> (5/2) * (real (card (set as)))\<^sup>2 * (real p)\<^sup>2 * 2 powr - real r / (real p)\<^sup>2 + 1 / real p"
     using p_gt_0 by (intro collision_prob, auto)
   also have "... = (5/2) * (real (card (set as)))\<^sup>2 * 2 powr (- real r) + 1 / real p"
     using p_gt_0 by (simp add:ac_simps power2_eq_square)
   also have "... \<le> (5/2) * (real t)\<^sup>2 * 2 powr (-real r) + 1 / real p"
     using False by (intro add_mono mult_right_mono mult_left_mono power_mono, auto)
   also have "... \<le> 1/6 + 1/6"
     using t_r_bound p_ge_18 by (intro add_mono, simp_all)
   also have "... \<le> 1/3" by simp
   finally show ?thesis by simp
 qed
 
 (* Amplification step: with probability at least 1 - \<epsilon> (over \<Omega>\<^sub>0), the median of the s
    per-index estimates deviates from F 0 as by at most \<delta> * F 0 as.
    The proof first relates the float/rational quantities (sketch_rv, estimate) to their
    real-valued counterparts (sketch_rv', estimate'), then applies the median bound to the
    real-valued estimates and finally transfers the statement back to the rationals. *)
 private lemma median_bounds:
   "\<P>(\<omega> in measure_pmf \<Omega>\<^sub>0. \<bar>median s (\<lambda>i. estimate (sketch_rv (\<omega> i))) - F 0 as\<bar> \<le> \<delta> * F 0 as) \<ge> 1 - real_of_rat \<epsilon>"
 proof -
   (* real_of_float is strictly monotone, so (via least_mono_commute) the real-valued sketch
      is the image of the float-valued sketch under real_of_float. *)
   have "strict_mono_on A real_of_float" for A by (meson less_float.rep_eq strict_mono_onI)
   hence real_g_2: "\<And>\<omega>.  sketch_rv' \<omega> = real_of_float ` sketch_rv \<omega>" 
     by (simp add: sketch_rv'_def sketch_rv_def tr_hash_def least_mono_commute image_comp)
 
   (* real_of_float is injective, hence both sketches have the same cardinality. *)
   moreover have "inj_on real_of_float A" for A
     using  real_of_float_inject by (simp add:inj_on_def)
   ultimately have card_eq: "\<And>\<omega>. card (sketch_rv \<omega>) = card (sketch_rv' \<omega>)" 
     using real_g_2 by (auto intro!: card_image[symmetric])
 
   (* When the sketch holds at least t elements it is finite and non-empty (t > 0), so Max
      commutes with the monotone embedding real_of_float. *)
   have "Max (sketch_rv' \<omega>) = real_of_float (Max (sketch_rv \<omega>))" if a:"card (sketch_rv' \<omega>) \<ge> t" for \<omega> 
   proof -
     have "mono real_of_float"
       using less_eq_float.rep_eq mono_def by blast
     moreover have "finite (sketch_rv \<omega>)"
       by (simp add:sketch_rv_def least_def)
     moreover have " sketch_rv \<omega> \<noteq> {}"
       using card_eq[symmetric] card_gt_0_iff t_gt_0 a by (simp, force)  
     ultimately show ?thesis
       by (subst mono_Max_commute[where f="real_of_float"], simp_all add:real_g_2)
   qed
   (* Consequently the real-valued estimate is the real embedding of the rational estimate. *)
   hence real_g: "\<And>\<omega>. estimate' (sketch_rv' \<omega>) = real_of_rat (estimate (sketch_rv \<omega>))"
     by (simp add:estimate_def estimate'_def card_eq of_rat_divide of_rat_mult of_rat_add real_of_rat_of_float)
 
   (* Premise 1 for the median bound: the estimates at indices {0..<s} are independent. *)
   have indep: "prob_space.indep_vars (measure_pmf \<Omega>\<^sub>0) (\<lambda>_. borel) (\<lambda>i \<omega>. estimate' (sketch_rv' (\<omega> i))) {0..<s}"
     unfolding \<Omega>\<^sub>0_def
     by (rule indep_vars_restrict_intro', auto simp add:restrict_dfl_def lessThan_atLeast0)
 
   (* Premise 2: s is at least -18 * ln \<epsilon> (s is defined via a ceiling, see s_def). *)
   moreover have "- (18 * ln (real_of_rat \<epsilon>)) \<le> real s"
     using of_nat_ceiling by (simp add:s_def) blast
 
   (* Premise 3: each individual estimate misses the target interval with probability at
      most 1/3; obtained from estimate'_bounds by slicing the product distribution. *)
   moreover have "i < s \<Longrightarrow> measure \<Omega>\<^sub>0 {\<omega>. of_rat \<delta> * of_rat (F 0 as) < \<bar>estimate' (sketch_rv' (\<omega> i)) - of_rat (F 0 as)\<bar>} \<le> 1/3"
     for i
     using estimate'_bounds unfolding \<Omega>\<^sub>0_def M_def
     by (subst prob_prod_pmf_slice, simp_all)
  
   (* Apply median_bound_2 to the real-valued estimates. *)
   ultimately have "1-real_of_rat \<epsilon> \<le> \<P>(\<omega> in measure_pmf \<Omega>\<^sub>0.
       \<bar>median s (\<lambda>i. estimate' (sketch_rv' (\<omega> i))) - real_of_rat (F 0 as)\<bar> \<le>  real_of_rat \<delta> * real_of_rat (F 0 as))"
     using \<epsilon>_range prob_space_measure_pmf
     by (intro prob_space.median_bound_2) auto
   (* Transfer the event back to rationals using real_g and median_rat. *)
   also have "... = \<P>(\<omega> in measure_pmf \<Omega>\<^sub>0. 
       \<bar>median s (\<lambda>i. estimate (sketch_rv (\<omega> i))) - F 0 as\<bar> \<le>  \<delta> * F 0 as)"
     using s_gt_0 median_rat[symmetric] real_g by (intro arg_cong2[where f="measure"]) 
       (simp_all add:of_rat_diff[symmetric] of_rat_mult[symmetric] of_rat_less_eq)
   finally show "\<P>(\<omega> in measure_pmf \<Omega>\<^sub>0. \<bar>median s (\<lambda>i. estimate (sketch_rv (\<omega> i))) - F 0 as\<bar> \<le> \<delta> * F 0 as) \<ge> 1-real_of_rat \<epsilon>"
     by blast
 qed
 
 (* Correctness inside the local context: a sample from `result` deviates from F 0 as by at
    most \<delta> * F 0 as with probability at least 1 - \<epsilon>.
    The proof rewrites `result` as \<Omega>\<^sub>0 bound to the median of the per-index estimates and
    then appeals to median_bounds. *)
 lemma f0_alg_correct':
   "\<P>(\<omega> in measure_pmf result. \<bar>\<omega> - F 0 as\<bar> \<le> \<delta> * F 0 as) \<ge> 1 - of_rat \<epsilon>"
 proof -
   (* On a state whose last component is the restricted sketch function, f0_result returns
      exactly the median of the estimates. *)
   have f0_result_elim: "\<And>x. f0_result (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i)) =
     return_pmf (median s (\<lambda>i. estimate (sketch_rv (x i))))"
     by (simp add:estimate_def, rule median_cong, simp)
  
   (* Unfold result via f0_alg_sketch, turn map_pmf into a bind, and collapse the two binds. *)
   have "result = map_pmf (\<lambda>x. (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i))) \<Omega>\<^sub>0 \<bind> f0_result"
     by (subst result_def, subst f0_alg_sketch, simp)
   also have "... = \<Omega>\<^sub>0 \<bind> (\<lambda>x. return_pmf (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i))) \<bind> f0_result"
     by (simp add:t_def p_def r_def s_def map_pmf_def)
   also have "... = \<Omega>\<^sub>0 \<bind> (\<lambda>x. return_pmf (median s (\<lambda>i. estimate (sketch_rv (x i)))))"
     by (subst bind_assoc_pmf, subst bind_return_pmf, subst f0_result_elim)  simp
   finally have a:"result =  \<Omega>\<^sub>0 \<bind> (\<lambda>x. return_pmf (median s (\<lambda>i. estimate (sketch_rv (x i)))))"
     by simp
 
   (* With result in this form the claim is median_bounds (bind/return folded to map_pmf). *)
   show ?thesis
     using median_bounds by (simp add: a map_pmf_def[symmetric])
 qed
 
 (* Post-composition preserves image inclusion: if the image of A under g lies inside the
    image of B under h, the same holds after applying f to both sides. *)
 private lemma f_subset:
   assumes "g ` A \<subseteq> h ` B"
   shows "(\<lambda>x. f (g x)) ` A \<subseteq> (\<lambda>x. f (h x)) ` B"
 proof -
   (* Monotonicity of image applied to the assumption ... *)
   have "f ` (g ` A) \<subseteq> f ` (h ` B)"
     by (rule image_mono[OF assms])
   (* ... and nested images are images of the composition. *)
   thus ?thesis
     by (simp only: image_image)
 qed
 
 (* Space bound inside the local context: almost surely, the encoded state reached after
    folding f0_update over `as` (starting from f0_init \<delta> \<epsilon> n) uses at most
    f0_space_usage (n, \<epsilon>, \<delta>) bits.
    Outline: (a) bound the encoding of a single truncated float, (d)-(f) bound the encoded
    sketches and hash polynomials, then sum up the components of the encoded state and
    compare with f0_space_usage; finally lift the bound from \<Omega>\<^sub>0 to \<Omega> via f0_alg_sketch. *)
 lemma f0_exact_space_usage':
   defines "\<Omega> \<equiv> fold (\<lambda>a state. state \<bind> f0_update a) as (f0_init \<delta> \<epsilon> n)"
   shows "AE \<omega> in \<Omega>. bit_count (encode_f0_state \<omega>) \<le> f0_space_usage (n, \<epsilon>, \<delta>)"
 proof -
   
   have log_2_4: "log 2 4 = 2" 
     by (metis log2_of_power_eq mult_2 numeral_Bit0 of_nat_numeral power2_eq_square)
 
   (* (a) Encoding a value y < p, truncated to r bits, costs at most
      12 + 4 r + 2 log2 (log2 (n + 13)) bits. Case split on y \<ge> 1 versus y = 0. *)
   have a: "bit_count (F\<^sub>e (float_of (truncate_down r y))) \<le> 
     ereal (12 + 4 * real r + 2 * log 2 (log 2 (n+13)))" if a_1:"y \<in> {..<p}" for y
   proof (cases "y \<ge> 1")
     case True
 
     have aux_1: " 0 < 2 + log 2 (real y)" 
       using True by (intro add_pos_nonneg, auto)
     have aux_2: "0 < 2 + log 2 (real p)"
       using p_gt_1 by (intro add_pos_nonneg, auto)
 
     (* Start from the generic bound truncate_float_bit_count, then bound y by p and p in
        terms of n (p_le_n), and simplify the nested logarithms. *)
     have "bit_count (F\<^sub>e (float_of (truncate_down r y))) \<le> 
       ereal (10 + 4 * real r + 2 * log 2 (2 + \<bar>log 2 \<bar>real y\<bar>\<bar>))"
       by (rule truncate_float_bit_count)
     also have "... = ereal (10 + 4 * real r + 2 * log 2 (2 + (log 2 (real y))))"
       using True by simp
     also have "... \<le> ereal (10 + 4 * real r + 2 * log 2 (2 + log 2 p))"
       using aux_1 aux_2 True p_gt_0 a_1 by simp
     also have "... \<le> ereal (10 + 4 * real r + 2 * log 2 (log 2 4 + log 2 (2 * n + 40)))"
       using log_2_4 p_le_n p_gt_0
       by (intro ereal_mono add_mono mult_left_mono log_mono of_nat_mono add_pos_nonneg, auto)
     also have "... = ereal (10 + 4 * real r + 2 * log 2 (log 2 (8 * n + 160)))"
       by (simp add:log_mult[symmetric])
     also have "... \<le> ereal (10 + 4 * real r + 2 * log 2 (log 2 ((n+13) powr 2)))"
       by (intro ereal_mono add_mono mult_left_mono log_mono of_nat_mono add_pos_nonneg)
        (auto simp add:power2_eq_square algebra_simps)
     also have "... = ereal (10 +  4 * real r + 2 * log 2 (log 2 4 * log 2 (n + 13)))"
       by (subst log_powr, simp_all add:log_2_4)
     also have "... = ereal (12 +  4 * real r + 2 * log 2 (log 2 (n + 13)))"
       by (subst log_mult, simp_all add:log_2_4)
     finally show ?thesis by simp
   next
     case False
     hence "y = 0" using a_1 by simp
     then show ?thesis by (simp add:float_bit_count_zero)
   qed
 
   (* Main bound for a fixed tuple x of hash functions (one element of `space` per index
      below s, undefined elsewhere). *)
   have "bit_count (encode_f0_state (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i))) \<le> 
         f0_space_usage (n, \<epsilon>, \<delta>)" if b: "x \<in> {..<s} \<rightarrow>\<^sub>E space" for x
   proof -
     have c: "x \<in> extensional {..<s}" using b by (simp add:PiE_def) 
 
     (* (d) Every sketch element is the truncation of some value below p, because hash values
        of stream elements stay below p (hash_range, as_lt_p). *)
     have d: "sketch_rv (x y) \<subseteq> (\<lambda>k. float_of (truncate_down r k)) ` {..<p} "
       if d_1: "y < s" for y
     proof -
       have "sketch_rv (x y) \<subseteq> (\<lambda>xa. float_of (truncate_down r (hash xa (x y)))) ` set as"
         using least_subset by (auto simp add:sketch_rv_def tr_hash_def) 
       also have "... \<subseteq> (\<lambda>k. float_of (truncate_down r (real k))) ` {..<p}"
         using b hash_range as_lt_p d_1
         by (intro f_subset[where f="\<lambda>x. float_of (truncate_down r (real x))"] image_subsetI)
          (simp add: PiE_iff mod_ring_carr)
       finally show ?thesis
         by simp
     qed
 
     (* (e) Each sketch is finite, has at most t elements, and each element obeys bound (a);
        set_bit_count_est turns this into a bound on the encoded set. *)
     have "\<And>y. y < s \<Longrightarrow> finite (sketch_rv (x y))"
       unfolding sketch_rv_def by (rule finite_subset[OF least_subset], simp)
     moreover have card_sketch: "\<And>y. y < s \<Longrightarrow> card (sketch_rv (x y)) \<le> t "
       by (simp add:sketch_rv_def card_least)
     moreover have "\<And>y z. y < s \<Longrightarrow> z \<in> sketch_rv (x y) \<Longrightarrow> 
       bit_count (F\<^sub>e z) \<le> ereal (12 + 4 * real r + 2 * log 2 (log 2 (real n + 13)))"
       using a d by auto
     ultimately have e: "\<And>y. y < s \<Longrightarrow> bit_count (S\<^sub>e F\<^sub>e (sketch_rv (x y))) 
       \<le> ereal (real t) * (ereal (12 + 4 * real r + 2 * log 2 (log 2 (real (n + 13)))) + 1) + 1"
       using float_encoding by (intro set_bit_count_est, auto)
 
     (* (f) Bound on the encoding of each hash polynomial (bounded_degree_polynomial_bit_count). *)
     have f: "\<And>y. y < s \<Longrightarrow> bit_count (P\<^sub>e p 2 (x y)) \<le> ereal (real 2 * (log 2 (real p) + 1))"
       using p_gt_1 b
       by (intro bounded_degree_polynomial_bit_count) (simp_all add:space_def PiE_def Pi_def)
 
     (* The encoded state is the sum of the encodings of s, t, p, r, the hash polynomials and
        the sketches. *)
     have "bit_count (encode_f0_state (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i))) =
       bit_count (N\<^sub>e s) + bit_count (N\<^sub>e t) +  bit_count (N\<^sub>e p) + bit_count (N\<^sub>e r) +
       bit_count (([0..<s] \<rightarrow>\<^sub>e P\<^sub>e p 2) x) +
       bit_count (([0..<s] \<rightarrow>\<^sub>e S\<^sub>e F\<^sub>e) (\<lambda>i\<in>{..<s}. sketch_rv (x i)))"
       by (simp add:encode_f0_state_def dependent_bit_count lessThan_atLeast0
         s_def[symmetric] t_def[symmetric] p_def[symmetric] r_def[symmetric] ac_simps)
     (* Bound each summand: exp_golomb_bit_count for the naturals, (f) and (e) for the
        function-valued components. *)
     also have "... \<le> ereal (2* log 2 (real s + 1) + 1) + ereal  (2* log 2 (real t + 1) + 1)
       + ereal (2* log 2 (real p + 1) + 1) + ereal (2 * log 2 (real r + 1) + 1)
       + (ereal (real s) * (ereal (real 2 * (log 2 (real p) + 1)))) 
       + (ereal (real s) * ((ereal (real t) * 
             (ereal (12 + 4 * real r + 2 * log 2 (log 2 (real (n + 13)))) + 1) + 1)))"
       using c e f
       by (intro add_mono exp_golomb_bit_count fun_bit_count_est[where xs="[0..<s]", simplified])
        (simp_all add:lessThan_atLeast0)
     also have "... = ereal ( 4 + 2 * log 2 (real s + 1) + 2 * log 2 (real t + 1) + 
       2 * log 2 (real p + 1) + 2 * log 2 (real r + 1) + real s * (3 + 2 * log 2 (real p) + 
       real t * (13 + (4 * real r + 2 * log 2 (log 2 (real n + 13))))))"
       by (simp add:algebra_simps)
     (* Replace p by its upper bound in terms of n (p_le_n) and split log2 (2 * _). *)
     also have "... \<le> ereal ( 4 + 2 * log 2 (real s + 1)  + 2 * log 2 (real t + 1) + 
       2 * log 2 (2 * (21 + real n)) + 2 * log 2 (real r + 1) + real s * (3 + 2 * log 2 (2 * (21 + real n)) + 
       real t * (13 + (4 * real r + 2 * log 2 (log 2 (real n + 13))))))"
       using p_le_n p_gt_0
       by (intro ereal_mono add_mono mult_left_mono, auto)
     also have "... =  ereal (6 + 2 * log 2 (real s + 1) + 2 * log 2 (real t + 1) + 
       2 * log 2 (21 + real n) + 2 * log 2 (real r + 1) + real s * (5 + 2 * log 2 (21 + real n) + 
       real t * (13 + (4 * real r + 2 * log 2 (log 2 (real n + 13))))))"
       by (subst (1 2) log_mult, auto)
     (* The resulting expression is bounded by f0_space_usage after unfolding it. *)
     also have "... \<le> f0_space_usage (n, \<epsilon>, \<delta>)"
       by (simp add:s_def[symmetric] r_def[symmetric] t_def[symmetric] Let_def)
        (simp add:algebra_simps)
     finally show "bit_count (encode_f0_state (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i))) \<le> 
         f0_space_usage (n, \<epsilon>, \<delta>)" by simp
   qed
   (* Lift the bound to every element in the support of \<Omega>\<^sub>0, then to the support of \<Omega>
      (whose elements are images of \<Omega>\<^sub>0 samples, by f0_alg_sketch), and conclude the
      almost-everywhere statement. *)
   hence "\<And>x. x \<in> set_pmf \<Omega>\<^sub>0 \<Longrightarrow>
          bit_count (encode_f0_state (s, t, p, r, x, \<lambda>i\<in>{..<s}. sketch_rv (x i)))  \<le> ereal (f0_space_usage (n, \<epsilon>, \<delta>))"
     by (simp add:\<Omega>\<^sub>0_def set_prod_pmf del:f0_space_usage.simps)
   hence "\<And>y. y \<in> set_pmf \<Omega> \<Longrightarrow> bit_count (encode_f0_state y) \<le> ereal (f0_space_usage (n, \<epsilon>, \<delta>))"
     by (simp add: \<Omega>_def f0_alg_sketch del:f0_space_usage.simps f0_init.simps)
      (metis (no_types, lifting) image_iff pmf.set_map)
   thus ?thesis
     by (simp add: AE_measure_pmf_iff del:f0_space_usage.simps)
 qed
 
 end
 
 text \<open>Main results of this section:\<close>
 
 (* Main correctness theorem: for \<epsilon>, \<delta> in the open interval (0,1) and a stream `as` whose
    elements are all below n, the output of init / fold update / result deviates from
    F 0 as by at most \<delta> * F 0 as with probability at least 1 - \<epsilon>.
    This is f0_alg_correct' instantiated with the three explicit assumptions. *)
 theorem f0_alg_correct:
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "\<delta> \<in> {0<..<1}"
   assumes "set as \<subseteq> {..<n}"
   defines "\<Omega> \<equiv> fold (\<lambda>a state. state \<bind> f0_update a) as (f0_init \<delta> \<epsilon> n) \<bind> f0_result"
   shows "\<P>(\<omega> in measure_pmf \<Omega>. \<bar>\<omega> - F 0 as\<bar> \<le> \<delta> * F 0 as) \<ge> 1 - of_rat \<epsilon>"
   using f0_alg_correct'[OF assms(1-3)] unfolding \<Omega>_def by blast
 
 (* Main space-usage theorem: under the same assumptions on \<epsilon>, \<delta> and `as`, the encoded
    state after processing the stream almost surely needs at most f0_space_usage (n, \<epsilon>, \<delta>)
    bits. This is f0_exact_space_usage' instantiated with the three explicit assumptions. *)
 theorem f0_exact_space_usage:
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "\<delta> \<in> {0<..<1}"
   assumes "set as \<subseteq> {..<n}"
   defines "\<Omega> \<equiv> fold (\<lambda>a state. state \<bind> f0_update a) as (f0_init \<delta> \<epsilon> n)"
   shows "AE \<omega> in \<Omega>. bit_count (encode_f0_state \<omega>) \<le> f0_space_usage (n, \<epsilon>, \<delta>)"
   using f0_exact_space_usage'[OF assms(1-3)] unfolding \<Omega>_def by blast
 
 (* Asymptotic space complexity of the F0 algorithm.
    With respect to the product filter ?F (n tends to infinity, \<epsilon> and \<delta> tend to 0
    from the right), f0_space_usage is in
      O(ln (1/\<epsilon>) * (ln n + 1/\<delta>^2 * (ln (ln n) + ln (1/\<delta>)))).
    Proof outline: every summand of f0_space_usage is shown separately to be in
    O[?F](g), where g is the bound written in terms of projections of the
    parameter triple; the pieces are then combined with sum_in_bigo. *)
 theorem f0_asymptotic_space_complexity:
   "f0_space_usage \<in> O[at_top \<times>\<^sub>F at_right 0 \<times>\<^sub>F at_right 0](\<lambda>(n, \<epsilon>, \<delta>). ln (1 / of_rat \<epsilon>) * 
   (ln (real n) + 1 / (of_rat \<delta>)\<^sup>2 * (ln (ln (real n)) + ln (1 / of_rat \<delta>))))"
   (is "_ \<in> O[?F](?rhs)")
 proof -
   (* Projections of the parameter triple, and the quantities t, s, r written as
      functions of the triple; they are folded back into f0_space_usage in the
      final step of the proof. *)
   define n_of :: "nat \<times> rat \<times> rat \<Rightarrow> nat" where "n_of = (\<lambda>(n, \<epsilon>, \<delta>). n)"
   define \<epsilon>_of :: "nat \<times> rat \<times> rat \<Rightarrow> rat" where "\<epsilon>_of = (\<lambda>(n, \<epsilon>, \<delta>). \<epsilon>)"
   define \<delta>_of :: "nat \<times> rat \<times> rat \<Rightarrow> rat" where "\<delta>_of = (\<lambda>(n, \<epsilon>, \<delta>). \<delta>)"
   define t_of where "t_of = (\<lambda>x. nat \<lceil>80 / (real_of_rat (\<delta>_of x))\<^sup>2\<rceil>)"
   define s_of where "s_of = (\<lambda>x. nat \<lceil>-(18 * ln (real_of_rat (\<epsilon>_of x)))\<rceil>)"
   define r_of where "r_of = (\<lambda>x. nat (4 * \<lceil>log 2 (1 / real_of_rat (\<delta>_of x))\<rceil> + 23))"
 
   (* g is the claimed bound ?rhs, expressed through the projections. *)
   define g where "g = (\<lambda>x. ln (1 / of_rat (\<epsilon>_of x)) * (ln (real (n_of x)) + 
     1 / (of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / of_rat (\<delta>_of x)))))"
 
   (* evt: to show that P holds eventually along ?F it suffices to prove P x for
      all x whose \<delta>- and \<epsilon>-components are positive, whose reciprocals 1/\<delta> and 1/\<epsilon>
      are at least the freely chosen real thresholds \<delta> and \<epsilon>, and whose
      n-component is at least the threshold n. *)
   have evt: "(\<And>x. 
     0 < real_of_rat (\<delta>_of x) \<and> 0 < real_of_rat (\<epsilon>_of x) \<and> 
     1/real_of_rat (\<delta>_of x) \<ge> \<delta> \<and> 1/real_of_rat (\<epsilon>_of x) \<ge> \<epsilon> \<and>
     real (n_of x) \<ge> n \<Longrightarrow> P x) \<Longrightarrow> eventually P ?F"  (is "(\<And>x. ?prem x \<Longrightarrow> _) \<Longrightarrow> _")
     for \<delta> \<epsilon> n P
     apply (rule eventually_mono[where P="?prem" and Q="P"])
     apply (simp add:\<epsilon>_of_def case_prod_beta' \<delta>_of_def n_of_def)
      apply (intro eventually_conj eventually_prod1' eventually_prod2' 
         sequentially_inf eventually_at_right_less inv_at_right_0_inf)
     by (auto simp add:prod_filter_eq_bot)
 
   (* Small arithmetic helpers used when discharging side conditions below. *)
   have exp_pos: "exp k \<le> real x \<Longrightarrow> x > 0" for k x
     using exp_gt_zero gr0I by force 
 
   have exp_gt_1: "exp 1 \<ge> (1::real)"
     by simp
 
   (* Facts 1-4: the constant function 1 is dominated by ln (1/\<epsilon>), by ln (1/\<delta>),
      by ln (ln n) + ln (1/\<delta>), and by 1/\<delta>^2, respectively. *)
   have 1: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     by (auto intro!:landau_o.big_mono evt[where \<epsilon>="exp 1"] iffD2[OF ln_ge_iff] simp add:abs_ge_iff)
 
   have 2: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<delta>_of x)))" 
     by (auto intro!:landau_o.big_mono evt[where \<delta>="exp 1"] iffD2[OF ln_ge_iff] simp add:abs_ge_iff)
 
   have 3: " (\<lambda>x. 1) \<in> O[?F](\<lambda>x. ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x)))"
     using exp_pos
     by (intro landau_sum_2 2 evt[where n="exp 1" and \<delta>="1"] ln_ge_zero  iffD2[OF ln_ge_iff], auto)
   have 4: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)" 
     using one_le_power
     by (intro landau_o.big_mono evt[where \<delta>="1"], auto simp add:power_one_over[symmetric])
 
   (* Fact 5: t_of is in O(1/\<delta>^2).  Fact 6: s_of is in O(ln (1/\<epsilon>)). *)
   have "(\<lambda>x. 80 * (1 / (real_of_rat (\<delta>_of x))\<^sup>2)) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     by (subst landau_o.big.cmult_in_iff, auto)
   hence 5: "(\<lambda>x. real (t_of x)) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     unfolding  t_of_def 
     by (intro landau_real_nat landau_ceil 4, auto)
 
   have "(\<lambda>x. ln (real_of_rat (\<epsilon>_of x))) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     by (intro landau_o.big_mono evt[where \<epsilon>="1"], auto simp add:ln_div)
   hence 6: "(\<lambda>x. real (s_of x)) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     unfolding s_of_def by (intro landau_nat_ceil 1, simp)
 
   (* Facts 7, 8: the constant 1 is dominated by ln n and by the second factor of g. *)
   have 7: " (\<lambda>x. 1) \<in> O[?F](\<lambda>x. ln (real (n_of x)))"
     using exp_pos by (auto intro!: landau_o.big_mono evt[where n="exp 1"] iffD2[OF ln_ge_iff] simp: abs_ge_iff)
 
   have 8:" (\<lambda>_. 1) \<in> 
     O[?F](\<lambda>x. ln (real (n_of x)) + 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
     using order_trans[OF exp_gt_1] exp_pos
     by (intro landau_sum_1 7 evt[where n="exp 1" and \<delta>="1"] ln_ge_zero  iffD2[OF ln_ge_iff] 
         mult_nonneg_nonneg add_nonneg_nonneg) auto
 
   (* Facts 9-13: the constant and each of the logarithmic summands
      (in s, t, n and r) are in O[?F](g). *)
   have "(\<lambda>x. ln (real (s_of x) + 1)) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     by (intro landau_ln_3 sum_in_bigo 6 1, simp)
 
   hence 9: "(\<lambda>x. log 2 (real (s_of x) + 1)) \<in> O[?F](g)"
     unfolding g_def by (intro landau_o.big_mult_1 8, auto simp:log_def)
   have 10: "(\<lambda>x. 1) \<in> O[?F](g)"
     unfolding g_def by (intro landau_o.big_mult_1 8 1)
 
   have "(\<lambda>x. ln (real (t_of x) + 1)) \<in> 
     O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
     using 5 by (intro landau_o.big_mult_1 3 landau_ln_3 sum_in_bigo 4, simp_all)
   hence " (\<lambda>x. log 2 (real (t_of x) + 1)) \<in> 
   O[?F](\<lambda>x. ln (real (n_of x)) + 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
     using order_trans[OF exp_gt_1] exp_pos
     by (intro landau_sum_2  evt[where n="exp 1" and \<delta>="1"] ln_ge_zero  iffD2[OF ln_ge_iff] 
         mult_nonneg_nonneg add_nonneg_nonneg) (auto simp add:log_def)
   hence 11: "(\<lambda>x. log 2 (real (t_of x) + 1)) \<in> O[?F](g)"
     unfolding g_def  by (intro landau_o.big_mult_1' 1, auto)
   have " (\<lambda>x. 1) \<in> O[?F](\<lambda>x. real (n_of x))" 
     by (intro landau_o.big_mono evt[where n="1"], auto)
   hence "(\<lambda>x. ln (real (n_of x) + 21)) \<in> O[?F](\<lambda>x. ln (real (n_of x)))" 
     by (intro landau_ln_2[where a="2"] evt[where n="2"] sum_in_bigo, auto)
 
   hence 12: "(\<lambda>x. log 2 (real (n_of x) + 21)) \<in> O[?F](g)"
     unfolding g_def using exp_pos order_trans[OF exp_gt_1]
     by (intro landau_o.big_mult_1' 1 landau_sum_1  evt[where n="exp 1" and \<delta>="1"] 
         ln_ge_zero  iffD2[OF ln_ge_iff] mult_nonneg_nonneg add_nonneg_nonneg)  (auto simp add:log_def)
 
   have "(\<lambda>x. ln (1 / real_of_rat (\<delta>_of x))) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)" 
     by (intro landau_ln_3 evt[where \<delta>="1"] landau_o.big_mono) 
       (auto simp add:power_one_over[symmetric] self_le_power)
   hence " (\<lambda>x. real (nat (4*\<lceil>log 2 (1 / real_of_rat (\<delta>_of x))\<rceil>+23))) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     using 4 by (auto intro!: landau_real_nat sum_in_bigo landau_ceil simp:log_def)
   hence " (\<lambda>x. ln (real (r_of x) + 1)) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     unfolding r_of_def
     by (intro landau_ln_3 sum_in_bigo 4, auto)
   hence " (\<lambda>x. log 2 (real (r_of x) + 1)) \<in> 
     O[?F](\<lambda>x. (1 / (real_of_rat (\<delta>_of x))\<^sup>2) * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
     by (intro landau_o.big_mult_1 3, simp add:log_def)
   hence " (\<lambda>x. log 2 (real (r_of x) + 1)) \<in> 
     O[?F](\<lambda>x. ln (real (n_of x)) + 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
     using exp_pos order_trans[OF exp_gt_1]
     by (intro landau_sum_2 evt[where n="exp 1" and \<delta>="1"] ln_ge_zero  
         iffD2[OF ln_ge_iff] add_nonneg_nonneg mult_nonneg_nonneg) (auto)
   hence 13: "(\<lambda>x. log 2 (real (r_of x) + 1)) \<in> O[?F](g)"
     unfolding g_def  by (intro landau_o.big_mult_1' 1, auto)
   have 14: "(\<lambda>x. 1) \<in> O[?F](\<lambda>x. real (n_of x))" 
     by (intro landau_o.big_mono evt[where n="1"], auto)
 
   (* Towards fact 15: bound the iterated logarithm of n and r_of by
      ln (ln n) + ln (1/\<delta>), then multiply with the bound 5 for t_of. *)
   have "(\<lambda>x. ln (real (n_of x) + 13)) \<in> O[?F](\<lambda>x. ln (real (n_of x)))" 
     using 14 by (intro landau_ln_2[where a="2"]  evt[where n="2"] sum_in_bigo, auto)
 
   hence "(\<lambda>x. ln (log 2 (real (n_of x) + 13))) \<in> O[?F](\<lambda>x. ln (ln (real (n_of x))))"
     using exp_pos by (intro landau_ln_2[where a="2"] iffD2[OF ln_ge_iff] evt[where n="exp 2"])
         (auto simp add:log_def)
 
   hence "(\<lambda>x. log 2 (log 2 (real (n_of x) + 13))) \<in> O[?F](\<lambda>x. ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x)))"
     using exp_pos by (intro landau_sum_1 evt[where n="exp 1" and \<delta>="1"] ln_ge_zero  iffD2[OF ln_ge_iff])
      (auto simp add:log_def)
 
   moreover have  "(\<lambda>x. real (r_of x)) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<delta>_of x)))"
     unfolding r_of_def using 2
     by (auto intro!: landau_real_nat sum_in_bigo landau_ceil simp:log_def)
   hence "(\<lambda>x. real (r_of x)) \<in> O[?F](\<lambda>x. ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x)))"
     using exp_pos 
     by (intro landau_sum_2 evt[where n="exp 1" and \<delta>="1"] ln_ge_zero  iffD2[OF ln_ge_iff], auto)
 
   ultimately have 15:" (\<lambda>x. real (t_of x) * (13 + 4 * real (r_of x) + 2 * log 2 (log 2 (real (n_of x) + 13))))
       \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
     using 5 3 
     by (intro landau_o.mult sum_in_bigo, auto)
 
   (* The inner factor of the s-weighted term: both summands of the bound are
      eventually non-negative, so landau_sum can add the two estimates. *)
   have "(\<lambda>x. 5 + 2 * log 2 (21 + real (n_of x)) + real (t_of x) * (13 + 4 * real (r_of x) + 2 * log 2 (log 2 (real (n_of x) + 13))))
       \<in> O[?F](\<lambda>x. ln (real (n_of x)) + 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x))))"
   proof -
     have "\<forall>\<^sub>F x in ?F. 0 \<le> ln (real (n_of x))" 
       by (intro evt[where n="1"] ln_ge_zero, auto)
     moreover have "\<forall>\<^sub>F x in ?F. 0 \<le> 1 / (real_of_rat (\<delta>_of x))\<^sup>2 * (ln (ln (real (n_of x))) + ln (1 / real_of_rat (\<delta>_of x)))"
       using exp_pos
       by (intro evt[where n="exp 1" and \<delta>="1"] mult_nonneg_nonneg add_nonneg_nonneg 
           ln_ge_zero iffD2[OF ln_ge_iff]) auto
     moreover have " (\<lambda>x. ln (21 + real (n_of x))) \<in> O[?F](\<lambda>x. ln (real (n_of x)))" 
       using 14 by (intro landau_ln_2[where a="2"] sum_in_bigo evt[where n="2"], auto)
     hence "(\<lambda>x. 5 + 2 * log 2 (21 + real (n_of x))) \<in> O[?F](\<lambda>x. ln (real (n_of x)))"
       using 7  by (intro sum_in_bigo, auto simp add:log_def)
     ultimately show ?thesis
       using 15 by (rule landau_sum)
   qed
 
   (* Fact 16: multiplying with the bound 6 for s_of yields the dominant term. *)
   hence 16: "(\<lambda>x. real (s_of x) * (5 + 2 * log 2 (21 + real (n_of x)) + real (t_of x) *
     (13 + 4 * real (r_of x) + 2 * log 2 (log 2 (real (n_of x) + 13)))))  \<in> O[?F](g)"
     unfolding g_def
     by (intro landau_o.mult 6, auto)
 
   (* Assemble: rewrite f0_space_usage via the projections, fold s_of / t_of /
      r_of into it, sum up facts 9-13 and 16, and translate g back to ?rhs. *)
   have "f0_space_usage = (\<lambda>x. f0_space_usage (n_of x, \<epsilon>_of x, \<delta>_of x))"
     by (simp add:case_prod_beta' n_of_def \<epsilon>_of_def \<delta>_of_def)
   also have "... \<in>  O[?F](g)"
     using 9 10 11 12 13 16
     by (simp add:fun_cong[OF s_of_def[symmetric]] fun_cong[OF t_of_def[symmetric]] 
         fun_cong[OF r_of_def[symmetric]] Let_def) (intro sum_in_bigo, auto)
   also have "... = O[?F](?rhs)"
     by (simp add:case_prod_beta' g_def n_of_def \<epsilon>_of_def \<delta>_of_def)
   finally show ?thesis
     by simp
 qed
 
 end
diff --git a/thys/Frequency_Moments/Frequency_Moment_2.thy b/thys/Frequency_Moments/Frequency_Moment_2.thy
--- a/thys/Frequency_Moments/Frequency_Moment_2.thy
+++ b/thys/Frequency_Moments/Frequency_Moment_2.thy
@@ -1,721 +1,721 @@
 section \<open>Frequency Moment $2$\<close>
 
 theory Frequency_Moment_2
   imports
     Universal_Hash_Families.Carter_Wegman_Hash_Family
     Equivalence_Relation_Enumeration.Equivalence_Relation_Enumeration
     Landau_Ext
     Median_Method.Median
     Product_PMF_Ext
-    Universal_Hash_Families.Field
+    Universal_Hash_Families.Universal_Hash_Families_More_Finite_Fields
     Frequency_Moments 
 begin
 
 text \<open>This section contains a formalization of the algorithm for the second frequency moment.
 It is based on the algorithm described in \<^cite>\<open>\<open>\textsection 2.2\<close> in "alon1999"\<close>.
 The only difference is that the algorithm is adapted to work with a prime field of odd order, which
 greatly reduces the implementation complexity.\<close>
 
 (* Two-valued hash used by the F2 sketch: evaluates ring.hash (mod_ring p) for
    key k and hash function h, and returns int p - 1 if that value is even and
    - int p - 1 otherwise. *)
 fun f2_hash where
   "f2_hash p h k = (if even (ring.hash (mod_ring p) k h) then int p - 1 else - int p - 1)"
 
 (* State of the F2 algorithm.  Following the tuple built in f2_init, the
    components are, in order: s1, s2, p, the family of hash functions indexed by
    pairs, and the integer sketch indexed by pairs. *)
 type_synonym f2_state = "nat \<times> nat \<times> nat \<times> (nat \<times> nat \<Rightarrow> nat list) \<times> (nat \<times> nat \<Rightarrow> int)"
 
 (* Initial state of the F2 algorithm for parameters \<delta>, \<epsilon> and universe bound n.
    - s1 = nat (ceiling (6 / \<delta>^2)) and s2 = nat (ceiling (-(18 * ln \<epsilon>))) fix the
      index set {..<s1} \<times> {..<s2};
    - p = prime_above (max n 3);
    - h draws, for every index pair, an element of
      bounded_degree_polynomials (mod_ring p) 4 via pmf_of_set (product pmf);
    - the sketch starts as 0 on every index pair. *)
 fun f2_init :: "rat \<Rightarrow> rat \<Rightarrow> nat \<Rightarrow> f2_state pmf" where
   "f2_init \<delta> \<epsilon> n =
     do {
       let s\<^sub>1 = nat \<lceil>6 / \<delta>\<^sup>2\<rceil>;
       let s\<^sub>2 = nat \<lceil>-(18 * ln (real_of_rat \<epsilon>))\<rceil>;
       let p = prime_above (max n 3);
       h \<leftarrow> prod_pmf ({..<s\<^sub>1} \<times> {..<s\<^sub>2}) (\<lambda>_. pmf_of_set (bounded_degree_polynomials (mod_ring p) 4));
       return_pmf (s\<^sub>1, s\<^sub>2, p, h, (\<lambda>_ \<in> {..<s\<^sub>1} \<times> {..<s\<^sub>2}. (0 :: int)))
     }"
 
 (* Processes one stream element x: for every index pair i in {..<s1} \<times> {..<s2}
    the value f2_hash p (h i) x is added to sketch i.  All other state components
    are passed through unchanged; the step is deterministic (return_pmf). *)
 fun f2_update :: "nat \<Rightarrow> f2_state \<Rightarrow> f2_state pmf" where
   "f2_update x (s\<^sub>1, s\<^sub>2, p, h, sketch) = 
     return_pmf (s\<^sub>1, s\<^sub>2, p, h, \<lambda>i \<in> {..<s\<^sub>1} \<times> {..<s\<^sub>2}. f2_hash p (h i) x + sketch i)"
 
 (* Final estimate: for each i2 < s2, sum the squared sketch entries over
    i1 < s1 and divide by (p^2 - 1) * s1; the result is the median of these s2
    values.  Only s1, s2, p and the sketch are used, the hash functions h are
    ignored. *)
 fun f2_result :: "f2_state \<Rightarrow> rat pmf" where
   "f2_result (s\<^sub>1, s\<^sub>2, p, h, sketch) = 
     return_pmf (median s\<^sub>2 (\<lambda>i\<^sub>2 \<in> {..<s\<^sub>2}. 
       (\<Sum>i\<^sub>1\<in>{..<s\<^sub>1} . (rat_of_int (sketch (i\<^sub>1, i\<^sub>2)))\<^sup>2) / (((rat_of_nat p)\<^sup>2-1) * rat_of_nat s\<^sub>1)))"
 
 (* Closed-form expression in (n, m, \<epsilon>, \<delta>), built from the same s1 and s2 as in
    f2_init.  It consists of a constant, logarithmic terms in s1, s2 and n, and a
    term proportional to s1 * s2 that additionally depends on m.
    NOTE(review): judging by the name this is the claimed bound on the size of
    the encoded state, with m presumably the stream length; the corresponding
    theorem is not in this part of the file - confirm there. *)
 fun f2_space_usage :: "(nat \<times> nat \<times> rat \<times> rat) \<Rightarrow> real" where
   "f2_space_usage (n, m, \<epsilon>, \<delta>) = (
     let s\<^sub>1 = nat \<lceil>6 / \<delta>\<^sup>2 \<rceil> in
     let s\<^sub>2 = nat \<lceil>-(18 * ln (real_of_rat \<epsilon>))\<rceil> in 
     3 +
     2 * log 2 (s\<^sub>1 + 1) +
     2 * log 2 (s\<^sub>2 + 1) +
     2 * log 2 (9 + 2 * real n) +
     s\<^sub>1 * s\<^sub>2 * (5 + 4*log 2 (8 + 2 * real n) + 2 * log 2 (real m * (18 + 4 * real n) + 1 )))"
 
 (* Encoder for f2_state, assembled from encoding combinators: s1, s2 and p are
    each encoded with N_e; dependent on these values, the hash functions are
    encoded as a function on List.product [0..<s1] [0..<s2] with P_e p 4 per
    entry, and the sketch as a function on the same index list with I_e per
    entry.
    NOTE(review): the combinators are defined elsewhere; the injectivity proof
    in this file discharges them with exp_golomb_encoding, poly_encoding and
    int_encoding, which suggests N_e / P_e / I_e encode naturals / polynomials /
    integers - confirm against their definitions. *)
 definition encode_f2_state :: "f2_state \<Rightarrow> bool list option" where
   "encode_f2_state = 
     N\<^sub>e \<Join>\<^sub>e (\<lambda>s\<^sub>1. 
     N\<^sub>e \<Join>\<^sub>e (\<lambda>s\<^sub>2. 
     N\<^sub>e \<Join>\<^sub>e (\<lambda>p. 
     (List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e P\<^sub>e p 4) \<times>\<^sub>e
     (List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e I\<^sub>e))))"
 
 (* encode_f2_state is injective on its domain.  The definition is first shown
    to satisfy is_encoding by applying the introduction rules of its
    combinators; injectivity then follows from encoding_imp_inj. *)
 lemma "inj_on encode_f2_state (dom encode_f2_state)"
 proof -
   have " is_encoding encode_f2_state"
     unfolding encode_f2_state_def
     by (intro dependent_encoding exp_golomb_encoding fun_encoding list_encoding int_encoding poly_encoding)
       
   thus ?thesis
     by (rule encoding_imp_inj)
 qed
 
 (* Shared setting for the analysis of the F2 algorithm: parameters \<epsilon> in the
    open interval (0,1) and \<delta> > 0, a stream "as" whose elements are all below n,
    and "result", the output distribution of f2_init followed by one f2_update
    per stream element and a final f2_result. *)
 context
   fixes \<epsilon> \<delta> :: rat
   fixes n :: nat
   fixes as :: "nat list"
   fixes result
   assumes \<epsilon>_range: "\<epsilon> \<in> {0<..<1}"
   assumes \<delta>_range: "\<delta> > 0"
   assumes as_range: "set as \<subseteq> {..<n}"
   defines "result \<equiv> fold (\<lambda>a state. state \<bind> f2_update a) as (f2_init \<delta> \<epsilon> n) \<bind> f2_result"
 begin  
 
 (* s1: the same expression as the let-bound s1 in f2_init; it is positive
    because \<delta> > 0. *)
 private definition s\<^sub>1 where "s\<^sub>1 = nat \<lceil>6 / \<delta>\<^sup>2\<rceil>"
 
 lemma s1_gt_0: "s\<^sub>1 > 0"
     using \<delta>_range by (simp add:s\<^sub>1_def)
 
 (* s2: the same expression as the let-bound s2 in f2_init; it is positive
    because \<epsilon> lies strictly between 0 and 1. *)
 private definition s\<^sub>2 where "s\<^sub>2 = nat \<lceil>-(18* ln (real_of_rat \<epsilon>))\<rceil>"
 
 lemma s2_gt_0: "s\<^sub>2 > 0"
     using \<epsilon>_range by (simp add:s\<^sub>2_def)
 
 (* p: the same expression as the let-bound p in f2_init.  The lemmas below
    record the basic facts used later: p is prime, p >= 3 (hence p > 0 and
    p > 1), and p >= n. *)
 private definition p where "p = prime_above (max n 3)"
  
 lemma p_prime: "Factorial_Ring.prime p" 
   unfolding p_def using prime_above_prime by blast
 
 lemma p_ge_3: "p \<ge> 3"
     unfolding p_def by (meson max.boundedE prime_above_lower_bound)
 
 lemma p_gt_0: "p > 0" using p_ge_3 by linarith
 
 lemma p_gt_1: "p > 1" using p_ge_3 by simp
 
 lemma p_ge_n: "p \<ge> n" unfolding p_def
   by (meson max.boundedE prime_above_lower_bound )
 
 (* Instantiates the carter_wegman_hash_family locale for mod_ring p with
    parameter 4, using that p is prime.  Later proofs in this context use names
    from this interpretation (e.g. hash, space, M, expectation, prob,
    k_wise_indep) without qualification. *)
 interpretation carter_wegman_hash_family "mod_ring p" 4
   using carter_wegman_hash_familyI[OF mod_ring_is_field mod_ring_finite]
   using p_prime by auto
 
 (* Objects used in the analysis:
    - sketch:    distribution of the state after f2_init and all updates;
    - \<Omega>:         product pmf choosing one element of "space" per index pair;
    - \<Omega>\<^sub>p:        \<Omega> viewed as a measure;
    - sketch_rv: square of the sum of f2_hash values over the stream, for one
                 hash function;
    - mean_rv:   for a fixed i2, the sum of sketch_rv over i1 < s1, divided by
                 (p^2 - 1) * s1;
    - result_rv: median over i2 < s2 of mean_rv. *)
 definition sketch where "sketch = fold (\<lambda>a state. state \<bind> f2_update a) as (f2_init \<delta> \<epsilon> n)"
 private definition \<Omega> where"\<Omega> = prod_pmf ({..<s\<^sub>1} \<times> {..<s\<^sub>2}) (\<lambda>_. pmf_of_set space)" 
 private definition \<Omega>\<^sub>p where"\<Omega>\<^sub>p = measure_pmf \<Omega>" 
 private definition sketch_rv where "sketch_rv \<omega> = of_int (sum_list (map (f2_hash p \<omega>) as))^2"
 private definition mean_rv where "mean_rv \<omega> = (\<lambda>i\<^sub>2. (\<Sum>i\<^sub>1 = 0..<s\<^sub>1. sketch_rv (\<omega> (i\<^sub>1, i\<^sub>2))) / (((of_nat p)\<^sup>2 - 1) * of_nat s\<^sub>1))"
 private definition result_rv where "result_rv \<omega> = median s\<^sub>2 (\<lambda>i\<^sub>2\<in>{..<s\<^sub>2}. mean_rv \<omega> i\<^sub>2)"
 
 (* Closed form of the state distribution: after processing the whole stream,
    the state is obtained by sampling \<omega> from \<Omega> and storing, for every index pair
    i, the sum of f2_hash p (\<omega> i) over the stream elements.
    Proved by induction on the stream from the right (rev_induct), so that each
    step appends exactly one f2_update. *)
 lemma mean_rv_alg_sketch:
   "sketch = \<Omega> \<bind> (\<lambda>\<omega>. return_pmf (s\<^sub>1, s\<^sub>2, p, \<omega>, \<lambda>i \<in> {..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (\<omega> i)) as)))"
 proof -
   have "sketch =  fold (\<lambda>a state. state \<bind> f2_update a) as (f2_init \<delta> \<epsilon> n)"
     by (simp add:sketch_def)
   also have "... = \<Omega> \<bind> (\<lambda>\<omega>. return_pmf (s\<^sub>1, s\<^sub>2, p, \<omega>, 
       \<lambda>i \<in> {..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (\<omega> i)) as)))"
   proof (induction as rule:rev_induct)
     (* Empty stream: the state is the one produced by f2_init. *)
     case Nil
     then show ?case 
       by (simp add:s\<^sub>1_def s\<^sub>2_def space_def p_def[symmetric] \<Omega>_def restrict_def Let_def) 
   next
     (* One more element a at the end: apply f2_update a to the closed form. *)
     case (snoc a as)
     have "fold (\<lambda>a state. state \<bind> f2_update a) (as @ [a]) (f2_init \<delta> \<epsilon> n) = \<Omega> \<bind> 
       (\<lambda>\<omega>. return_pmf (s\<^sub>1, s\<^sub>2, p, \<omega>, \<lambda>s \<in> {..<s\<^sub>1} \<times> {..<s\<^sub>2}. (\<Sum>x \<leftarrow> as.  f2_hash p (\<omega> s) x)) \<bind> f2_update a)"
       using snoc by (simp add: bind_assoc_pmf restrict_def del:f2_hash.simps f2_init.simps)
     also have "... =  \<Omega> \<bind> (\<lambda>\<omega>. return_pmf (s\<^sub>1, s\<^sub>2, p, \<omega>, \<lambda>i \<in> {..<s\<^sub>1} \<times> {..<s\<^sub>2}. (\<Sum>x \<leftarrow> as@[a].  f2_hash p (\<omega> i) x)))"
       by (subst bind_return_pmf) (simp add: add.commute del:f2_hash.simps cong:restrict_cong)
     finally show ?case by blast
   qed
   finally show ?thesis by auto
 qed
 
 (* The output distribution of the algorithm is the image of \<Omega> under result_rv.
    Obtained by plugging the closed form from mean_rv_alg_sketch into f2_result
    and unfolding result_rv, mean_rv and sketch_rv. *)
 lemma distr:  "result = map_pmf result_rv \<Omega>"
 proof -
   have "result = sketch \<bind> f2_result"
     by (simp add:result_def sketch_def)
   also have "... = \<Omega> \<bind> (\<lambda>x. f2_result (s\<^sub>1, s\<^sub>2, p, x, \<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (x i)) as)))"
     by (simp add: mean_rv_alg_sketch  bind_assoc_pmf bind_return_pmf)
   also have "... = map_pmf result_rv \<Omega>"
     by (simp add:map_pmf_def result_rv_def mean_rv_def sketch_rv_def lessThan_atLeast0 cong:restrict_cong)
   finally show ?thesis by simp
 qed
 
 (* m-th moment of f2_hash for a fixed key k < p:
      E[f2_hash p \<omega> k ^ m]
        = ((p - 1)^m * (p + 1) + (-p - 1)^m * (p - 1)) / (2 * p).
    Proof idea: p is odd, say p = 2 * t + 1, so among the values below p there
    are t + 1 even and t odd ones.  Hence the hash value is even with
    probability (p + 1) / (2 * p) and odd with probability (p - 1) / (2 * p);
    the expectation is the corresponding weighted sum of the two possible
    values of f2_hash raised to the power m. *)
 private lemma f2_hash_pow_exp:
   assumes "k < p"
   shows
     "expectation (\<lambda>\<omega>. real_of_int (f2_hash p \<omega> k) ^m) = 
      ((real p - 1) ^ m * (real p + 1) + (- real p - 1) ^ m * (real p - 1)) / (2 * real p)"
 proof -
 
   have "odd p" using p_prime p_ge_3 prime_odd_nat assms by simp
   then obtain t where t_def: "p=2*t+1" 
     using oddE by blast
 
   (* Count the even numbers below p: they are exactly the doubles of {..<t+1}. *)
   have "Collect even \<inter> {..<2 * t + 1} \<subseteq> (*) 2 ` {..<t + 1}" 
     by (rule in_image_by_witness[where g="\<lambda>x. x div 2"], simp, linarith)
   moreover have " (*) 2 ` {..<t + 1} \<subseteq> Collect even \<inter> {..<2 * t + 1}"
     by (rule image_subsetI, simp)
   ultimately have "card ({k. even k} \<inter> {..<p}) = card ((\<lambda>x. 2*x) ` {..<t+1})"
     unfolding t_def using order_antisym by metis
   also have "... = card {..<t+1}" 
     by (rule card_image, simp add: inj_on_mult)
   also have "... =  t+1" by simp
   finally have card_even: "card ({k. even k} \<inter> {..<p}) = t+1" by simp
   hence "card ({k. even k} \<inter> {..<p}) * 2 = (p+1)" by (simp add:t_def)
   hence prob_even: "prob {\<omega>. hash k \<omega> \<in> Collect even} = (real p + 1)/(2*real p)"
     using assms by (subst prob_range, auto simp:frac_eq_eq p_gt_0 mod_ring_def) 
 
   (* The odd numbers below p are the remaining ones. *)
   have "p = card {..<p}" by simp
   also have "... = card (({k. odd k} \<inter> {..<p}) \<union> ({k. even k} \<inter> {..<p}))" 
     by (rule arg_cong[where f="card"], auto)
   also have "... = card ({k. odd k} \<inter> {..<p}) +  card ({k. even k} \<inter> {..<p})"
     by (rule card_Un_disjoint, simp, simp, blast)
   also have "... = card ({k. odd k} \<inter> {..<p}) + t+1"
     by (simp add:card_even)
   finally have "p = card ({k. odd k} \<inter> {..<p}) + t+1"
     by simp
   hence "card ({k. odd k} \<inter> {..<p}) * 2 = (p-1)" 
     by (simp add:t_def)
   hence prob_odd: "prob {\<omega>. hash k \<omega> \<in> Collect odd} = (real p - 1)/(2*real p)"
     using assms by (subst prob_range, auto simp add: frac_eq_eq mod_ring_def)
 
   (* Split the expectation along the parity of the hash value. *)
   have "expectation (\<lambda>x. real_of_int (f2_hash p x k) ^ m) =
     expectation (\<lambda>\<omega>. indicator {\<omega>. even (hash k \<omega>)} \<omega> * (real p - 1)^m + 
       indicator {\<omega>. odd (hash k \<omega>)} \<omega> * (-real p - 1)^m)" 
     by (rule Bochner_Integration.integral_cong, simp, simp)
   also have "... = 
      prob {\<omega>. hash  k \<omega> \<in> Collect even}  * (real p - 1) ^ m  + 
      prob {\<omega>. hash  k \<omega> \<in> Collect odd}  * (-real p - 1) ^ m "
     by (simp, simp add:M_def)
   also have "... = (real p + 1) * (real p - 1) ^ m / (2 * real p) + (real p - 1) * (- real p - 1) ^ m / (2 * real p)"
     by (subst prob_even, subst prob_odd, simp)
   also have "... =  
     ((real p - 1) ^ m * (real p + 1) + (- real p - 1) ^ m * (real p - 1)) / (2 * real p)"
     by (simp add:add_divide_distrib ac_simps)
   finally show "expectation (\<lambda>x. real_of_int (f2_hash p x k) ^ m) = 
     ((real p - 1) ^ m * (real p + 1) + (- real p - 1) ^ m * (real p - 1)) / (2 * real p)" by simp
 qed
 
 (* Expectation and variance of a single sketch entry (with respect to one hash
    function drawn from the hash family):
      exp_sketch_rv:  E[sketch_rv]   = F 2 as * (p^2 - 1)
      var_sketch_rv:  Var[sketch_rv] <= 2 * (F 2 as)^2 * (p^2 - 1)^2
    Proof outline: sketch_rv is expanded into a double (resp. fourfold) sum of
    products of hash values.  The expectation of such a product depends only on
    which positions carry equal keys (its kernel), so the sums are regrouped by
    enumerating kernels via enum_rgfs.  Terms containing a key exactly once
    vanish because r 1 = 0. *)
 lemma 
   shows var_sketch_rv:"variance sketch_rv \<le> 2*(real_of_rat (F 2 as)^2) * ((real p)\<^sup>2-1)\<^sup>2" (is "?A")
   and exp_sketch_rv:"expectation sketch_rv = real_of_rat (F 2 as) * ((real p)\<^sup>2-1)" (is "?B")
 proof -
   (* h: real-valued hash; c: multiplicity of a key in the stream; r m: the
      m-th moment from f2_hash_pow_exp; h_prod: product of hash values along a
      list of keys; exp_h_prod: the candidate value of its expectation. *)
   define h where "h = (\<lambda>\<omega> x. real_of_int (f2_hash p \<omega> x))"
   define c where "c = (\<lambda>x. real (count_list as x))"
   define r where "r = (\<lambda>(m::nat). ((real p - 1) ^ m * (real p + 1) + (- real p - 1) ^ m * (real p - 1)) / (2 * real p))"
   define h_prod where "h_prod = (\<lambda>as \<omega>. prod_list (map (h \<omega>) as))" 
 
   define exp_h_prod :: "nat list \<Rightarrow> real" where "exp_h_prod = (\<lambda>as. (\<Prod>i \<in> set as. r (count_list as i)))"
 
   have f_eq: "sketch_rv = (\<lambda>\<omega>. (\<Sum>x \<in> set as. c x * h \<omega> x)^2)"
     by (rule ext, simp add:sketch_rv_def c_def h_def sum_list_eval del:f2_hash.simps)
 
   (* Values and estimates for the moments r 1, r 2 and r 4. *)
   have r_one: "r (Suc 0) = 0"
     by (simp add:r_def algebra_simps)
 
   have r_two: "r 2 = (real p^2-1)"
     using p_gt_0 unfolding r_def power2_eq_square 
     by (simp add:nonzero_divide_eq_eq, simp add:algebra_simps)
 
   have"(real p)^2 \<ge> 2^2"
     by (rule power_mono, use p_gt_1 in linarith, simp)
   hence p_square_ge_4: "(real p)\<^sup>2 \<ge> 4" by simp
 
   have "r 4 = (real p)^4+2*(real p)\<^sup>2 - 3" 
     using p_gt_0 unfolding r_def
     by (subst nonzero_divide_eq_eq, auto simp:power4_eq_xxxx power2_eq_square algebra_simps)
   also have "... \<le> (real p)^4+2*(real p)\<^sup>2 + 3"
     by simp
   also have "... \<le> 3 * r 2 * r 2"
     using p_square_ge_4
     by (simp add:r_two power4_eq_xxxx power2_eq_square algebra_simps mult_left_mono)
   finally have r_four_est: "r 4 \<le> 3 * r 2 * r 2"  by simp
 
   have exp_h_prod_elim: "exp_h_prod = (\<lambda>as. prod_list (map (r \<circ> count_list as) (remdups as)))" 
     by (simp add:exp_h_prod_def prod.set_conv_list[symmetric])
 
   (* For key lists of length at most 4 drawn from the stream, the expectation
      of h_prod factorises over the distinct keys; this uses the independence
      provided by k_wise_indep for at most 4 keys. *)
   have exp_h_prod: "\<And>x. set x \<subseteq> set as \<Longrightarrow> length x \<le> 4 \<Longrightarrow> expectation (h_prod x) = exp_h_prod x"
   proof -
     fix x 
     assume "set x \<subseteq> set as"
     hence x_sub_p: "set x \<subseteq> {..<p}" using as_range p_ge_n by auto
     hence x_le_p: "\<And>k. k \<in> set x \<Longrightarrow> k < p" by auto
     assume "length x \<le> 4"
     hence card_x: "card (set x) \<le> 4" using card_length dual_order.trans by blast
 
     have "set x \<subseteq> carrier (mod_ring p) "
       using x_sub_p by (simp add:mod_ring_def)
 
     hence h_indep: "indep_vars (\<lambda>_. borel) (\<lambda>i \<omega>. h \<omega> i ^ count_list x i) (set x)"
       using k_wise_indep_vars_subset[OF k_wise_indep] card_x as_range h_def
       by (auto intro:indep_vars_compose2[where X="hash" and M'=" (\<lambda>_. discrete)"])
 
     have "expectation (h_prod x) = expectation (\<lambda>\<omega>. \<Prod> i \<in> set x. h \<omega> i^(count_list x i))"
       by (simp add:h_prod_def prod_list_eval)
     also have "... = (\<Prod>i \<in> set x. expectation (\<lambda>\<omega>. h \<omega> i^(count_list x i)))"
       by (simp add: indep_vars_lebesgue_integral[OF _ h_indep])
     also have "... = (\<Prod>i \<in> set x. r (count_list x i))"
       using f2_hash_pow_exp x_le_p 
       by (simp add:h_def r_def M_def[symmetric] del:f2_hash.simps)
     also have "... = exp_h_prod x"
       by (simp add:exp_h_prod_def)
     finally show "expectation (h_prod x) = exp_h_prod x" by simp
   qed
 
   (* exp_h_prod depends only on the kernel of its argument. *)
   have "\<And>x y. kernel_of x = kernel_of y \<Longrightarrow> exp_h_prod x = exp_h_prod y" 
   proof -
     fix x y :: "nat list"
     assume a:"kernel_of x = kernel_of y"
     then obtain f where b:"bij_betw f (set x) (set y)" and c:"\<And>z. z \<in> set x \<Longrightarrow> count_list x z = count_list y (f z)"
       using kernel_of_eq_imp_bij by blast
     have "exp_h_prod x = prod ( (\<lambda>i. r(count_list y i)) \<circ> f) (set x)"
       by (simp add:exp_h_prod_def c)
     also have "... = (\<Prod>i \<in> f ` (set x). r(count_list y i))"
       by (metis b bij_betw_def prod.reindex)
     also have "... = exp_h_prod y"
       unfolding exp_h_prod_def
       by (rule prod.cong, metis b bij_betw_def) simp
     finally show "exp_h_prod x = exp_h_prod y" by simp
   qed
 
   hence exp_h_prod_cong: "\<And>p x. of_bool (kernel_of x = kernel_of p) * exp_h_prod p = 
     of_bool (kernel_of x = kernel_of p) * exp_h_prod x" 
     by (metis (full_types) of_bool_eq_0_iff vector_space_over_itself.scale_zero_left)
 
   (* Summing the kernel indicator over enum_rgfs n picks out exactly one entry
      for any list of length n. *)
   have c:"(\<Sum>p\<leftarrow>enum_rgfs n. of_bool (kernel_of xs = kernel_of p) * r) = r"
     if a:"length xs = n" for xs :: "nat list" and n and r :: real
   proof -
     have "(\<Sum>p\<leftarrow>enum_rgfs n. of_bool (kernel_of xs = kernel_of p) * 1) = (1::real)"
       using equiv_rels_2[OF a[symmetric]] by (simp add:equiv_rels_def comp_def) 
     thus "(\<Sum>p\<leftarrow>enum_rgfs n. of_bool (kernel_of xs = kernel_of p) * r) = (r::real)" 
       by (simp add:sum_list_mult_const)
   qed
 
   (* Part ?B: the expectation, via the double sum. *)
   have "expectation sketch_rv = (\<Sum>i\<in>set as. (\<Sum>j\<in>set as. c i * c j * expectation (h_prod [i,j])))"
     by (simp add:f_eq h_prod_def power2_eq_square sum_distrib_left sum_distrib_right Bochner_Integration.integral_sum algebra_simps)
   also have "... = (\<Sum>i\<in>set as. (\<Sum>j\<in>set as. c i * c j * exp_h_prod [i,j]))"
     by (simp add:exp_h_prod)
   also have "... = (\<Sum>i \<in> set as. (\<Sum>j \<in> set as.  
     c i * c j * (sum_list (map (\<lambda>p. of_bool (kernel_of [i,j] = kernel_of p) * exp_h_prod p) (enum_rgfs 2)))))"
     by (subst exp_h_prod_cong, simp add:c)
   also have "... = (\<Sum>i\<in>set as. c i * c i * r 2)"
     by (simp add: numeral_eq_Suc kernel_of_eq All_less_Suc exp_h_prod_elim r_one distrib_left sum.distrib sum_collapse)
   also have "... = real_of_rat (F 2 as) * ((real p)^2-1)"
     by (simp add: sum_distrib_right[symmetric] c_def F_def power2_eq_square of_rat_sum of_rat_mult r_two)
   finally show b:?B by simp
 
   (* Part ?A: bound the second moment via the fourfold sum, then subtract the
      squared expectation. *)
   have "expectation (\<lambda>x. (sketch_rv x)\<^sup>2) = (\<Sum>i1 \<in> set as. (\<Sum>i2 \<in> set as. (\<Sum>i3 \<in> set as. (\<Sum>i4 \<in> set as.
     c i1 * c i2 * c i3 * c i4 * expectation (h_prod [i1, i2, i3, i4])))))"
     by (simp add:f_eq h_prod_def power4_eq_xxxx sum_distrib_left sum_distrib_right Bochner_Integration.integral_sum algebra_simps)
   also have "... = (\<Sum>i1 \<in> set as. (\<Sum>i2 \<in> set as. (\<Sum>i3 \<in> set as. (\<Sum>i4 \<in> set as. 
     c i1 * c i2 * c i3 * c i4 * exp_h_prod [i1,i2,i3,i4]))))"
     by (simp add:exp_h_prod)
   also have "... = (\<Sum>i1 \<in> set as. (\<Sum>i2 \<in> set as. (\<Sum>i3 \<in> set as. (\<Sum>i4 \<in> set as. 
     c i1 * c i2 * c i3 * c i4 * 
     (sum_list (map (\<lambda>p. of_bool (kernel_of [i1,i2,i3,i4] = kernel_of p) * exp_h_prod p) (enum_rgfs 4)))))))"
     by (subst exp_h_prod_cong, simp add:c)
   also have "... = 
     3 * (\<Sum>i \<in> set as. (\<Sum>j \<in> set as. c i^2 * c j^2 * r 2 * r 2)) + ((\<Sum> i \<in> set as. c i^4 * r 4) - 3 *  (\<Sum> i \<in> set as. c i ^ 4 * r 2 * r 2))"
     apply (simp add: numeral_eq_Suc exp_h_prod_elim r_one) (* large intermediate terms *)
     apply (simp add: kernel_of_eq All_less_Suc numeral_eq_Suc distrib_left sum.distrib sum_collapse neq_commute of_bool_not_iff)
     apply (simp add: algebra_simps sum_subtractf sum_collapse)
     apply (simp add: sum_distrib_left algebra_simps)
     done
   also have "... = 3 * (\<Sum>i \<in> set as. c i^2 * r 2)^2 + (\<Sum> i \<in> set as. c i ^ 4 * (r 4 - 3 * r 2 * r 2))"
     by (simp add:power2_eq_square sum_distrib_left algebra_simps sum_subtractf)
   also have "... = 3 * (\<Sum>i \<in> set as. c i^2)^2 * (r 2)^2 + (\<Sum>i \<in> set as. c i ^ 4 * (r 4 - 3 * r 2 * r 2))"
     by (simp add:power_mult_distrib sum_distrib_right[symmetric])
   (* The correction term is non-positive by r_four_est and can be dropped. *)
   also have "... \<le> 3 * (\<Sum>i \<in> set as. c i^2)^2 * (r 2)^2 + (\<Sum>i \<in> set as. c i ^ 4 * 0)"
     using r_four_est  
     by (auto intro!: sum_nonpos simp add:mult_nonneg_nonpos)
   also have "... = 3 * (real_of_rat (F 2 as)^2) * ((real p)\<^sup>2-1)\<^sup>2" 
     by (simp add:c_def r_two F_def of_rat_sum of_rat_power)
   finally have "expectation (\<lambda>x. (sketch_rv x)\<^sup>2) \<le> 3 * (real_of_rat (F 2 as)^2) * ((real p)\<^sup>2-1)\<^sup>2"
     by simp
   
   thus "variance sketch_rv \<le> 2*(real_of_rat (F 2 as)^2) * ((real p)\<^sup>2-1)\<^sup>2"
      by (simp add: variance_eq, simp add:power_mult_distrib b)
 qed
 
 (* The underlying space of the measure \<Omega>\<^sub>p is the whole type (simp rule). *)
 lemma space_omega_1 [simp]: "Sigma_Algebra.space \<Omega>\<^sub>p = UNIV"
     by (simp add:\<Omega>\<^sub>p_def)
 
 (* \<Omega>\<^sub>p is a probability space; its notions are available with the prefix "\<Omega>."
    (e.g. \<Omega>.expectation, \<Omega>.variance, \<Omega>.indep_vars). *)
 interpretation \<Omega>: prob_space "\<Omega>\<^sub>p"
   by (simp add:\<Omega>\<^sub>p_def prob_space_measure_pmf)
 
 (* Every real-valued function on the sample space is integrable with respect
    to \<Omega>\<^sub>p; the proof applies integrable_measure_pmf_finite, i.e. it relies on
    the support of \<Omega> being finite. *)
 lemma integrable_\<Omega>:
   fixes f :: "((nat \<times> nat) \<Rightarrow> (nat list)) \<Rightarrow> real"
   shows "integrable \<Omega>\<^sub>p f"
   unfolding \<Omega>\<^sub>p_def \<Omega>_def
   by (rule integrable_measure_pmf_finite, auto intro:finite_PiE simp:set_prod_pmf)
 
 (* Expectation of a single sketch entry in the product space: for any valid
    index pair (i1, i2) it equals F 2 as * (p^2 - 1).  The expectation over \<Omega>
    is reduced to the one over a single hash function
    (expectation_Pi_pmf_slice) and then exp_sketch_rv applies. *)
 lemma sketch_rv_exp:
   assumes "i\<^sub>2 < s\<^sub>2"
   assumes "i\<^sub>1 \<in> {0..<s\<^sub>1}"
   shows "\<Omega>.expectation (\<lambda>\<omega>. sketch_rv (\<omega> (i\<^sub>1, i\<^sub>2))) = real_of_rat (F 2 as) * ((real p)\<^sup>2 - 1)"
 proof -
   have "\<Omega>.expectation (\<lambda>\<omega>.  (sketch_rv (\<omega> (i\<^sub>1, i\<^sub>2))) :: real) = expectation sketch_rv"
     using integrable_\<Omega> integrable_M assms
     unfolding \<Omega>_def \<Omega>\<^sub>p_def M_def
     by (subst expectation_Pi_pmf_slice, auto)
   also have "... = (real_of_rat (F 2 as)) * ((real p)\<^sup>2 - 1)"
     using exp_sketch_rv by simp
   finally show ?thesis by simp
 qed
 
 (* Variance of a single sketch entry in the product space: for any valid index
    pair (i1, i2) it is at most 2 * (F 2 as)^2 * (p^2 - 1)^2.  The variance over
    \<Omega> is reduced to the one over a single hash function
    (variance_prod_pmf_slice) and then var_sketch_rv applies. *)
 lemma sketch_rv_var:
   assumes "i\<^sub>2 < s\<^sub>2"
   assumes "i\<^sub>1 \<in> {0..<s\<^sub>1}"
   shows "\<Omega>.variance (\<lambda>\<omega>. sketch_rv (\<omega> (i\<^sub>1, i\<^sub>2))) \<le> 2 * (real_of_rat (F 2 as))\<^sup>2 * ((real p)\<^sup>2 - 1)\<^sup>2"
 proof -
   have "\<Omega>.variance (\<lambda>\<omega>. (sketch_rv (\<omega> (i\<^sub>1, i\<^sub>2)) :: real)) = variance sketch_rv"
     using integrable_\<Omega> integrable_M assms
     unfolding \<Omega>_def \<Omega>\<^sub>p_def M_def
     by (subst variance_prod_pmf_slice, auto)
   also have "... \<le>  2 * (real_of_rat (F 2 as))\<^sup>2 * ((real p)\<^sup>2 - 1)\<^sup>2"
     using var_sketch_rv by simp
   finally show ?thesis by simp
 qed
 
 (* The i-th averaged estimate mean_rv \<omega> i is unbiased: for i < s\<^sub>2 its
    expectation under \<Omega>\<^sub>p equals real_of_rat (F 2 as). *)
 lemma mean_rv_exp:
   assumes "i < s\<^sub>2"
   shows "\<Omega>.expectation (\<lambda>\<omega>. mean_rv \<omega> i) = real_of_rat (F 2 as)"
 proof -
   (* (real p)\<^sup>2 > 1, so the normalising factor (real p)\<^sup>2 - 1 is nonzero. *)
   have a:"(real p)\<^sup>2 > 1" using p_gt_1 by simp
 
   (* Unfold mean_rv_def and move the expectation inside the sum over i\<^sub>1. *)
   have "\<Omega>.expectation (\<lambda>\<omega>. mean_rv \<omega> i) = (\<Sum>i\<^sub>1 = 0..<s\<^sub>1. \<Omega>.expectation (\<lambda>\<omega>. sketch_rv (\<omega> (i\<^sub>1, i)))) / (((real p)\<^sup>2 - 1) * real s\<^sub>1)"
     using assms integrable_\<Omega> by (simp add:mean_rv_def)
   (* Replace each summand by its value from sketch_rv_exp. *)
   also have "... = (\<Sum>i\<^sub>1 = 0..<s\<^sub>1. real_of_rat (F 2 as) * ((real p)\<^sup>2 - 1)) / (((real p)\<^sup>2 - 1) * real s\<^sub>1)" 
     using sketch_rv_exp[OF assms] by simp
   (* The constant sum cancels against the denominator (uses s1_gt_0 and a). *)
   also have "... = real_of_rat (F 2 as)"
     using s1_gt_0 a by simp
   finally show ?thesis by simp
 qed
 
 (* Variance of the i-th averaged estimate: for i < s\<^sub>2 the variance of
    mean_rv \<omega> i under \<Omega>\<^sub>p is at most (real_of_rat (\<delta> * F 2 as))\<^sup>2 / 3. *)
 lemma mean_rv_var:
   assumes "i < s\<^sub>2"
   shows "\<Omega>.variance (\<lambda>\<omega>. mean_rv \<omega> i) \<le> (real_of_rat (\<delta> * F 2 as))\<^sup>2 / 3"
 proof -
   (* a: for fixed i, the sketch entries indexed by i\<^sub>1 in {0..<s\<^sub>1} are independent. *)
   have a: "\<Omega>.indep_vars (\<lambda>_. borel) (\<lambda>i\<^sub>1 x. sketch_rv (x (i\<^sub>1, i))) {0..<s\<^sub>1}"
     using assms
     unfolding \<Omega>\<^sub>p_def \<Omega>_def
     by (intro indep_vars_restrict_intro'[where f="fst"])
      (auto simp add: restrict_dfl_def case_prod_beta lessThan_atLeast0)
 
   (* Needed below to cancel the factor ((real p)\<^sup>2 - 1)\<^sup>2. *)
   have p_sq_ne_1: "(real p)^2 \<noteq> 1" 
     by (metis p_gt_1 less_numeral_extra(4) of_nat_power one_less_power pos2 semiring_char_0_class.of_nat_eq_1_iff)
 
   (* Lower bound on s\<^sub>1 obtained by unfolding s\<^sub>1_def. *)
   have s1_bound: " 6 / (real_of_rat \<delta>)\<^sup>2 \<le> real s\<^sub>1"
     unfolding s\<^sub>1_def
     by  (metis (mono_tags, opaque_lifting) of_rat_ceiling of_rat_divide of_rat_numeral_eq of_rat_power real_nat_ceiling_ge)
 
   (* Pull the constant divisor out of the variance (it appears squared). *)
   have "\<Omega>.variance (\<lambda>\<omega>. mean_rv \<omega> i) = \<Omega>.variance (\<lambda>\<omega>. \<Sum>i\<^sub>1 = 0..<s\<^sub>1. sketch_rv (\<omega> (i\<^sub>1, i))) / (((real p)\<^sup>2 - 1) * real s\<^sub>1)\<^sup>2"
     unfolding mean_rv_def by (subst \<Omega>.variance_divide[OF integrable_\<Omega>], simp)
   (* By independence (fact a) the variance of the sum is the sum of variances. *)
   also have "... = (\<Sum>i\<^sub>1 = 0..<s\<^sub>1. \<Omega>.variance (\<lambda>\<omega>. sketch_rv (\<omega> (i\<^sub>1, i)))) / (((real p)\<^sup>2 - 1) * real s\<^sub>1)\<^sup>2"
     by (subst \<Omega>.var_sum_all_indep[OF _ _ integrable_\<Omega> a]) (auto simp: \<Omega>_def \<Omega>\<^sub>p_def)
   (* Bound every summand with sketch_rv_var. *)
   also have "... \<le>  (\<Sum>i\<^sub>1 = 0..<s\<^sub>1. 2*(real_of_rat (F 2 as)^2) * ((real p)\<^sup>2-1)\<^sup>2)  / (((real p)\<^sup>2 - 1) * real s\<^sub>1)\<^sup>2"
     by (rule divide_right_mono, rule sum_mono[OF sketch_rv_var[OF assms]], auto)
   (* Simplify the fraction using p_sq_ne_1 and s1_gt_0. *)
   also have "... = 2 * (real_of_rat (F 2 as)^2) / real s\<^sub>1"
     using p_sq_ne_1 s1_gt_0 by (subst frac_eq_eq, auto simp:power2_eq_square)
   (* Replace s\<^sub>1 by its lower bound s1_bound. *)
   also have "... \<le> 2 * (real_of_rat (F 2 as)^2) / (6 / (real_of_rat \<delta>)\<^sup>2)"
     using  s1_gt_0 \<delta>_range by (intro divide_left_mono mult_pos_pos s1_bound) auto
   also have "... = (real_of_rat (\<delta> * F 2 as))\<^sup>2 / 3"
     by (simp add:of_rat_mult algebra_simps)
   finally show ?thesis by simp
 qed
 
 (* Failure probability of one averaged estimate: for i < s\<^sub>2 the probability
    that mean_rv \<omega> i deviates from F 2 as by more than \<delta> times F 2 as is at
    most 1/3. The empty stream is handled separately; otherwise the bound
    follows from Chebyshev's inequality together with mean_rv_exp and
    mean_rv_var. *)
 lemma mean_rv_bounds:
   assumes "i < s\<^sub>2"
   shows "\<Omega>.prob {\<omega>. real_of_rat \<delta> * real_of_rat (F 2 as) < \<bar>mean_rv \<omega> i - real_of_rat (F 2 as)\<bar>} \<le> 1/3"
 proof (cases "as = []")
   case True
   (* Empty stream: discharged by unfolding mean_rv_def, sketch_rv_def and F_def. *)
   then show ?thesis
     using assms by (subst mean_rv_def, subst sketch_rv_def, simp add:F_def)
 next
   case False
   hence "F 2 as > 0" using F_gr_0 by auto
 
   (* a: the deviation threshold is strictly positive. *)
   hence a: "0 < real_of_rat (\<delta> * F 2 as)"
     using \<delta>_range by simp
   have [simp]: "(\<lambda>\<omega>. mean_rv \<omega> i) \<in> borel_measurable \<Omega>\<^sub>p"
     by (simp add:\<Omega>_def \<Omega>\<^sub>p_def)
   (* Weaken the strict inequality to a non-strict one (larger event). *)
   have "\<Omega>.prob {\<omega>. real_of_rat \<delta> * real_of_rat (F 2 as) < \<bar>mean_rv \<omega> i - real_of_rat (F 2 as)\<bar>} \<le> 
       \<Omega>.prob {\<omega>. real_of_rat (\<delta> * F 2 as) \<le> \<bar>mean_rv \<omega> i - real_of_rat (F 2 as)\<bar>}"
     by (rule \<Omega>.pmf_mono[OF \<Omega>\<^sub>p_def], simp add:of_rat_mult)
   (* Chebyshev's inequality, with the mean supplied by mean_rv_exp. *)
   also have "... \<le>  \<Omega>.variance (\<lambda>\<omega>. mean_rv \<omega> i) / (real_of_rat (\<delta> * F 2 as))\<^sup>2"
     using \<Omega>.Chebyshev_inequality[where a="real_of_rat (\<delta> * F 2 as)" and f="\<lambda>\<omega>. mean_rv \<omega> i",simplified] 
       a prob_space_measure_pmf[where p="\<Omega>"] mean_rv_exp[OF assms] integrable_\<Omega> by simp
   (* Insert the variance bound mean_rv_var. *)
   also have "... \<le> ((real_of_rat (\<delta> * F 2 as))\<^sup>2/3) / (real_of_rat (\<delta> * F 2 as))\<^sup>2"
     by (rule divide_right_mono, rule mean_rv_var[OF assms], simp)
   also  have "... = 1/3" using a by force
   finally show ?thesis by blast
 qed
 
 (* Correctness inside the locale: the value drawn from `result` is within
    relative error \<delta> of F 2 as with probability at least 1 - \<epsilon>.
    The proof applies the median bound \<Omega>.median_bound_2 to the s\<^sub>2 independent
    averaged estimates, each of which fails with probability at most 1/3
    (mean_rv_bounds). *)
 lemma f2_alg_correct':
    "\<P>(\<omega> in measure_pmf result. \<bar>\<omega> - F 2 as\<bar> \<le> \<delta> * F 2 as) \<ge> 1-of_rat \<epsilon>"
 proof -
   (* a: the averaged estimates for different i in {0..<s\<^sub>2} are independent. *)
   have a: "\<Omega>.indep_vars (\<lambda>_. borel) (\<lambda>i \<omega>. mean_rv \<omega> i) {0..<s\<^sub>2}" 
     using s1_gt_0 unfolding \<Omega>\<^sub>p_def \<Omega>_def
     by (intro indep_vars_restrict_intro'[where f="snd"])
       (auto simp: \<Omega>\<^sub>p_def \<Omega>_def mean_rv_def restrict_dfl_def)
 
   (* b: lower bound on s\<^sub>2 obtained from s\<^sub>2_def; premise of the median bound. *)
   have b: "- 18 * ln (real_of_rat \<epsilon>) \<le> real s\<^sub>2" 
     unfolding  s\<^sub>2_def using of_nat_ceiling by auto
 
   (* Median bound on the real-valued estimates. *)
   have "1 - of_rat \<epsilon> \<le> \<Omega>.prob {\<omega>.  \<bar>median s\<^sub>2 (mean_rv \<omega>) -  real_of_rat (F 2 as) \<bar> \<le> of_rat \<delta> * of_rat (F 2 as)}"
     using \<epsilon>_range \<Omega>.median_bound_2[OF _ a b, where \<delta>="real_of_rat \<delta> * real_of_rat (F 2 as)"
         and \<mu>="real_of_rat (F 2 as)"] mean_rv_bounds
     by simp
   (* The median of the real estimates is the real embedding of result_rv. *)
   also have "... = \<Omega>.prob {\<omega>.  \<bar>real_of_rat (result_rv \<omega>) - of_rat (F 2 as) \<bar> \<le> of_rat \<delta> * of_rat (F 2 as)}"
     by (simp add:result_rv_def median_restrict lessThan_atLeast0 median_rat[OF s2_gt_0]
          mean_rv_def sketch_rv_def of_rat_divide of_rat_sum of_rat_mult of_rat_diff of_rat_power)
   (* Move the comparison from the reals back to the rationals. *)
   also have "... = \<Omega>.prob {\<omega>. \<bar>result_rv \<omega> - F 2 as\<bar> \<le> \<delta> * F 2 as} " 
     by (simp add:of_rat_less_eq of_rat_mult[symmetric]  of_rat_diff[symmetric] set_eq_iff)
   finally have "\<Omega>.prob {y. \<bar>result_rv y - F 2 as\<bar> \<le> \<delta> * F 2 as} \<ge> 1-of_rat \<epsilon> " by simp
   (* Transfer the statement to `result` with the fact `distr`. *)
   thus ?thesis by (simp add: distr \<Omega>\<^sub>p_def)
 qed
 
 (* Space bound inside the locale: almost every state \<omega> of `sketch` has an
    encoding of at most f2_space_usage (n, length as, \<epsilon>, \<delta>) bits.
    Outline: bound p, then bound each component of the encoded state
    (s\<^sub>1, s\<^sub>2, p, the hash polynomials, the sketch entries) and add the bounds.
    The ring is referred to as plain `mod_ring p` throughout, matching the
    assumption of fact `a` and the rest of this change set. *)
 lemma f2_exact_space_usage':
    "AE \<omega> in sketch . bit_count (encode_f2_state \<omega>) \<le> f2_space_usage (n, length as, \<epsilon>, \<delta>)"
 proof -
   (* Upper bound on the prime p, from p_def and prime_above_upper_bound. *)
   have "p \<le> 2 * max n 3 + 2"
     by (subst p_def, rule prime_above_upper_bound)
   also have "... \<le> 2 * n + 8"
     by (cases "n \<le> 2", simp_all)
   finally have p_bound: "p \<le> 2 * n + 8" 
     by simp
   (* Bit count of the encoding N\<^sub>e p of p itself. *)
   have "bit_count (N\<^sub>e p) \<le> ereal (2 * log 2 (real p + 1) + 1)"
     by (rule exp_golomb_bit_count)
   also have "... \<le> ereal (2 * log 2 (2 * real n + 9) + 1)"
     using p_bound by simp
   finally have p_bit_count: "bit_count (N\<^sub>e p) \<le> ereal (2 * log 2 (2 * real n + 9) + 1)"
     by simp
 
   (* a: the bound holds for the state built from any family y of hash
      polynomials in the product function space. *)
   have a: "bit_count (encode_f2_state (s\<^sub>1, s\<^sub>2, p, y, \<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. 
       sum_list (map (f2_hash p (y i)) as))) \<le> ereal (f2_space_usage (n, length as, \<epsilon>, \<delta>))"
     if a:"y\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2} \<rightarrow>\<^sub>E bounded_degree_polynomials (mod_ring p) 4" for y
   proof -
     have "y \<in> extensional ({..<s\<^sub>1} \<times> {..<s\<^sub>2})" using a PiE_iff by blast
     hence y_ext: "y \<in> extensional (set (List.product [0..<s\<^sub>1] [0..<s\<^sub>2]))"
       by (simp add:lessThan_atLeast0)
 
     (* Bit count of one encoded hash polynomial. *)
     have h_bit_count_aux: "bit_count (P\<^sub>e p 4 (y x)) \<le> ereal (4 + 4 * log 2 (8 + 2 * real n))"
       if b:"x \<in>  set (List.product [0..<s\<^sub>1] [0..<s\<^sub>2])" for x
     proof -
-      have "y x \<in> bounded_degree_polynomials (Field.mod_ring p) 4"
+      have "y x \<in> bounded_degree_polynomials (mod_ring p) 4"
         using b a by force
       hence "bit_count (P\<^sub>e p 4 (y x)) \<le> ereal ( real 4 * (log 2 (real p) + 1))"
         by (rule bounded_degree_polynomial_bit_count[OF p_gt_1] )
       also have "... \<le> ereal (real 4 * (log 2 (8 + 2 * real n) + 1) )"
         using p_gt_0 p_bound by simp
       also have "... \<le> ereal (4 + 4 * log 2 (8 + 2 * real n))"
         by simp
       finally show ?thesis
         by blast
     qed
 
     (* Bit count of all hash polynomials together. *)
     have h_bit_count: 
       "bit_count ((List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e P\<^sub>e p 4) y) \<le> ereal (real s\<^sub>1 * real s\<^sub>2 * (4 + 4 * log 2 (8 + 2 * real n)))"
       using fun_bit_count_est[where e="P\<^sub>e p 4", OF y_ext h_bit_count_aux]
       by simp
 
     (* Bit count of one sketch entry: its absolute value is first bounded by
        length as times (9 + 2 n), then int_bit_count_est is applied. *)
     have sketch_bit_count_aux:
       "bit_count (I\<^sub>e (sum_list (map (f2_hash p (y x)) as))) \<le> ereal (1 + 2 * log 2 (real (length as) * (18 + 4 * real n) + 1))" (is "?lhs \<le> ?rhs")
       if " x \<in> {0..<s\<^sub>1} \<times> {0..<s\<^sub>2}" for x
     proof -
       have "\<bar>sum_list (map (f2_hash p (y x)) as)\<bar> \<le> sum_list (map (abs \<circ> (f2_hash p (y x))) as)" 
         by (subst map_map[symmetric])  (rule sum_list_abs)
       also have "... \<le>  sum_list (map (\<lambda>_. (int p+1)) as)"
         by (rule sum_list_mono) (simp add:p_gt_0) 
       also have "... = int (length as) * (int p+1)"
         by (simp add: sum_list_triv)
       also have "... \<le> int (length as) * (9+2*(int n))"
         using p_bound by (intro mult_mono, auto)
       finally  have "\<bar>sum_list (map (f2_hash p (y x)) as)\<bar> \<le> int (length as) * (9 + 2 * int n)" by simp
       hence "?lhs \<le> ereal (2 * log 2 (real_of_int (2* (int (length as) * (9 + 2 * int n)) + 1)) + 1)"
         by (rule int_bit_count_est)
       also have "... = ?rhs" by (simp add:algebra_simps)
       finally show "?thesis" by simp
     qed
 
     (* Bit count of all sketch entries together. *)
     have 
       "bit_count ((List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e I\<^sub>e) (\<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (y i)) as)))
       \<le> ereal (real (length (List.product [0..<s\<^sub>1] [0..<s\<^sub>2]))) * (ereal (1 + 2 * log 2 (real (length as) * (18 + 4 * real n) + 1)))"
       by (intro fun_bit_count_est)  
        (simp_all add:extensional_def lessThan_atLeast0 sketch_bit_count_aux del:f2_hash.simps)
     also have "... = ereal (real s\<^sub>1 * real s\<^sub>2 * (1 + 2 * log 2 (real (length as) * (18 + 4 * real n) + 1)))"
       by simp
     finally have sketch_bit_count: 
        "bit_count ((List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e I\<^sub>e) (\<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (y i)) as))) \<le>
       ereal (real s\<^sub>1 * real s\<^sub>2 * (1 + 2 * log 2 (real (length as) * (18 + 4 * real n) + 1)))" by simp
 
     (* Split the encoded state into its five components ... *)
     have "bit_count (encode_f2_state (s\<^sub>1, s\<^sub>2, p, y, \<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (y i)) as))) \<le> 
       bit_count (N\<^sub>e s\<^sub>1) + bit_count (N\<^sub>e s\<^sub>2) +bit_count (N\<^sub>e p) +
       bit_count ((List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e P\<^sub>e p 4) y) +
       bit_count ((List.product [0..<s\<^sub>1] [0..<s\<^sub>2] \<rightarrow>\<^sub>e I\<^sub>e) (\<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (y i)) as)))"   
       by (simp add:Let_def s\<^sub>1_def s\<^sub>2_def encode_f2_state_def dependent_bit_count add.assoc)
     (* ... bound each component with the facts above ... *)
     also have "... \<le> ereal (2 * log 2 (real s\<^sub>1 + 1) + 1) + ereal (2 * log 2 (real s\<^sub>2 + 1) + 1) + ereal (2 * log 2 (2 * real n + 9) + 1) + 
       (ereal (real s\<^sub>1 * real s\<^sub>2) * (4 + 4 * log 2 (8 + 2 * real n))) + 
       (ereal (real s\<^sub>1 * real s\<^sub>2) * (1 + 2 * log 2 (real (length as) * (18 + 4 * real n) + 1) ))"
       by (intro add_mono exp_golomb_bit_count p_bit_count, auto intro: h_bit_count sketch_bit_count)
     (* ... and recognise the sum as f2_space_usage. *)
     also have "... = ereal (f2_space_usage (n, length as, \<epsilon>, \<delta>))"
       by (simp add:distrib_left add.commute s\<^sub>1_def[symmetric] s\<^sub>2_def[symmetric] Let_def)
     finally show "bit_count (encode_f2_state (s\<^sub>1, s\<^sub>2, p, y, \<lambda>i\<in>{..<s\<^sub>1} \<times> {..<s\<^sub>2}. sum_list (map (f2_hash p (y i)) as))) \<le>  
       ereal (f2_space_usage (n, length as, \<epsilon>, \<delta>))" 
       by simp
   qed
 
   (* The support of \<Omega> is exactly the function space assumed in fact a. *)
-  have "set_pmf \<Omega> = {..<s\<^sub>1} \<times> {..<s\<^sub>2} \<rightarrow>\<^sub>E bounded_degree_polynomials (Field.mod_ring p) 4"
+  have "set_pmf \<Omega> = {..<s\<^sub>1} \<times> {..<s\<^sub>2} \<rightarrow>\<^sub>E bounded_degree_polynomials (mod_ring p) 4"
     by (simp add: \<Omega>_def set_prod_pmf)  (simp add: space_def)
   thus ?thesis
     by (simp  add:mean_rv_alg_sketch AE_measure_pmf_iff del:f2_space_usage.simps, metis a)
 qed
 
 end
 
 
 text \<open>Main results of this section:\<close>
 
 (* Main correctness theorem. Assumptions: \<epsilon> lies strictly between 0 and 1,
    \<delta> > 0, and every stream element is below n. \<Omega> is the output distribution
    obtained by initialising with f2_init, folding f2_update over the stream
    and applying f2_result. Conclusion: with probability at least 1 - \<epsilon> the
    output is within relative error \<delta> of F 2 as.
    Proof: instantiate the locale lemma f2_alg_correct'. *)
 theorem f2_alg_correct:
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "\<delta> > 0"
   assumes "set as \<subseteq> {..<n}"
   defines "\<Omega> \<equiv> fold (\<lambda>a state. state \<bind> f2_update a) as (f2_init \<delta> \<epsilon> n) \<bind> f2_result"
   shows "\<P>(\<omega> in measure_pmf \<Omega>. \<bar>\<omega> - F 2 as\<bar> \<le> \<delta> * F 2 as) \<ge> 1-of_rat \<epsilon>"
   using f2_alg_correct'[OF assms(1,2,3)] \<Omega>_def by auto
 
 (* Main space-usage theorem. Under the same assumptions as f2_alg_correct,
    M is the distribution of the internal state after processing the stream
    (f2_init followed by folding f2_update). Almost every state of M has an
    encoding of at most f2_space_usage (n, length as, \<epsilon>, \<delta>) bits.
    Proof: instantiate f2_exact_space_usage' and rewrite with sketch_def. *)
 theorem f2_exact_space_usage:
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "\<delta> > 0"
   assumes "set as \<subseteq> {..<n}"
   defines "M \<equiv> fold (\<lambda>a state. state \<bind> f2_update a) as (f2_init \<delta> \<epsilon> n)"
   shows "AE \<omega> in M. bit_count (encode_f2_state \<omega>) \<le> f2_space_usage (n, length as, \<epsilon>, \<delta>)"
   using f2_exact_space_usage'[OF assms(1,2,3)]
   by (subst (asm) sketch_def[OF assms(1,2,3)], subst M_def, simp)
 
 (* Asymptotic space complexity: f2_space_usage, as a function of
    (n, m, \<epsilon>, \<delta>), is in big-O of
      ln (1 / \<epsilon>) / \<delta>\<^sup>2 times (ln n + ln m)
    with respect to the product filter ?F in which n and m tend to infinity
    and \<epsilon> and \<delta> tend to 0 from the right. *)
 theorem f2_asymptotic_space_complexity:
   "f2_space_usage \<in> O[at_top \<times>\<^sub>F at_top \<times>\<^sub>F at_right 0 \<times>\<^sub>F at_right 0](\<lambda> (n, m, \<epsilon>, \<delta>). 
   (ln (1 / of_rat \<epsilon>)) / (of_rat \<delta>)\<^sup>2 * (ln (real n) + ln (real m)))"
   (is "_ \<in> O[?F](?rhs)")
 proof -
   (* Projections selecting the individual parameters from the 4-tuple. *)
   define n_of :: "nat \<times> nat \<times> rat \<times> rat \<Rightarrow> nat" where "n_of = (\<lambda>(n, m, \<epsilon>, \<delta>). n)"
   define m_of :: "nat \<times> nat \<times> rat \<times> rat \<Rightarrow> nat" where "m_of = (\<lambda>(n, m, \<epsilon>, \<delta>). m)"
   define \<epsilon>_of :: "nat \<times> nat \<times> rat \<times> rat \<Rightarrow> rat" where "\<epsilon>_of = (\<lambda>(n, m, \<epsilon>, \<delta>). \<epsilon>)"
   define \<delta>_of :: "nat \<times> nat \<times> rat \<times> rat \<Rightarrow> rat" where "\<delta>_of = (\<lambda>(n, m, \<epsilon>, \<delta>). \<delta>)"
 
   (* g is the target bound ?rhs written with the projections. *)
   define g where "g = (\<lambda>x. (1/ (of_rat (\<delta>_of x))\<^sup>2) * (ln (1 / of_rat (\<epsilon>_of x))) * (ln (real (n_of x)) + ln (real (m_of x))))"
 
   (* evt: to show that P holds eventually in ?F it suffices to prove P x for
      all x with positive \<delta>_of x and \<epsilon>_of x whose reciprocals, and whose n_of x
      and m_of x, exceed freely chosen thresholds \<delta>, \<epsilon>, n, m. *)
   have evt: "(\<And>x. 
     0 < real_of_rat (\<delta>_of x) \<and> 0 < real_of_rat (\<epsilon>_of x) \<and> 
     1/real_of_rat (\<delta>_of x) \<ge> \<delta> \<and> 1/real_of_rat (\<epsilon>_of x) \<ge> \<epsilon> \<and>
     real (n_of x) \<ge> n \<and> real (m_of x) \<ge> m\<Longrightarrow> P x) 
     \<Longrightarrow> eventually P ?F"  (is "(\<And>x. ?prem x \<Longrightarrow> _) \<Longrightarrow> _")
     for \<delta> \<epsilon> n m P
     apply (rule eventually_mono[where P="?prem" and Q="P"])
     apply (simp add:\<epsilon>_of_def case_prod_beta' \<delta>_of_def n_of_def m_of_def)
      apply (intro eventually_conj eventually_prod1' eventually_prod2' 
         sequentially_inf eventually_at_right_less inv_at_right_0_inf)
     by (auto simp add:prod_filter_eq_bot)
 
   (* unit_1 .. unit_9: the constant function 1 is in big-O of each factor
      (and product of factors) occurring in the bound. *)
   have unit_1: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     using one_le_power
     by (intro landau_o.big_mono evt[where \<delta>="1"], auto simp add:power_one_over[symmetric])
 
   have unit_2: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     by (intro landau_o.big_mono  evt[where \<epsilon>="exp 1"])
      (auto intro!:iffD2[OF ln_ge_iff] simp add:abs_ge_iff)
 
   have unit_3: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. real (n_of x))"
     by (intro landau_o.big_mono evt, auto)
 
   have unit_4: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. real (m_of x))"
     by (intro landau_o.big_mono evt, auto)
 
   have unit_5: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. ln (real (n_of x)))"
     by (auto intro!: landau_o.big_mono evt[where n="exp 1"])
       (metis abs_ge_self linorder_not_le ln_ge_iff not_exp_le_zero order.trans)
 
   have unit_6: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. ln (real (n_of x)) + ln (real (m_of x)))"
     by (intro landau_sum_1 evt unit_5 iffD2[OF ln_ge_iff], auto)
 
   have unit_7: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. 1 / real_of_rat (\<epsilon>_of x))"
     by (intro landau_o.big_mono  evt[where \<epsilon>="1"], auto)
  
   have unit_8: "(\<lambda>_. 1) \<in> O[?F](g)" 
     unfolding g_def by (intro landau_o.big_mult_1 unit_1 unit_2 unit_6)
 
   have unit_9: "(\<lambda>_. 1) \<in> O[?F](\<lambda>x. real (n_of x) * real (m_of x))"
     by (intro landau_o.big_mult_1 unit_3 unit_4)
 
   (* l1: the ceiling term in \<delta> is in big-O of 1 / \<delta>\<^sup>2. *)
   have " (\<lambda>x. 6 * (1 / (real_of_rat (\<delta>_of x))\<^sup>2)) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     by (subst landau_o.big.cmult_in_iff, simp_all)
   hence l1: "(\<lambda>x. real (nat \<lceil>6 / (\<delta>_of x)\<^sup>2\<rceil>)) \<in> O[?F](\<lambda>x. 1 / (real_of_rat (\<delta>_of x))\<^sup>2)"
     by (intro landau_real_nat  landau_rat_ceil[OF unit_1]) (simp_all add:of_rat_divide of_rat_power)
 
   (* l2: the ceiling term in \<epsilon> is in big-O of ln (1 / \<epsilon>). *)
   have "(\<lambda>x. - ( ln (real_of_rat (\<epsilon>_of x)))) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     by (intro landau_o.big_mono evt) (subst ln_div, auto)
   hence l2: "(\<lambda>x. real (nat \<lceil>- (18 * ln (real_of_rat (\<epsilon>_of x)))\<rceil>)) \<in> O[?F](\<lambda>x. ln (1 / real_of_rat (\<epsilon>_of x)))"
     by (intro landau_real_nat landau_ceil[OF unit_2], simp)
 
   (* l3: the logarithm of the sketch-entry magnitude bound is in big-O of
      ln n + ln m. *)
   have l3_aux: " (\<lambda>x. real (m_of x) * (18 + 4 * real (n_of x)) + 1) \<in> O[?F](\<lambda>x. real (n_of x) * real (m_of x))"
     by (rule sum_in_bigo[OF _unit_9], subst mult.commute)
       (intro landau_o.mult sum_in_bigo, auto simp:unit_3)
 
   have "(\<lambda>x. ln (real (m_of x) * (18 + 4 * real (n_of x)) + 1)) \<in> O[?F](\<lambda>x. ln (real (n_of x) * real (m_of x)))"
      apply (rule landau_ln_2[where a="2"], simp, simp)
       apply (rule evt[where m="2" and n="1"])
      apply (metis dual_order.trans mult_left_mono mult_of_nat_commute of_nat_0_le_iff verit_prod_simplify(1))
     using l3_aux by simp
   also have "(\<lambda>x. ln (real (n_of x) * real (m_of x))) \<in> O[?F](\<lambda>x. ln (real (n_of x)) + ln(real (m_of x)))"
     by (intro landau_o.big_mono evt[where m="1" and n="1"], auto simp add:ln_mult)
   finally have l3: "(\<lambda>x. ln (real (m_of x) * (18 + 4 * real (n_of x)) + 1)) \<in> O[?F](\<lambda>x. ln (real (n_of x)) + ln (real (m_of x)))"
     using  landau_o.big_trans by simp
 
   (* l4, l5: the logarithmic terms in n alone are in big-O of ln n + ln m. *)
   have l4: "(\<lambda>x. ln (8 + 2 * real (n_of x))) \<in> O[?F](\<lambda>x. ln (real (n_of x)) + ln (real (m_of x)))"
     by (intro landau_sum_1  evt[where n="2"] landau_ln_2[where a="2"] iffD2[OF ln_ge_iff])
      (auto intro!: sum_in_bigo simp add:unit_3)
 
   have l5: "(\<lambda>x. ln (9 + 2 * real (n_of x))) \<in> O[?F](\<lambda>x. ln (real (n_of x)) + ln (real (m_of x)))"
     by (intro landau_sum_1  evt[where n="2"] landau_ln_2[where a="2"] iffD2[OF ln_ge_iff])
      (auto intro!: sum_in_bigo simp add:unit_3)
 
   (* l6 .. l8: the three logarithmic summands are each in big-O of g. *)
   have l6: "(\<lambda>x. ln (real (nat \<lceil>6 / (\<delta>_of x)\<^sup>2\<rceil>) + 1)) \<in> O[?F](g)"
     unfolding g_def
     by (intro landau_o.big_mult_1 landau_ln_3 sum_in_bigo unit_6 unit_2 l1 unit_1, simp)
 
   have l7: "(\<lambda>x. ln (9 + 2 * real (n_of x))) \<in> O[?F](g)"
     unfolding g_def
     by (intro landau_o.big_mult_1' unit_1 unit_2 l5)
 
   have l8: "(\<lambda>x. ln (real (nat \<lceil>- (18 * ln (real_of_rat (\<epsilon>_of x)))\<rceil>) + 1) ) \<in> O[?F](g)"
     unfolding g_def
     by (intro landau_o.big_mult_1 unit_6 landau_o.big_mult_1' unit_1 landau_ln_3  sum_in_bigo l2 unit_2) simp
 
   (* l9, l10: the dominant product term, first its third factor (l9), then
      the whole product (l10). *)
   have l9: "(\<lambda>x. 5 + 4 * ln (8 + 2 * real (n_of x)) / ln 2 + 2 * ln (real (m_of x) * (18 + 4 * real (n_of x)) + 1) / ln 2)
       \<in> O[?F](\<lambda>x. ln (real (n_of x)) + ln (real (m_of x)))"
     by (intro sum_in_bigo, auto simp: l3 l4 unit_6)
 
   have l10: "(\<lambda>x. real (nat \<lceil>6 / (\<delta>_of x)\<^sup>2\<rceil>) * real (nat \<lceil>- (18 * ln (real_of_rat (\<epsilon>_of x)))\<rceil>) * 
       (5 + 4 * ln (8 + 2 * real (n_of x)) / ln 2 + 2 * ln(real (m_of x) * (18 + 4 * real (n_of x)) + 1) / ln 2))
       \<in> O[?F](g)"
     unfolding g_def by (intro landau_o.mult, auto simp: l1 l2 l9)
 
   (* Final chain: rewrite f2_space_usage via the projections, bound it by g
      using l6, l7, l8, l10 and unit_8, then identify O[?F](g) with the
      stated bound. *)
   have "f2_space_usage = (\<lambda>x. f2_space_usage (n_of x, m_of x, \<epsilon>_of x, \<delta>_of x))"
     by (simp add:case_prod_beta' n_of_def \<epsilon>_of_def \<delta>_of_def m_of_def)
   also have "... \<in> O[?F](g)"
     by (auto intro!:sum_in_bigo simp:Let_def log_def l6 l7 l8 l10 unit_8)
   also have "... = O[?F](?rhs)"
     by (simp add:case_prod_beta' g_def n_of_def \<epsilon>_of_def \<delta>_of_def m_of_def)
   finally show ?thesis by simp
 qed
 
 end
diff --git a/thys/Frequency_Moments/Frequency_Moments.thy b/thys/Frequency_Moments/Frequency_Moments.thy
--- a/thys/Frequency_Moments/Frequency_Moments.thy
+++ b/thys/Frequency_Moments/Frequency_Moments.thy
@@ -1,115 +1,115 @@
 section "Frequency Moments"
 
 theory Frequency_Moments
   imports 
     Frequency_Moments_Preliminary_Results
-    Universal_Hash_Families.Field
+    Universal_Hash_Families.Universal_Hash_Families_More_Finite_Fields
     Interpolation_Polynomials_HOL_Algebra.Interpolation_Polynomial_Cardinalities
 begin
 
 text \<open>This section contains a definition of the frequency moments of a stream and a few general results about 
 frequency moments.\<close>
 
 (* F k xs: the k-th frequency moment of the list xs, i.e. the sum over the
    distinct elements x of xs of (number of occurrences of x in xs) to the
    power k, computed in the rationals. *)
 definition F where
   "F k xs = (\<Sum> x \<in> set xs. (rat_of_nat (count_list xs x)^k))"
 
 (* Frequency moments are non-negative: F is a sum of non-negative terms. *)
 lemma F_ge_0: "F k as \<ge> 0"
   unfolding F_def by (rule sum_nonneg, simp)
 
 (* Frequency moments of a non-empty list are strictly positive.
    Proof chain: 1 is at most the number of distinct elements, which equals a
    sum of ones, which is at most the sum of the k-th powers of the counts
    (each count is at least 1), which is F k as. *)
 lemma F_gr_0:
   assumes "as \<noteq> []"
   shows "F k as > 0"
 proof -
   (* A non-empty list has at least one distinct element. *)
   have "rat_of_nat 1 \<le> rat_of_nat (card (set as))"
     using assms card_0_eq[where A="set as"] 
     by (intro of_nat_mono)
      (metis List.finite_set One_nat_def Suc_leI neq0_conv set_empty)
   also have "... = (\<Sum>x\<in>set as. 1)" by simp
   (* Each element of set as occurs at least once (count_list_gr_1). *)
   also have "... \<le> (\<Sum>x\<in>set as. rat_of_nat (count_list as x) ^ k)"
     by (intro sum_mono one_le_power)
      (metis  count_list_gr_1  of_nat_1 of_nat_le_iff)
   also have "... \<le> F k as"
     by (simp add:F_def)
   finally show ?thesis by simp
 qed
 
 (* P\<^sub>e p n f: encoder for polynomials over mod_ring p. If p > 1 and f is in
    bounded_degree_polynomials (mod_ring p) n, the coefficients of f at
    indices 0..<n are encoded, each with Nb\<^sub>e p; otherwise the result is None. *)
 definition P\<^sub>e :: "nat \<Rightarrow> nat \<Rightarrow> nat list \<Rightarrow> bool list option" where
-  "P\<^sub>e p n f = (if p > 1 \<and> f \<in> bounded_degree_polynomials (Field.mod_ring p) n then
-    ([0..<n] \<rightarrow>\<^sub>e Nb\<^sub>e p) (\<lambda>i \<in> {..<n}. ring.coeff (Field.mod_ring p) f i) else None)"
+  "P\<^sub>e p n f = (if p > 1 \<and> f \<in> bounded_degree_polynomials (mod_ring p) n then
+    ([0..<n] \<rightarrow>\<^sub>e Nb\<^sub>e p) (\<lambda>i \<in> {..<n}. ring.coeff (mod_ring p) f i) else None)"
 
 (* P\<^sub>e p n satisfies is_encoding for all p and n.
    Case p > 1: the map from a polynomial to its first n coefficients is
    injective on bounded_degree_polynomials (mod_ring p) n (fact a), so P\<^sub>e is
    the composition of an encoding with an injective map.
    Case p \<le> 1: P\<^sub>e returns None everywhere, handled by encoding_triv. *)
 lemma poly_encoding:
   "is_encoding (P\<^sub>e p n)"
 proof (cases "p > 1")
   case True
-  interpret cring "Field.mod_ring p"
+  interpret cring "mod_ring p"
     using mod_ring_is_cring True by blast
   (* a: restricting the coefficient function to {..<n} is injective. *)
   have a:"inj_on (\<lambda>x. (\<lambda>i \<in> {..<n}. (coeff x i))) (bounded_degree_polynomials (mod_ring p) n)"
   proof (rule inj_onI)
     fix x y
     assume b:"x \<in> bounded_degree_polynomials (mod_ring p) n"
     assume c:"y \<in> bounded_degree_polynomials (mod_ring p) n"
     assume d:"restrict (coeff x) {..<n} = restrict (coeff y) {..<n}"
     (* All coefficients agree: below n by assumption d, from n on both are
        the zero of mod_ring p (coeff_length). *)
     have "coeff x i = coeff y i" for i
     proof (cases "i < n")
       case True
       then show ?thesis by (metis lessThan_iff restrict_apply d)
     next
       case False
       hence e: "i \<ge> n" by linarith
       have "coeff x i = \<zero>\<^bsub>mod_ring p\<^esub>"
         using b e by (subst coeff_length, auto simp:bounded_degree_polynomials_length)
       also have "... = coeff y i"
         using c e by (subst coeff_length, auto simp:bounded_degree_polynomials_length)
       finally show ?thesis by simp
     qed
     (* Polynomials with equal coefficients are equal. *)
     then show "x = y"
       using b c univ_poly_carrier 
       by (subst coeff_iff_polynomial_cond) (auto simp:bounded_degree_polynomials_length) 
   qed
 
   have "is_encoding (\<lambda>f. P\<^sub>e p n f)"
     unfolding P\<^sub>e_def using a True
     by (intro encoding_compose[where f="([0..<n] \<rightarrow>\<^sub>e Nb\<^sub>e p)"] fun_encoding bounded_nat_encoding) 
      auto
   thus ?thesis by simp
 next
   case False
   hence "is_encoding (\<lambda>f. P\<^sub>e p n f)"
     unfolding P\<^sub>e_def using encoding_triv by simp
   then show ?thesis by simp
 qed
 
 (* Size of an encoded polynomial: for p > 1 and x in
    bounded_degree_polynomials (mod_ring p) n, the encoding P\<^sub>e p n x uses at
    most n times (log 2 p + 1) bits. *)
 lemma bounded_degree_polynomial_bit_count:
   assumes "p > 1"
-  assumes "x \<in> bounded_degree_polynomials (Field.mod_ring p) n"
+  assumes "x \<in> bounded_degree_polynomials (mod_ring p) n"
   shows "bit_count (P\<^sub>e p n x) \<le> ereal (real n * (log 2 p + 1))"
 proof -
-  interpret cring "Field.mod_ring p"
+  interpret cring "mod_ring p"
     using mod_ring_is_cring assms by blast
 
   have a: "x \<in> carrier (poly_ring (mod_ring p))"
     using assms(2) by (simp add:bounded_degree_polynomials_def)
 
   (* b: the per-coefficient bit count is at most log 2 p + 1. *)
   have "real_of_int \<lfloor>log 2 (p-1)\<rfloor>+1 \<le> log 2 (p-1) + 1"
     using floor_eq_iff by (intro add_mono, auto) 
   also have "... \<le> log 2 p + 1"
     using assms by (intro add_mono, auto)
   finally have b: "\<lfloor>log 2 (p-1)\<rfloor>+1 \<le> log 2 p + 1"
     by simp
 
   (* The total bit count is the sum of the bit counts of the n coefficients. *)
   have "bit_count (P\<^sub>e p n x) = (\<Sum> k \<leftarrow> [0..<n]. bit_count (Nb\<^sub>e p (coeff x k)))"
     using assms restrict_extensional 
     by (auto intro!:arg_cong[where f="sum_list"] simp add:P\<^sub>e_def fun_bit_count lessThan_atLeast0)
   (* Each coefficient is encoded with floorlog 2 (p-1) bits. *)
   also have "... = (\<Sum> k \<leftarrow> [0..<n]. ereal (floorlog 2 (p-1)))"
     using coeff_in_carrier[OF a] mod_ring_carr 
     by (subst bounded_nat_bit_count_2, auto)
   also have "... = n * ereal (floorlog 2 (p-1))"
     by (simp add: sum_list_triv)
   also have "... = n * real_of_int (\<lfloor>log 2 (p-1)\<rfloor>+1)" 
     using assms(1) by (simp add:floorlog_def)
   also have "... \<le> ereal (real n * (log 2 p + 1))" 
     by (subst ereal_less_eq, intro mult_left_mono b, auto)
   finally show ?thesis by simp
 qed
 
 end
\ No newline at end of file
diff --git a/thys/Frequency_Moments/Product_PMF_Ext.thy b/thys/Frequency_Moments/Product_PMF_Ext.thy
--- a/thys/Frequency_Moments/Product_PMF_Ext.thy
+++ b/thys/Frequency_Moments/Product_PMF_Ext.thy
@@ -1,210 +1,210 @@
 section \<open>Indexed Products of Probability Mass Functions\<close>
 
 theory Product_PMF_Ext
-  imports Main Probability_Ext "HOL-Probability.Product_PMF" Universal_Hash_Families.Preliminary_Results
+  imports Main Probability_Ext "HOL-Probability.Product_PMF" Universal_Hash_Families.Universal_Hash_Families_More_Independent_Families
 begin
 
 hide_const "Isolated.discrete"
 
 text \<open>This section introduces a restricted version of @{term "Pi_pmf"}, where the default value is @{term "undefined"},
 and contains some results about that case that complement those in @{theory "HOL-Probability.Product_PMF"}.\<close>
 
 abbreviation prod_pmf where "prod_pmf I M \<equiv> Pi_pmf I undefined M" (* Pi_pmf with the default value fixed to undefined *)
 
 lemma pmf_prod_pmf: (* point mass of prod_pmf: product of the component masses on extensional functions, 0 otherwise *)
   assumes "finite I"
   shows "pmf (prod_pmf I M) x = (if x \<in> extensional I then \<Prod>i \<in> I. (pmf (M i)) (x i) else 0)"
   by (simp add:  pmf_Pi[OF assms(1)] extensional_def)
 
 lemma PiE_defaut_undefined_eq: "PiE_dflt I undefined M = PiE I M" (* with default undefined, PiE_dflt coincides with PiE *)
   by (simp add:PiE_dflt_def PiE_def extensional_def Pi_def set_eq_iff) blast
 
 lemma set_prod_pmf: (* the support of prod_pmf is the extensional product of the component supports *)
   assumes "finite I"
   shows "set_pmf (prod_pmf I M) = PiE I (set_pmf \<circ> M)"
   by (simp add:set_Pi_pmf[OF assms] PiE_defaut_undefined_eq)
 
 text \<open>A more general version of @{thm [source] "measure_Pi_pmf_Pi"}.\<close>
 lemma prob_prod_pmf': (* the probability of Pi J A, constraining only the coordinates in J, is the product of the component probabilities over J *)
   assumes "finite I"
   assumes "J \<subseteq> I"
   shows "measure (measure_pmf (Pi_pmf I d M)) (Pi J A) = (\<Prod> i \<in> J. measure (M i) (A i))"
 proof -
   have a:"Pi J A = Pi I (\<lambda>i. if i \<in> J then A i else UNIV)" (* a: rewrite as a constraint on all of I, using UNIV outside J *)
     using assms by (simp add:Pi_def set_eq_iff, blast)
   show ?thesis
     using assms
     by (simp add:if_distrib  a measure_Pi_pmf_Pi[OF assms(1)] prod.If_cases[OF assms(1)] Int_absorb1)
 qed
 
 lemma prob_prod_pmf_slice: (* an event that only inspects coordinate i has the probability it has under M i *)
   assumes "finite I"
   assumes "i \<in> I"
   shows "measure (measure_pmf (prod_pmf I M)) {\<omega>. P (\<omega> i)} = measure (M i) {\<omega>. P \<omega>}"
   using prob_prod_pmf'[OF assms(1), where J="{i}" and M="M" and A="\<lambda>_. Collect P"] (* instance of prob_prod_pmf' with the singleton index set {i} *)
   by (simp add:assms Pi_def)
 
 
 definition restrict_dfl where "restrict_dfl f A d = (\<lambda>x. if x \<in> A then f x else d)" (* f on A, the constant d outside A *)
 
 lemma pi_pmf_decompose: (* Pi_pmf I d M is the image of a product, indexed by f ` I, of the products over the fibres f -` {j} \<inter> I *)
   assumes "finite I"
   shows "Pi_pmf I d M = map_pmf (\<lambda>\<omega>. restrict_dfl (\<lambda>i. \<omega> (f i) i) I d) (Pi_pmf (f ` I) (\<lambda>_. d) (\<lambda>j. Pi_pmf (f -` {j} \<inter> I) d M))"
 proof -
   have fin_F_I:"finite (f ` I)" using assms by blast
 
   have "finite I \<Longrightarrow> ?thesis"
     using fin_F_I
   proof (induction "f ` I" arbitrary: I rule:finite_induct) (* induction on the finite image f ` I, generalizing I *)
     case empty
     then show ?case by (simp add:restrict_dfl_def)
   next
     case (insert x F)
     have a: "(f -` {x} \<inter> I) \<union> (f -` F \<inter> I) = I" (* a: I is the fibre over x together with the preimage of F *)
       using insert(4) by blast
     have b: "F = f `  (f -` F \<inter> I) " using insert(2,4) 
       by (auto simp add:set_eq_iff image_def vimage_def) 
     have c: "finite (f -` F \<inter> I)" using insert by blast
     have d: "\<And>j. j \<in> F \<Longrightarrow> (f -` {j} \<inter> (f -` F \<inter> I)) = (f -` {j} \<inter> I)" (* d: fibres over F are unchanged by restricting to the preimage of F *)
       using insert(4) by blast 
 
     have " Pi_pmf I d M = Pi_pmf ((f -` {x} \<inter> I) \<union> (f -` F \<inter> I)) d M"
       by (simp add:a)
     also have "... = map_pmf (\<lambda>(g, h) i. if i \<in> f -` {x} \<inter> I then g i else h i) 
       (pair_pmf (Pi_pmf (f -` {x} \<inter> I) d M) (Pi_pmf (f -` F \<inter> I) d M))"
       using insert by (subst Pi_pmf_union) auto (* split the product along the union from a *)
     also have "... = map_pmf (\<lambda>(g,h) i. if f i = x \<and> i \<in> I then g i else if f i \<in> F \<and> i \<in> I then h (f i) i else d)
       (pair_pmf (Pi_pmf (f -` {x} \<inter> I) d M) (Pi_pmf F (\<lambda>_. d) (\<lambda>j. Pi_pmf (f -` {j} \<inter> (f -` F \<inter> I)) d M)))"
       by (simp add:insert(3)[OF b c] map_pmf_comp case_prod_beta' apsnd_def map_prod_def 
           pair_map_pmf2 b[symmetric] restrict_dfl_def) (metis fst_conv snd_conv) (* induction hypothesis applied to f -` F \<inter> I *)
     also have "... = map_pmf (\<lambda>(g,h) i. if i \<in> I then (h(x := g)) (f i) i else d) 
       (pair_pmf (Pi_pmf (f -` {x} \<inter> I) d M) (Pi_pmf F (\<lambda>_. d) (\<lambda>j. Pi_pmf (f -` {j} \<inter> I) d M)))" 
       using insert(4) d
       by (intro arg_cong2[where f="map_pmf"] ext) (auto simp add:case_prod_beta' cong:Pi_pmf_cong) 
     also have "... = map_pmf (\<lambda>\<omega> i. if i \<in> I then \<omega> (f i) i else d) (Pi_pmf (insert x F) (\<lambda>_. d) (\<lambda>j. Pi_pmf (f -` {j} \<inter> I) d M))"
       by (simp add:Pi_pmf_insert[OF insert(1,2)] map_pmf_comp case_prod_beta') (* recombine the pair into a product over insert x F *)
     finally show ?case by (simp add:insert(4) restrict_dfl_def)
   qed
   thus ?thesis using assms by blast
 qed
 
 lemma restrict_dfl_iter: "restrict_dfl (restrict_dfl f I d) J d = restrict_dfl f (I \<inter> J) d" (* two restrictions with the same default collapse to one on the intersection *)
   by (rule ext, simp add:restrict_dfl_def)
 
 lemma indep_vars_restrict': (* the restrictions of a sample to the fibres f -` {i} \<inter> I, for i in f ` I, are independent under Pi_pmf I d M *)
   assumes "finite I"
   shows "prob_space.indep_vars (Pi_pmf I d M) (\<lambda>_. discrete) (\<lambda>i \<omega>. restrict_dfl \<omega> (f -` {i} \<inter> I) d) (f ` I)"
 proof -
   let ?Q = "(Pi_pmf (f ` I) (\<lambda>_. d) (\<lambda>i. Pi_pmf (I \<inter> f -` {i}) d M))" (* ?Q: product over f ` I of the fibre-wise products *)
   have a:"prob_space.indep_vars ?Q (\<lambda>_. discrete) (\<lambda>i \<omega>. \<omega> i) (f ` I)" (* a: the coordinate projections of ?Q are independent *)
     using assms by (intro indep_vars_Pi_pmf, blast)
   have b: "AE x in measure_pmf ?Q. \<forall>i\<in>f ` I. x i = restrict_dfl (\<lambda>i. x (f i) i) (I \<inter> f -` {i}) d" (* b: almost surely each coordinate equals the restricted form *)
     using assms
     by (auto simp add:PiE_dflt_def restrict_dfl_def AE_measure_pmf_iff set_Pi_pmf comp_def Int_commute)
   have "prob_space.indep_vars ?Q (\<lambda>_. discrete) (\<lambda>i x. restrict_dfl (\<lambda>i. x (f i) i) (I \<inter> f -` {i}) d) (f ` I)"
     by (rule prob_space.indep_vars_cong_AE[OF prob_space_measure_pmf b a],  simp)
   thus ?thesis
     using prob_space_measure_pmf 
     by (auto intro!:prob_space.indep_vars_distr simp:pi_pmf_decompose[OF assms, where f="f"]  
         map_pmf_rep_eq comp_def restrict_dfl_iter Int_commute) (* transfer to Pi_pmf I d M through pi_pmf_decompose *)
 qed
 
 lemma indep_vars_restrict_intro': (* introduction rule: variables X' i (i in J = f ` I), each depending only on the coordinates in f -` {i} \<inter> I, are independent *)
   assumes "finite I"
   assumes "\<And>i \<omega>. i \<in> J \<Longrightarrow> X' i \<omega> = X' i (restrict_dfl \<omega> (f -` {i} \<inter> I) d)"
   assumes "J = f ` I"
   assumes "\<And>\<omega> i. i \<in> J \<Longrightarrow>  X' i \<omega> \<in> space (M' i)"
   shows "prob_space.indep_vars (measure_pmf (Pi_pmf I d p)) M' (\<lambda>i \<omega>. X' i \<omega>) J"
 proof -
   define M where "M \<equiv> measure_pmf (Pi_pmf I d p)"
   interpret prob_space "M"
     using M_def prob_space_measure_pmf by blast
   have "indep_vars (\<lambda>_. discrete) (\<lambda>i x. restrict_dfl x (f -` {i} \<inter> I) d) (f ` I)" 
     unfolding M_def  by (rule indep_vars_restrict'[OF assms(1)])
   hence "indep_vars M' (\<lambda>i \<omega>. X' i (restrict_dfl \<omega> ( f -` {i} \<inter> I) d)) (f ` I)" (* compose the independent restrictions with X' *)
     using assms(4)
     by (intro indep_vars_compose2[where Y="X'" and N="M'" and M'="\<lambda>_. discrete"])  (auto simp:assms(3))
   hence "indep_vars M' (\<lambda>i \<omega>. X' i \<omega>) (f ` I)" (* drop the restriction using assumption 2 *)
     using assms(2)[symmetric]
     by (simp add:assms(3) cong:indep_vars_cong)
   thus ?thesis
     unfolding M_def using assms(3) by simp 
 qed
 
 lemma  (* integrability and expectation of a function of the single coordinate i reduce to the component M i *)
   fixes f :: "'b \<Rightarrow> ('c :: {second_countable_topology,banach,real_normed_field})"
   assumes "finite I"
   assumes "i \<in> I"
   assumes "integrable (measure_pmf (M i)) f"
   shows  integrable_Pi_pmf_slice: "integrable (Pi_pmf I d M) (\<lambda>x. f (x i))"
   and expectation_Pi_pmf_slice: "integral\<^sup>L (Pi_pmf I d M) (\<lambda>x. f (x i)) = integral\<^sup>L (M i) f"
 proof -
   have a:"distr (Pi_pmf I d M) (M i) (\<lambda>\<omega>. \<omega> i) = distr (Pi_pmf I d M) discrete (\<lambda>\<omega>. \<omega> i)" (* a: the target measurable space of distr can be swapped for discrete *)
     by (rule distr_cong, auto)
 
   have b: "measure_pmf.random_variable (M i) borel f"
     using assms(3) by simp
 
   have c:"integrable (distr (Pi_pmf I d M) (M i) (\<lambda>\<omega>. \<omega> i)) f" (* c: f is integrable under the distribution of coordinate i *)
     using assms(1,2,3)
     by (subst a, subst map_pmf_rep_eq[symmetric], subst Pi_pmf_component, auto)
 
   show "integrable (Pi_pmf I d M) (\<lambda>x. f (x i))"
     by (rule integrable_distr[where f="f" and M'="M i"])  (auto intro: c)
 
   have "integral\<^sup>L (Pi_pmf I d M) (\<lambda>x. f (x i)) = integral\<^sup>L (distr (Pi_pmf I d M) (M i) (\<lambda>\<omega>. \<omega> i)) f"
     using b by (intro integral_distr[symmetric], auto)
   also have "... =  integral\<^sup>L (map_pmf (\<lambda>\<omega>. \<omega> i) (Pi_pmf I d M)) f"
     by (subst a, subst map_pmf_rep_eq[symmetric], simp)
   also have "... =  integral\<^sup>L (M i) f"
     using assms(1,2) by (simp add: Pi_pmf_component) (* the i-th component of the product is M i *)
   finally show "integral\<^sup>L (Pi_pmf I d M) (\<lambda>x. f (x i)) = integral\<^sup>L (M i) f" by simp
 qed
 
 text \<open>This is an improved version of @{thm [source] "expectation_prod_Pi_pmf"}.
 It works for general normed fields instead of non-negative real functions.\<close>
 
 lemma expectation_prod_Pi_pmf: (* the expectation of a product of per-coordinate functions is the product of the component expectations *)
   fixes f :: "'a \<Rightarrow> 'b \<Rightarrow> ('c :: {second_countable_topology,banach,real_normed_field})"
   assumes "finite I"
   assumes "\<And>i. i \<in> I \<Longrightarrow> integrable (measure_pmf (M i)) (f i)"
   shows   "integral\<^sup>L (Pi_pmf I d M) (\<lambda>x. (\<Prod>i \<in> I. f i (x i))) = (\<Prod> i \<in> I. integral\<^sup>L (M i) (f i))"
 proof -
   have a: "prob_space.indep_vars (measure_pmf (Pi_pmf I d M)) (\<lambda>_. borel) (\<lambda>i \<omega>. f i (\<omega> i)) I" (* a: the factors f i (\<omega> i) are independent *)
     by (intro prob_space.indep_vars_compose2[where Y="f" and M'="\<lambda>_. discrete"] 
         prob_space_measure_pmf indep_vars_Pi_pmf assms(1)) auto
   have "integral\<^sup>L (Pi_pmf I d M) (\<lambda>x. (\<Prod>i \<in> I. f i (x i))) = (\<Prod> i \<in> I. integral\<^sup>L (Pi_pmf I d M) (\<lambda>x. f i (x i)))"
     by (intro prob_space.indep_vars_lebesgue_integral prob_space_measure_pmf assms(1,2) 
         a integrable_Pi_pmf_slice) auto
   also have "... = (\<Prod> i \<in> I. integral\<^sup>L (M i) (f i))"
     by (intro prod.cong expectation_Pi_pmf_slice assms(1,2)) auto (* each factor reduces to its own component *)
   finally show ?thesis by simp
 qed
 
 lemma variance_prod_pmf_slice: (* the variance of a function of coordinate i equals its variance under M i *)
   fixes f :: "'a \<Rightarrow> real"
   assumes "i \<in> I" "finite I"
   assumes "integrable (measure_pmf (M i)) (\<lambda>\<omega>. f \<omega>^2)"
   shows "prob_space.variance (Pi_pmf I d M) (\<lambda>\<omega>. f (\<omega> i)) = prob_space.variance (M i) f"
 proof -
   have a:"integrable (measure_pmf (M i)) f" (* a: square-integrable implies integrable *)
     using assms(3) measure_pmf.square_integrable_imp_integrable by auto
   have b:" integrable (measure_pmf (Pi_pmf I d M)) (\<lambda>x. (f (x i))\<^sup>2)"
     by (rule integrable_Pi_pmf_slice[OF assms(2) assms(1)], metis assms(3))
   have c:" integrable (measure_pmf (Pi_pmf I d M)) (\<lambda>x. (f (x i)))"
     by (rule integrable_Pi_pmf_slice[OF assms(2) assms(1)], metis a)
 
   have "measure_pmf.expectation (Pi_pmf I d M) (\<lambda>x. (f (x i))\<^sup>2) - (measure_pmf.expectation (Pi_pmf I d M) (\<lambda>x. f (x i)))\<^sup>2 =
       measure_pmf.expectation (M i) (\<lambda>x. (f x)\<^sup>2) - (measure_pmf.expectation (M i) f)\<^sup>2"
     using assms a b c by ((subst expectation_Pi_pmf_slice[OF assms(2,1)])?, simp)+ (* both expectations reduce to M i *)
 
   thus ?thesis
     using assms a b c by (simp add: measure_pmf.variance_eq)
 qed
 
 lemma Pi_pmf_bind_return: (* a product of mapped components equals the mapped product; the default d' on the right-hand side is arbitrary *)
   assumes "finite I"
   shows "Pi_pmf I d (\<lambda>i. M i \<bind> (\<lambda>x. return_pmf (f i x))) = Pi_pmf I d' M \<bind> (\<lambda>x. return_pmf (\<lambda>i. if i \<in> I then f i (x i) else d))"
   using assms by (simp add: Pi_pmf_bind[where d'="d'"])
 
 end
diff --git a/thys/Median_Method/Median.thy b/thys/Median_Method/Median.thy
--- a/thys/Median_Method/Median.thy
+++ b/thys/Median_Method/Median.thy
@@ -1,887 +1,887 @@
 section \<open>Intervals are Borel measurable\<close>
 
 theory Median
   imports 
     "HOL-Probability.Probability" 
     "HOL-Library.Multiset" 
-    "Universal_Hash_Families.Preliminary_Results"
+    "Universal_Hash_Families.Universal_Hash_Families_More_Independent_Families"
 begin
 
 text \<open>This section contains a proof that intervals are Borel measurable, where an interval is
 defined as a convex subset of a linearly ordered space; more precisely, a set is an interval if,
 for each triple of points $x < y < z$, whenever $x$ and $z$ are in the set, so is $y$.
 This includes ordinary intervals like @{term "{a..b}"}, @{term "{a<..<b}"} but also for example
 @{term [show_types] "{(x::rat). x * x < 2}"} which cannot be expressed in the standard notation.
 
 In @{theory "HOL-Analysis.Borel_Space"} there are proofs for the measurability of each specific
 type of interval, but those unfortunately do not help if we want to express the result about the
 median bound for arbitrary types of intervals.\<close>
 
 definition interval :: "('a :: linorder) set \<Rightarrow> bool" where (* I contains every point lying between two of its members *)
   "interval I = (\<forall>x y z. x \<in> I \<longrightarrow> z \<in> I \<longrightarrow> x \<le> y \<longrightarrow> y \<le> z \<longrightarrow> y \<in> I)"
 
 definition up_ray :: "('a :: linorder) set \<Rightarrow> bool" where (* I is upward closed *)
   "up_ray I = (\<forall>x y. x \<in> I \<longrightarrow> x \<le> y \<longrightarrow> y \<in> I)"
 
 lemma up_ray_borel: (* an upward-closed set is closed or open, hence Borel *)
   assumes "up_ray (I :: (('a :: linorder_topology) set))"
   shows "I \<in> borel"
 proof (cases "closed I")
   case True
   then show ?thesis using borel_closed by blast
 next
   case False
   hence b:"\<not> closed I" by blast
 
   have "open I" (* if I is not closed, every point of I has an open neighbourhood inside I *)
   proof (rule Topological_Spaces.openI)
     fix x
     assume c:"x \<in> I"
     show "\<exists>T. open T \<and> x \<in> T \<and> T \<subseteq> I"
     proof (cases "\<exists>y. y < x \<and> y \<in> I")
       case True
       then obtain y where a:"y < x \<and> y \<in> I" by blast
       have "open {y<..}" by simp (* the open ray above a smaller member y is the neighbourhood *)
       moreover have "x \<in> {y<..}" using a by simp
       moreover have "{y<..} \<subseteq> I"
         using a assms(1) by (auto simp: up_ray_def) 
       ultimately show ?thesis by blast
     next
       case False (* x is the least element of I, so I = {x..} would be closed, contradicting b *)
       hence "I \<subseteq> {x..}" using linorder_not_less by auto
       moreover have "{x..} \<subseteq> I"
         using c assms(1) unfolding up_ray_def by blast
       ultimately have "I = {x..}" 
         by (rule order_antisym)
       moreover have "closed {x..}" by simp
       ultimately have "False" using b by auto
       then show ?thesis by simp
     qed
   qed
   then show ?thesis by simp
 qed
 
 definition down_ray :: "('a :: linorder) set \<Rightarrow> bool" where (* I is downward closed *)
   "down_ray I = (\<forall>x y. y \<in> I \<longrightarrow> x \<le> y \<longrightarrow> x \<in> I)"
 
 lemma down_ray_borel: (* a downward-closed set is Borel, via its complement *)
   assumes "down_ray (I :: (('a :: linorder_topology) set))"
   shows "I \<in> borel"
 proof -
   have "up_ray (-I)" using assms (* the complement of a down-ray is an up-ray *)
     by (simp add: up_ray_def down_ray_def, blast)
   hence "(-I) \<in> borel" using up_ray_borel by blast
   thus "I \<in> borel" 
     by (metis borel_comp double_complement)
 qed
 
 text \<open>Main result of this section:\<close>
 
 lemma interval_borel: (* an interval is the intersection of an up-ray and a down-ray, both Borel *)
   assumes "interval (I :: (('a :: linorder_topology) set))"
   shows "I \<in> borel"
 proof (cases "I = {}")
   case True
   then show ?thesis by simp
 next
   case False
   then obtain x where a:"x \<in> I" by blast (* fix a member x of the non-empty interval *)
   have "\<And>y z. y \<in> I \<union> {x..} \<Longrightarrow> y \<le> z \<Longrightarrow> z \<in> I \<union> {x..}" 
     by (metis assms a interval_def  IntE UnE Un_Int_eq(1) Un_Int_eq(2) atLeast_iff nle_le order.trans)
   hence "up_ray (I \<union> {x..})"
     using up_ray_def by blast
   hence b:"I \<union> {x..} \<in> borel" 
     using up_ray_borel by blast
 
   have "\<And>y z. y \<in> I \<union> {..x} \<Longrightarrow> z \<le> y \<Longrightarrow> z \<in> I \<union> {..x}" 
     by (metis assms a interval_def UnE UnI1 UnI2 atMost_iff dual_order.trans linorder_le_cases)
   hence "down_ray (I \<union> {..x})"
     using down_ray_def by blast
   hence c:"I \<union> {..x} \<in> borel"
     using down_ray_borel by blast
 
   have "I = (I \<union> {x..}) \<inter> (I \<union> {..x})" (* the two rays intersect exactly in I *)
     using a by fastforce    
 
   then show ?thesis using b c
     by (metis sets.Int)
 qed
 
 section \<open>Order statistics are Borel measurable\<close>
 
 text \<open>This section contains a proof that order statistics of Borel measurable random variables are
 themselves Borel measurable.
 
 The proof relies on the existence of branch-free comparison-sort algorithms. Given a sequence length,
 these algorithms perform compare-swap operations on predefined pairs of positions. In particular, the
 result of a comparison does not affect future operations. Examples of branch-free comparison-sort
 algorithms are shell-sort and bubble-sort without the early exit.
 
 The advantage of using such a comparison-sort algorithm is that it can be lifted to work on random
 variables, where the result of a compare-swap operation on two random variables @{term"X"} and
 @{term"Y"} can be represented as the expressions @{term "\<lambda>\<omega>. min (X \<omega>) (Y \<omega>)"} and
 @{term "\<lambda>\<omega>. max (X \<omega>) (Y \<omega>)"}.
 
 Because taking the point-wise minimum (resp. maximum) of two random variables is still
 Borel measurable, and because the entire sorting operation can be represented using such
 compare-swap operations, we can show that all order statistics are Borel measurable.\<close>
 
 fun sort_primitive where (* compare-swap on positions i and j: i receives the minimum, j the maximum, all other positions are unchanged *)
   "sort_primitive i j f k = (if k = i then min (f i) (f j) else (if k = j then max (f i) (f j) else f k))"
 
 fun sort_map where (* applies, in list order, the compare-swaps sort_primitive j i for all pairs j < i < n to f *)
   "sort_map f n = fold id [sort_primitive j i. i <- [0..<n], j <- [0..<i]] f"
 
 lemma sort_map_ind: (* recursive step: sort_map for Suc n applies the compare-swaps against position n to sort_map f n *)
   "sort_map f (Suc n) = fold id [sort_primitive j n. j <- [0..<n]] (sort_map f n)"
   by simp
 
 lemma sort_map_strict_mono: (* the first n outputs of sort_map are ordered: for i < j < n, entry i is at most entry j *)
   fixes f :: "nat \<Rightarrow> 'b :: linorder"
   shows "j < n \<Longrightarrow> i < j \<Longrightarrow> sort_map f n i \<le> sort_map f n j"
 proof (induction n arbitrary: i j)
   case 0
   then show ?case by simp
 next
   case (Suc n)
   define g where "g = (\<lambda>k. fold id [sort_primitive j n. j <- [0..<k]] (sort_map f n))" (* g k: state after the first k compare-swaps against position n *)
   define k where "k = n"
   have a:"(\<forall>i j. j < n \<longrightarrow> i < j \<longrightarrow> g k i \<le> g k j) \<and> (\<forall>l. l < k \<longrightarrow> g k l \<le> g k n)" (* invariant: positions below n stay ordered, and positions below k are at most position n *)
   proof (induction k)
     case 0
     then show ?case using Suc by (simp add:g_def del:sort_map.simps)
   next
     case (Suc k)
     have "g (Suc k) = sort_primitive k n (g k)" 
       by (simp add:g_def)
     then show ?case using Suc
       apply (cases "g k k \<le> g k n")
        apply (simp add:min_def max_def)
        using less_antisym apply blast
       apply (cases "g k n \<le> g k k")
        apply (simp add:min_def max_def)
        apply (metis less_antisym max.coboundedI2 max.orderE)
       by simp
   qed
 
   hence "\<And>i j. j < Suc n \<Longrightarrow> i < j \<Longrightarrow> g n i \<le> g n j"
     apply (simp add:k_def) using less_antisym by blast
   moreover have "sort_map f (Suc n) = g n" 
     by (simp add:sort_map_ind g_def del:sort_map.simps)
   ultimately show ?case
     using Suc by (simp del:sort_map.simps)
 qed
 
 lemma sort_map_mono: (* same as sort_map_strict_mono, also allowing i = j *)
   fixes f :: "nat \<Rightarrow> 'b :: linorder"
   shows "j < n \<Longrightarrow> i \<le> j \<Longrightarrow> sort_map f n i \<le> sort_map f n j"
   by (metis sort_map_strict_mono eq_iff le_imp_less_or_eq)
 
 lemma sort_map_perm: (* sort_map preserves the multiset of the first n values *)
   fixes f :: "nat \<Rightarrow> 'b :: linorder"
   shows "image_mset (sort_map f n) (mset [0..<n]) = image_mset f (mset [0..<n])"
 proof -
   define is_swap where "is_swap = (\<lambda>(ts :: ((nat \<Rightarrow> 'b) \<Rightarrow> nat \<Rightarrow> 'b)). \<exists>i < n. \<exists>j < n. ts = sort_primitive i j)" (* compare-swaps on positions below n *)
   define t :: "((nat \<Rightarrow> 'b) \<Rightarrow> nat \<Rightarrow> 'b) list" 
     where "t = [sort_primitive j i. i <- [0..<n], j <- [0..<i]]"
 
   have a: "\<And>x f. is_swap x \<Longrightarrow> image_mset (x f) (mset_set {0..<n}) = image_mset f (mset_set {0..<n})" (* a: a single compare-swap preserves the multiset *)
   proof -
     fix x
     fix f :: "nat \<Rightarrow> 'b :: linorder"
     assume "is_swap x"
     then obtain i j where x_def: "x = sort_primitive i j" and i_bound: "i < n" and j_bound:"j < n" 
       using is_swap_def by blast
     define inv where "inv = mset_set {k. k < n \<and> k \<noteq> i \<and> k \<noteq> j}" (* positions not touched by the swap *)
     have b:"{0..<n} = {k. k < n \<and> k \<noteq> i \<and> k \<noteq> j} \<union> {i,j}"
       apply (rule order_antisym, rule subsetI, simp, blast, rule subsetI, simp)
       using i_bound j_bound by meson
     have c:"\<And>k. k \<in># inv \<Longrightarrow> (x f) k = f k" 
       by (simp add:x_def inv_def)
     have "image_mset (x f) inv = image_mset f inv"
       apply (rule multiset_eqI)
       using c multiset.map_cong0 by force
     moreover have "image_mset (x f) (mset_set {i,j}) = image_mset f (mset_set {i,j})"
       apply (cases "i = j")
       by (simp add:x_def max_def min_def)+
     moreover have "mset_set {0..<n} = inv + mset_set {i,j}"
       by (simp only:inv_def b, rule mset_set_Union, simp, simp, simp) 
     ultimately show "image_mset (x f) (mset_set {0..<n}) = image_mset f (mset_set {0..<n})"
       by simp
   qed
 
   have "(\<forall>x \<in> set t. is_swap x) \<Longrightarrow> image_mset (fold id t f) (mset [0..<n]) = image_mset f (mset [0..<n])" (* lift a to any list of compare-swaps *)
     by (induction t arbitrary:f, simp, simp add:a) 
   moreover have "\<And>x. x \<in> set t \<Longrightarrow> is_swap x" 
     apply (simp add:t_def is_swap_def) 
     by (meson atLeastLessThan_iff imageE less_imp_le less_le_trans)  
   ultimately have "image_mset (fold id t f) (mset [0..<n]) = image_mset f (mset [0..<n])" by blast
   then show ?thesis by (simp add:t_def)
 qed
 
 lemma list_eq_iff: (* two sorted lists with the same multiset of elements are equal *)
   assumes "mset xs = mset ys"
   assumes "sorted xs"
   assumes "sorted ys"
   shows "xs = ys" 
   using assms properties_for_sort by blast
 
 lemma sort_map_eq_sort: (* on the first n positions, sort_map agrees with the library sort *)
   fixes f :: "nat \<Rightarrow> ('b :: linorder)"
   shows "map (sort_map f n) [0..<n] = sort (map f [0..<n])" (is "?A = ?B")
 proof -
   have "mset ?A = mset ?B" (* same elements, by sort_map_perm *)
     using sort_map_perm[where f="f" and n="n"]
     by (simp del:sort_map.simps)
   moreover have "sorted ?B"
     by simp
   moreover have "sorted ?A" (* ordered, by sort_map_mono *)
     apply (subst sorted_wrt_iff_nth_less)
     apply (simp del:sort_map.simps)
     by (metis sort_map_mono nat_less_le)
   ultimately show "?A = ?B" 
     using list_eq_iff by blast
 qed
 
 lemma order_statistics_measurable_aux: (* each of the first n outputs of sort_map, applied pointwise to measurable X i, is measurable *)
   fixes X :: "nat \<Rightarrow> 'a \<Rightarrow> ('b :: {linorder_topology, second_countable_topology})"
   assumes "n \<ge> 1" 
   assumes "j < n"
   assumes "\<And>i. i < n \<Longrightarrow> X i \<in> measurable M borel"
   shows "(\<lambda>x. (sort_map (\<lambda>i. X i x) n) j) \<in> measurable M borel"
 proof -
   have n_ge_0:"n > 0" using assms by simp
   define is_swap where "is_swap = (\<lambda>(ts :: ((nat \<Rightarrow> 'b) \<Rightarrow> nat \<Rightarrow> 'b)). \<exists>i < n. \<exists>j < n. ts = sort_primitive i j)" (* compare-swaps on positions below n *)
   define t :: "((nat \<Rightarrow> 'b) \<Rightarrow> nat \<Rightarrow> 'b) list" 
     where "t = [sort_primitive j i. i <- [0..<n], j <- [0..<i]]"
 
   define meas_ptw :: "(nat \<Rightarrow> 'a \<Rightarrow> 'b) \<Rightarrow> bool"
     where "meas_ptw = (\<lambda>f. (\<forall>k. k < n \<longrightarrow> f k \<in> borel_measurable M))" (* the first n components are measurable *)
 
   have ind_step: (* a single compare-swap preserves meas_ptw, because min and max are measurable *)
     "\<And>x (g :: nat \<Rightarrow> 'a \<Rightarrow> 'b). meas_ptw g \<Longrightarrow> is_swap x \<Longrightarrow> meas_ptw (\<lambda>k \<omega>. x (\<lambda>i. g i \<omega>) k)"
   proof -
     fix x g
     assume "meas_ptw g"
     hence a:"\<And>k. k < n \<Longrightarrow> g k \<in> borel_measurable M" by (simp add:meas_ptw_def)
     assume "is_swap x"
     then obtain i j where x_def:"x=sort_primitive i j" and i_le:"i < n" and j_le:"j < n"
       by (simp add:is_swap_def, blast)
     have "\<And>k. k < n \<Longrightarrow> (\<lambda>\<omega>. x (\<lambda>i. g i \<omega>) k) \<in> borel_measurable M"
     proof -
       fix k
       assume "k < n"
       thus " (\<lambda>\<omega>. x (\<lambda>i. g i \<omega>) k) \<in> borel_measurable M"
         apply (simp add:x_def)
         apply (cases "k = i", simp)
         using a i_le j_le borel_measurable_min apply blast
         apply (cases "k = j", simp)
         using a i_le j_le borel_measurable_max apply blast
         using a by simp
     qed
     thus "meas_ptw (\<lambda>k \<omega>. x (\<lambda>i. g i \<omega>) k)" 
       by (simp add:meas_ptw_def)
   qed
 
   have "(\<forall>x \<in> set t. is_swap x) \<Longrightarrow> meas_ptw (\<lambda> k \<omega>. (fold id t (\<lambda>k. X k \<omega>)) k)" (* lift ind_step to the whole list by reverse induction *)
   proof (induction t rule:rev_induct)
     case Nil
     then show ?case using assms by (simp add:meas_ptw_def)
   next
     case (snoc x xs)
     have a:"meas_ptw (\<lambda>k \<omega>. fold (\<lambda>a. a) xs (\<lambda>k. X k \<omega>) k)" using snoc by simp
     have b:"is_swap x" using snoc by simp
     show ?case using ind_step[OF a b] by simp
   qed
   moreover have "\<And>x. x \<in> set t \<Longrightarrow> is_swap x" 
     apply (simp add:t_def is_swap_def) 
     by (meson atLeastLessThan_iff imageE less_imp_le less_le_trans)  
   ultimately show ?thesis using assms
     by (simp add:t_def[symmetric] meas_ptw_def)
 qed
 
 text \<open>Main results of this section:\<close>
 
 lemma order_statistics_measurable: (* the j-th smallest of n measurable random variables is measurable *)
   fixes X :: "nat \<Rightarrow> 'a \<Rightarrow> ('b :: {linorder_topology, second_countable_topology})"
   assumes "n \<ge> 1" 
   assumes "j < n"
   assumes "\<And>i. i < n \<Longrightarrow> X i \<in> measurable M borel"
   shows "(\<lambda>x. (sort (map (\<lambda>i. X i x) [0..<n])) ! j) \<in> measurable M borel"
   apply (subst sort_map_eq_sort[symmetric]) (* replace sort by sort_map, then use the auxiliary lemma *)
   using assms by (simp add:order_statistics_measurable_aux del:sort_map.simps)
 
 definition median :: "nat \<Rightarrow> (nat \<Rightarrow> ('a :: linorder)) \<Rightarrow> 'a" where (* element at index n div 2 of the sorted list f 0, ..., f (n-1) *)
   "median n f = sort (map f [0..<n]) ! (n div 2)"
 
 lemma median_measurable: (* the median of n >= 1 measurable random variables is measurable *)
   fixes X :: "nat \<Rightarrow> 'a \<Rightarrow> ('b :: {linorder_topology, second_countable_topology})"
   assumes "n \<ge> 1" 
   assumes "\<And>i. i < n \<Longrightarrow> X i \<in> measurable M borel"
   shows "(\<lambda>x. median n (\<lambda>i. X i x)) \<in> measurable M borel"
   apply (simp add:median_def)
   apply (rule order_statistics_measurable[OF assms(1) _ assms(2)]) (* instance with j = n div 2 *)
   using assms(1) by force+
 
 section \<open>The Median Method\<close>
 
 text \<open>This section contains the proof that the median of independent random
 variables will be in an interval with high probability if the individual variables are in the
 same interval with probability larger than $\frac{1}{2}$.
 
 The proof starts with the elementary observation that the median of a sequence with $n$ elements
 is in an interval $I$ if more than half of them are in $I$. This works because after sorting the
 sequence the elements that will be in the interval must necessarily form a consecutive subsequence;
 if its length is larger than $\frac{n}{2}$, the median must be in it.
 
 The remainder follows the proof in \<^cite>\<open>\<open>\textsection 2.1\<close> in "alon1999"\<close> using the Hoeffding inequality
 to estimate the probability that at least half of the sequence elements will be in the interval $I$.\<close>
 
 lemma interval_rule: (* rule form of interval_def: a point between two members of an interval is a member *)
   assumes "interval I"
   assumes "a \<le> x" "x \<le> b"
   assumes "a \<in> I"
   assumes "b \<in> I"
   shows "x \<in> I"
   using assms(1) apply (simp add:interval_def)
   using assms by blast
 
 lemma sorted_int: (* in a sorted list, an entry whose index lies between two entries in the interval is itself in the interval *)
   assumes "interval I"
   assumes "sorted xs"
   assumes "k < length xs" "i \<le> j" "j \<le> k "
   assumes "xs ! i \<in> I" "xs ! k \<in> I"
   shows "xs ! j \<in> I"
   apply (rule interval_rule[where a="xs ! i" and b="xs ! k"])
   using assms by (simp add: sorted_nth_mono)+
 
 lemma mid_in_interval: (* if more than half of the elements of a sorted list lie in an interval I, so does the element at index length xs div 2 *)
   assumes "2*length (filter (\<lambda>x. x \<in> I) xs) > length xs"
   assumes "interval I"
   assumes "sorted xs"
   shows "xs ! (length xs div 2) \<in> I"
 proof -
   have "length (filter (\<lambda>x. x \<in> I) xs) > 0"  using assms(1) by linarith
   then obtain v where v_1: "v < length xs" and v_2: "xs ! v \<in> I" (* v: index of some element in I *)
     by (metis filter_False in_set_conv_nth length_greater_0_conv)
 
   define J where "J = {k. k < length xs \<and> xs ! k \<in> I}" (* J: indices of the elements in I *)
 
   have card_J_min: "2*card J > length xs"
     using assms(1) by (simp add:J_def length_filter_conv_card)
 
   consider
     (a) "xs ! (length xs div 2) \<in> I" |
     (b) "xs ! (length xs div 2) \<notin> I \<and> v > (length xs div 2)" |
     (c) "xs ! (length xs div 2) \<notin> I \<and> v < (length xs div 2)"
     by (metis linorder_cases v_2)
   thus ?thesis
   proof (cases)
     case a
     then show ?thesis by simp
   next
     case b (* witness above the middle: no index up to the middle is in J, so J is too small *)
     have p:"\<And>k. k \<le> length xs div 2 \<Longrightarrow> xs ! k \<notin> I"
       using b v_2 sorted_int[OF assms(2) assms(3) v_1, where j="length xs div 2"] apply simp by blast
     have "card J \<le> card {Suc (length xs div 2)..<length xs}"
       apply (rule card_mono, simp)
       apply (rule subsetI, simp add:J_def not_less_eq_eq[symmetric])
       using p by metis
     hence "card J \<le> length xs - (Suc (length xs div 2))"
       using card_atLeastLessThan by metis
     hence "length xs \<le> 2*( length xs - (Suc (length xs div 2)))"
       using card_J_min by linarith
     hence "False"
       apply (simp add:nat_distrib)
       apply (subst (asm) le_diff_conv2) using b v_1 apply linarith
       by simp
     then show ?thesis by simp
   next
     case c (* witness below the middle: no index from the middle on is in J, so J is too small *)
     have p:"\<And>k. k \<ge> length xs div 2 \<Longrightarrow> k < length xs \<Longrightarrow> xs ! k \<notin> I"
       using c v_1 v_2 sorted_int[OF assms(2) assms(3), where i ="v" and j="length xs div 2"] apply simp by blast
     have "card J \<le> card {0..<(length xs div 2)}"
       apply (rule card_mono, simp)
       apply (rule subsetI, simp add:J_def not_less_eq_eq[symmetric])
       using p linorder_le_less_linear by blast
     hence "card J \<le> (length xs div 2)"
       using card_atLeastLessThan by simp
     then show ?thesis using card_J_min by linarith
   qed
 qed
 
 lemma median_est: (* if more than half of f 0, ..., f (n-1) lie in an interval I, then so does their median *)
   assumes "interval I"
   assumes "2*card {k. k < n \<and> f k \<in> I} > n"
   shows "median n f \<in> I"
 proof -
   have a:"{k. k < n \<and> f k \<in> I} = {i. i < n \<and> map f [0..<n] ! i \<in> I}" (* a: restate the index set in terms of the list map f [0..<n] *)
     apply (rule order_antisym, rule subsetI, simp)
     by (rule subsetI, simp, metis add_0 diff_zero nth_map_upt)
 
   show ?thesis
     apply (simp add:median_def)
     apply (rule mid_in_interval[where I="I" and xs="sort (map f [0..<n])", simplified])
      using assms a apply (simp add:filter_sort comp_def length_filter_conv_card)
     by (simp add:assms)
 qed
 
 lemma prod_pmf_bernoulli_mono: (* raising the success probabilities of independent Bernoulli variables from f to g does not decrease the probability of a set A closed under coordinate-wise increase on I *)
   assumes "finite I"
   assumes "\<And>i. i \<in> I \<Longrightarrow> 0 \<le> f i \<and> f i \<le> g i \<and> g i \<le> 1"
   assumes "\<And>x y. x \<in> A \<Longrightarrow> (\<forall>i \<in> I. x i \<le> y i) \<Longrightarrow> y \<in> A"
   shows "measure (Pi_pmf I d (bernoulli_pmf \<circ> f)) A \<le> measure (Pi_pmf I d (bernoulli_pmf \<circ> g)) A"
     (is "?L \<le> ?R")
 proof -
   define q where "q i = pmf_of_list [(0::nat, f i), (1, g i - f i), (2, 1 - g i)]" for i (* q i: three-point distribution from which both Bernoulli variables are derived *)
 
   have wf:"pmf_of_list_wf [(0::nat, f i), (1, g i - f i), (2, 1 - g i)]" if "i \<in> I" for i
     using assms(2)[OF that] by (intro pmf_of_list_wfI) auto
 
   have 0: "bernoulli_pmf (f i) = map_pmf (\<lambda>x. x = 0) (q i)" (is "?L1 = ?R1") 
     if "i \<in> I" for i
   proof -
     have "0 \<le> f i" "f i \<le> 1" using assms(2)[OF that] by auto
     hence "pmf ?L1 x = pmf ?R1 x" for x
       unfolding q_def pmf_map measure_pmf_of_list[OF wf[OF that]] 
       by (cases x;simp_all add:vimage_def)
     thus ?thesis
       by (intro pmf_eqI) auto
   qed
 
   have 1: "bernoulli_pmf (g i) = map_pmf (\<lambda>x. x \<in> {0,1}) (q i)" (is "?L1 = ?R1")
     if "i \<in> I" for i
   proof -
     have "0 \<le> g i" "g i \<le> 1" using assms(2)[OF that] by auto
     hence "pmf ?L1 x = pmf ?R1 x" for x
       unfolding q_def pmf_map measure_pmf_of_list[OF wf[OF that]] 
       by (cases x;simp_all add:vimage_def)
     thus ?thesis
       by (intro pmf_eqI) auto
   qed
 
   have 2: "(\<lambda>k. x k = 0) \<in> A \<Longrightarrow> (\<lambda>k. x k = 0 \<or> x k = Suc 0) \<in> A" for x (* 2: the event for f implies the event for g, by assumption 3 *)
     by (erule assms(3)) auto
 
   have "?L = measure (Pi_pmf I d (\<lambda>i. map_pmf (\<lambda>x. x = 0) (q i))) A"
     unfolding comp_def by (simp add:0 cong: Pi_pmf_cong)
   also have "... = measure (map_pmf ((\<circ>) (\<lambda>x. x = 0)) (Pi_pmf I (if d then 0 else 2) q)) A"
     by (intro arg_cong2[where f="measure_pmf.prob"] Pi_pmf_map[OF assms(1)]) auto 
   also have "... = measure (Pi_pmf I (if d then 0 else 2) q) {x. (\<lambda>k. x k = 0) \<in> A}"
     by (simp add:comp_def vimage_def)
   also have "... \<le> measure (Pi_pmf I (if d then 0 else 2) q) {x. (\<lambda>k. x k \<in> {0,1}) \<in> A}" (* the only inequality: event inclusion from 2 *)
     using 2 by (intro measure_pmf.finite_measure_mono subsetI) auto 
   also have "... = measure (map_pmf ((\<circ>) (\<lambda>x. x \<in> {0,1})) (Pi_pmf I (if d then 0 else 2) q)) A"
     by (simp add:vimage_def comp_def)
   also have "... = measure (Pi_pmf I d (\<lambda>i. map_pmf (\<lambda>x. x \<in> {0,1}) (q i))) A"
     by (intro arg_cong2[where f="measure_pmf.prob"] Pi_pmf_map[OF assms(1), symmetric]) auto
   also have "... = ?R" 
     unfolding comp_def by (simp add:1 cong: Pi_pmf_cong)
   finally show ?thesis by simp
 qed
 
 (* Equality criterion for measures on a discrete space: two measures M and N whose
    measurable sets are those of count_space UNIV are equal if they are almost surely
    concentrated on a countable set \<Omega> and agree, with finite value, on every singleton
    {x} with x in \<Omega>.
    The proof instantiates measure_eqI_restrict_generator with the generator E consisting
    of the empty set and the singletons of \<Omega>. *)
 lemma discrete_measure_eqI:
   assumes "sets M = count_space UNIV"
   assumes "sets N = count_space UNIV" 
   assumes "countable \<Omega>"
   assumes "\<And>x. x \<in> \<Omega> \<Longrightarrow> emeasure M {x} = emeasure N {x} \<and> emeasure M {x} \<noteq> \<infinity>"
   assumes "AE x in M. x \<in> \<Omega>"
   assumes "AE x in N. x \<in> \<Omega>"
   shows "M = N"
 proof -
   define E where "E = insert {} ((\<lambda>x. {x}) ` \<Omega>)"
 
   (* Facts 0 and 1 are passed positionally to the generator rule in the last step. *)
   have 0: "Int_stable E" unfolding E_def by (intro Int_stableI) auto
   have 1: "countable E" using assms(3) unfolding E_def by simp
 
   (* The remaining premises of the generator rule are collected with moreover and handed
      to the final step via ultimately. *)
   have "emeasure M A = emeasure N A" if "A \<in> E" for A
     using that assms(4) unfolding E_def by auto
   moreover have "sets M = sets N" using assms(1,2) by simp
   moreover have "\<Omega> \<in> sets M" using assms(1) by simp
   moreover have "E \<noteq> {}" unfolding E_def by simp
   moreover have "\<Union>E = \<Omega>" unfolding E_def by simp
   moreover have "emeasure M a \<noteq> \<infinity>" if "a \<in> E" for a
     using that assms(4) unfolding E_def by auto
   moreover have "sets (restrict_space M \<Omega>) = Pow \<Omega>"
     using assms(1) by (simp add:sets_restrict_space range_inter)
   moreover have "sets (restrict_space N \<Omega>) = Pow \<Omega>"
     using assms(2) by (simp add:sets_restrict_space range_inter)
   moreover have "sigma_sets \<Omega> E = Pow \<Omega>"
     unfolding E_def by (intro sigma_sets_singletons_and_empty assms(3)) 
   ultimately show ?thesis
     by (intro measure_eqI_restrict_generator[OF 0 _ _ _ _ _ _ assms(5,6) 1]) auto
 qed
 
 text \<open>Main results of this section:\<close>
 
 text \<open>The next theorem establishes a bound for the probability of the median of independent random
 variables using the binomial distribution. In a follow-up step, we will establish tail bounds
 for the binomial distribution and corresponding median bounds.
 
 This two-step strategy was suggested by Yong Kiam Tan. In a previous version, I had only verified 
 the exponential tail bound (see theorem \verb+median_bound+ below).\<close>
 
 (* Raw median bound. Let X 0, ..., X (n-1) be independent random variables, each lying in
    the interval I with probability at least p. Then the probability that their median lies
    in I is at least 1 minus the probability that a binomial_pmf n p sample is at most
    n div 2.
    Proof outline:
    - facts m0-m6 establish the measurability needed below;
    - fact 2 shows that the vector of indicators "X k \<omega> \<in> I" is distributed as the product
      of Bernoulli distributions with parameters q k;
    - prod_pmf_bernoulli_mono (with facts 3 and 4) compares this product with the one where
      every parameter equals p, which is rewritten via binomial_pmf_altdef';
    - median_est is used in the last step to pass from the event "more than half of the
      X k lie in I" to the event "the median lies in I". *)
 theorem (in prob_space) median_bound_raw:
   fixes I :: "('b :: {linorder_topology, second_countable_topology}) set"
   assumes "n > 0" "p \<ge> 0"
   assumes "interval I"
   assumes "indep_vars (\<lambda>_. borel) X {0..<n}"
   assumes "\<And>i. i < n \<Longrightarrow> \<P>(\<omega> in M. X i \<omega> \<in> I) \<ge> p" 
   shows "\<P>(\<omega> in M. median n (\<lambda>i. X i \<omega>) \<in> I) \<ge> 1 - measure (binomial_pmf n p) {..n div 2}" 
     (is "?L \<ge> ?R")
 proof -
   let ?pi = "Pi_pmf {..<n} undefined"
   (* q i is the probability that X i lies in I. *)
   define q where "q i = \<P>(\<omega> in M. X i \<omega> \<in> I)" for i
 
   have n_ge_1: "n \<ge> 1" using assms(1) by simp
 
   (* Set identity used as a rewrite rule when simplifying the distr expression below. *)
   have 0: "{k. k < n \<and> (k < n \<longrightarrow> X k \<omega> \<in> I)} = {k. k < n \<and> X k \<omega> \<in> I}" for \<omega>
     by auto
 
   (* The extensional boolean functions on {..<n} form a countable set. *)
   have "countable ({..<n} \<rightarrow>\<^sub>E (UNIV ::  bool set))"
     by (intro countable_PiE) auto
   hence countable_ext: "countable (extensional {..<n} :: (nat \<Rightarrow> bool) set)"
     unfolding PiE_def by auto
 
   (* Measurability facts m0-m6. *)
   have m0: "I \<in> sets borel"
     using interval_borel[OF assms(3)] by simp
 
   have m1: "random_variable borel (\<lambda>x. X k x)" if "k \<in> {..<n}" for k 
     using assms(4) that unfolding indep_vars_def by auto
 
   have m2: "(\<lambda>x. x \<in> I) \<in> borel \<rightarrow>\<^sub>M (measure_pmf ((bernoulli_pmf \<circ> q) k))"  
     for k using m0 by measurable
   hence m3: "random_variable (measure_pmf ((bernoulli_pmf \<circ> q) k)) (\<lambda>x. X k x \<in> I)"
     if "k \<in> {..<n}" for k 
     by (intro measurable_compose[OF m1] that)
 
   hence m4: "random_variable (PiM {..<n} (bernoulli_pmf \<circ> q)) (\<lambda>\<omega>. \<lambda>k\<in>{..<n}. X k \<omega> \<in> I)" 
     by (intro measurable_restrict) auto
   (* Every set of extensional functions is measurable in the product space, because it is
      a countable union of singletons, each of which is a product of singletons. *)
   moreover have "A \<in> sets (Pi\<^sub>M {..<n} (\<lambda>x. measure_pmf (bernoulli_pmf (q x))))"
     if "A \<subseteq> extensional {..<n}" for A 
   proof -
     have "A = (\<Union>a \<in> A. {a})" by auto
     also have "... = (\<Union>a \<in> A. PiE {..<n} (\<lambda>k. {a k}))"
       using that by (intro arg_cong[where f="Union"] image_cong refl PiE_singleton[symmetric]) auto
     also have "... \<in> sets (Pi\<^sub>M {..<n} (\<lambda>x. measure_pmf (bernoulli_pmf (q x))))"
       using that countable_ext countable_subset
       by (intro sets.countable_Union countable_image image_subsetI sets_PiM_I_finite) auto
     finally show ?thesis by simp
   qed
   hence m5: "id \<in> (PiM {..<n} (bernoulli_pmf \<circ> q)) \<rightarrow>\<^sub>M (count_space UNIV)"
     by (intro measurableI) (simp_all add:vimage_def space_PiM PiE_def)
   ultimately have "random_variable (count_space UNIV) (id \<circ> (\<lambda>\<omega>. \<lambda>k\<in>{..<n}. X k \<omega> \<in> I))"
     by (rule measurable_comp)
   hence m6: "random_variable (count_space UNIV) (\<lambda>\<omega>. \<lambda>k\<in>{..<n}. X k \<omega> \<in> I)" by simp
 
   (* The indicator variables inherit independence from the X i. *)
   have indep: "indep_vars (bernoulli_pmf \<circ> q) (\<lambda>i x. X i x \<in> I) {0..<n}" 
     by (intro indep_vars_compose2[OF assms(4)] m2)
 
   (* Each indicator takes the value \<omega> with the probability bernoulli_pmf (q k) assigns to \<omega>. *)
   have "measure M {x \<in> space M. (X k x \<in> I) = \<omega>} = measure (bernoulli_pmf (q k)) {\<omega>}"
     if "k < n" for \<omega> k
   proof (cases "\<omega>")
     case True
     then show ?thesis unfolding q_def  by (simp add:measure_pmf_single)
   next
     case False
     have "{x \<in> space M. X k x \<in> I} \<in> events"
       using that m0 by (intro measurable_sets_Collect[OF m1]) auto
     hence "prob {x \<in> space M. X k x \<notin> I} = 1 - prob {\<omega> \<in> space M. X k \<omega> \<in> I}" 
       by (subst prob_neg) auto
     thus ?thesis using False unfolding q_def by (simp add:measure_pmf_single)
   qed
 
   (* Fact 1: the same statement for emeasure. *)
   hence 1: "emeasure M {x \<in> space M. (X k x \<in> I) = \<omega>} = emeasure (bernoulli_pmf (q k)) {\<omega>}"
     if "k < n" for \<omega> k
     using that unfolding emeasure_eq_measure measure_pmf.emeasure_eq_measure by simp
 
   interpret product_sigma_finite "(bernoulli_pmf \<circ> q)"
     by standard
 
   (* Fact 2 (derived in four steps): the distribution of the indicator vector on
      count_space UNIV equals the product pmf of the bernoulli_pmf (q k). *)
   have "distr M (count_space UNIV) (\<lambda>\<omega>. (\<lambda>k\<in>{..<n} . X k \<omega> \<in> I)) = distr 
     (distr M (PiM {..<n} (bernoulli_pmf \<circ> q)) (\<lambda>\<omega>. \<lambda>k\<in>{..<n}. X k \<omega> \<in> I)) (count_space UNIV) id"
     by (subst distr_distr[OF m5 m4]) (simp add:comp_def) 
   also have "... = distr (PiM {..<n} (\<lambda>i. (distr M ((bernoulli_pmf \<circ> q) i) (\<lambda>\<omega>. X i \<omega> \<in> I) )))
     (count_space UNIV) id" 
     using assms(1) indep atLeast0LessThan by (intro arg_cong2[where f="\<lambda>x y. distr x y id"] 
         iffD1[OF indep_vars_iff_distr_eq_PiM'] m3) auto 
   also have "... = distr (PiM {..<n} (bernoulli_pmf \<circ> q)) (count_space UNIV) id"
     using m3 1 by (intro distr_cong PiM_cong refl discrete_measure_eqI[where \<Omega>="UNIV"])
         (simp_all add:emeasure_distr vimage_def Int_def conj_commute)
   also have "... = ?pi (bernoulli_pmf \<circ> q)"
   (* Both sides are compared on singletons of extensional functions; the six cases are the
      six premises of discrete_measure_eqI in order. *)
   proof (rule discrete_measure_eqI[where \<Omega>="extensional {..<n}"], goal_cases)
     case 1 show ?case by simp
   next
     case 2 show ?case by simp
   next
     case 3 show ?case using countable_ext by simp
   next
     case (4 x)
     have "emeasure (Pi\<^sub>M {..<n} (bernoulli_pmf \<circ> q)) {x} = 
       emeasure (Pi\<^sub>M {..<n} (bernoulli_pmf \<circ> q)) (PiE {..<n} (\<lambda>k. {x k}))"
       using PiE_singleton[OF 4] by simp
     also have "... = (\<Prod>i<n. emeasure (measure_pmf (bernoulli_pmf (q i))) {x i})"
       by (subst emeasure_PiM) auto
     also have "... = emeasure (Pi_pmf {..<n} undefined (bernoulli_pmf\<circ>q)) 
       (PiE_dflt {..<n} undefined (\<lambda>k. {x k}))"
       unfolding measure_pmf.emeasure_eq_measure
       by (subst measure_Pi_pmf_PiE_dflt) (simp_all add:prod_ennreal)
     also have "... = emeasure (Pi_pmf {..<n} undefined (bernoulli_pmf\<circ>q)) {x}"
       using 4 by (intro arg_cong2[where f="emeasure"]) (auto simp add:PiE_dflt_def extensional_def)
     finally have "emeasure (Pi\<^sub>M {..<n} (bernoulli_pmf \<circ> q)) {x} = 
       emeasure (Pi_pmf {..<n} undefined (bernoulli_pmf \<circ> q)) {x}"
       by simp
     thus ?case using 4 
       by (subst (1 2) emeasure_distr[OF m5]) (simp_all add:vimage_def space_PiM PiE_def)
   next
     case 5
     have "AE x in Pi\<^sub>M {..<n} (bernoulli_pmf \<circ> q). x \<in> extensional {..<n}"
       by (intro AE_I2) (simp add:space_PiM PiE_def)
     then show ?case by (subst AE_distr_iff[OF m5]) simp_all
   next
     case 6
     then show ?case by (intro AE_pmfI) (simp add: set_Pi_pmf PiE_dflt_def extensional_def)
   qed
   finally have 2: "distr M (count_space UNIV) (\<lambda>\<omega>. (\<lambda>k\<in>{..<n}. X k \<omega> \<in> I)) = ?pi (bernoulli_pmf\<circ>q)"
     by simp
 
   (* Fact 3: the event "more than half of the entries are true" is monotone. *)
   have 3: "n < 2 * card {k. k < n \<and> y k}" if 
     "n < 2 * card {k. k < n \<and> x k}" "\<And>i. i < n \<Longrightarrow> x i \<Longrightarrow> y i" for x y
   proof -
     have "2 * card {k. k < n \<and> x k} \<le> 2 * card {k. k < n \<and> y k}"
       using that(2) by (intro mult_left_mono card_mono) auto
     thus ?thesis using that(1) by simp
   qed
 
   (* Fact 4: parameter bounds required by prod_pmf_bernoulli_mono. *)
   have 4: "0 \<le> p \<and> p \<le> q i \<and> q i \<le> 1" if "i < n" for i
     unfolding q_def using assms(2,5) that by auto
 
   (* Instantiating fact 4 at i = 0, which is possible because n > 0. *)
   have p_range: "p \<in> {0..1}"
     using 4[OF assms(1)] by auto
 
   (* Main calculation from ?R to ?L. *)
   have "?R = 1 - measure_pmf.prob (binomial_pmf n p) {k. 2 * k \<le> n}"
     by (intro arg_cong2[where f="(-)"] arg_cong2[where f="measure_pmf.prob"]) auto
   also have "... = measure (binomial_pmf n p) {k. n < 2 * k}"
     by (subst measure_pmf.prob_compl[symmetric]) (simp_all add:set_diff_eq not_le)
   also have "... = measure (?pi (bernoulli_pmf \<circ> (\<lambda>_. p))) {\<omega>. n < 2 * card {k. k < n \<and> \<omega> k}}"
     using p_range by (subst binomial_pmf_altdef'[where A="{..<n}" and dflt="undefined"]) auto
   also have "... \<le> measure (?pi (bernoulli_pmf \<circ> q)) {\<omega>. n < 2 * card {k. k < n \<and> \<omega> k}}"
     using 3 4 by (intro prod_pmf_bernoulli_mono) auto
   also have "... = 
     \<P>(\<omega> in distr M (count_space UNIV) (\<lambda>\<omega>. \<lambda>k\<in>{..<n}. X k \<omega> \<in> I). n<2*card {k. k < n \<and> \<omega> k})"
     unfolding 2 by simp
   also have "... = \<P>(\<omega> in M. n < 2*card {k. k < n \<and> X k \<omega> \<in> I})" 
     by (subst measure_distr[OF m6]) (simp_all add:vimage_def Int_def conj_commute 0)
   also have "... \<le> ?L"
     using median_est[OF assms(3)] m0 m1
     by (intro finite_measure_mono measurable_sets_Collect[OF median_measurable[OF n_ge_1]]) auto 
   finally show "?R \<le> ?L" by simp
 qed
 
 text \<open>Cumulative distribution of the binomial distribution (contributed by Yong Kiam Tan):\<close>
 
 (* For p in [0,1], the probability that a binomial_pmf n p sample is at most m equals the
    sum of the terms (n choose i) * p^i * (1 - p)^(n - i) for i from 0 to m. *)
 lemma prob_binomial_pmf_upto:
   assumes "0 \<le> p" "p \<le> 1"
   shows "measure_pmf.prob (binomial_pmf n p) {..m} =
     sum (\<lambda>i. real (n choose i) * p^i * (1 - p) ^(n-i)) {0..m}"
   by (auto simp: pmf_binomial[OF assms] measure_measure_pmf_finite intro!: sum.cong)
 
 text \<open>A tail bound for the binomial distribution using Hoeffding's inequality:\<close>
 
 (* Lower tail bound for the binomial distribution: for p in [0,1] and k <= n * p, the
    probability that a binomial_pmf n p sample is at most k is bounded by
    exp (- 2 * n * (p - k / n)^2).
    The case n = 0 is handled separately; otherwise the binomial distribution is expressed
    through a product of n Bernoulli distributions and the Hoeffding_ineq locale is
    interpreted for the indicator variables with bounds 0 and 1. *)
 lemma binomial_pmf_tail:
   assumes "p \<in> {0..1}" "real k \<le> real n * p"
   shows "measure (binomial_pmf n p) {..k} \<le> exp (- 2 * real n * (p - real k / n)^2)" 
     (is "?L \<le> ?R")
 proof (cases "n = 0")
   case True then show ?thesis by simp
 next
   case False
   let ?A = "{..<n}"
   let ?pi = "Pi_pmf ?A undefined (\<lambda>_. bernoulli_pmf p)"
 
   (* \<mu> is the sum of the expectations of the n indicator variables; \<epsilon> is its distance to k. *)
   define \<mu> where "\<mu> = (\<Sum>i<n. (\<integral>x. (of_bool (x i) :: real) \<partial> ?pi))"
   define \<epsilon> :: real where "\<epsilon> = \<mu> - k" (* eps \<ge> 0 <-> k \<le> mu *)
 
   (* Closed form of \<mu>. *)
   have "\<mu> = (\<Sum>i<n. (\<integral>x. (of_bool x :: real) \<partial> (map_pmf (\<lambda>\<omega>. \<omega> i) ?pi)))"
     unfolding \<mu>_def by simp
   also have "... = (\<Sum>i<n. (\<integral>x. (of_bool x :: real) \<partial> (bernoulli_pmf p)))"
     by (simp add: Pi_pmf_component)
   also have "... = real n * p" using assms(1) by simp
   finally have \<mu>_alt: "\<mu> = real n * p"
     by simp
 
   have \<epsilon>_ge_0: "\<epsilon> \<ge> 0"
     using assms(2) unfolding \<epsilon>_def \<mu>_alt by auto
 
   (* The indicator variables are independent under the product measure. *)
   have indep: "prob_space.indep_vars ?pi (\<lambda>_. borel) (\<lambda>k \<omega>. of_bool (\<omega> k)) {..<n}"
     by (intro prob_space.indep_vars_compose2[OF prob_space_measure_pmf indep_vars_Pi_pmf]) auto
   interpret Hoeffding_ineq "?pi" "{..<n}" "\<lambda>k \<omega>. of_bool (\<omega> k)" "\<lambda>_.0" "\<lambda>_.1" \<mu>
     using indep unfolding \<mu>_def by (unfold_locales) simp_all  
   
   (* Express ?L as the probability that the indicator sum is at most \<mu> - \<epsilon>, apply
      Hoeffding_ineq_le and simplify the resulting bound to ?R. *)
   have "?L = measure (map_pmf (\<lambda>f. card {x \<in> ?A. f x}) ?pi) {..k}"
     by (intro arg_cong2[where f="measure_pmf.prob"] binomial_pmf_altdef' assms(1)) auto
   also have "... = \<P>(\<omega> in ?pi. (\<Sum>i<n. of_bool (\<omega> i)) \<le> \<mu> - \<epsilon>)"
     unfolding \<epsilon>_def by (simp add:vimage_def Int_def)
   also have "... \<le> exp (- 2 * \<epsilon>\<^sup>2 / (\<Sum>i<n. (1 - 0)\<^sup>2))"
     using False by (intro Hoeffding_ineq_le \<epsilon>_ge_0) auto
   also have "... = ?R"
     unfolding \<epsilon>_def \<mu>_alt by (simp add:power2_eq_square field_simps) 
   finally show ?thesis by simp
 qed
 
 (* Exponential median bound. If X 0, ..., X (n-1) are independent, each lies in the
    interval I with probability at least 1/2 + \<alpha> for some \<alpha> > 0, and
    n >= - ln \<epsilon> / (2 * \<alpha>^2) for some \<epsilon> in (0,1), then the median lies in I with
    probability at least 1 - \<epsilon>.
    The proof chains binomial_pmf_tail (at k = n div 2 and p = 1/2 + \<alpha>) with
    median_bound_raw. *)
 theorem (in prob_space) median_bound:
   fixes n :: nat
   fixes I :: "('b :: {linorder_topology, second_countable_topology}) set"
   assumes "interval I"
   assumes "\<alpha> > 0"
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "indep_vars (\<lambda>_. borel) X {0..<n}"
   assumes "n \<ge> - ln \<epsilon> / (2 * \<alpha>\<^sup>2)"
   assumes "\<And>i. i < n \<Longrightarrow> \<P>(\<omega> in M. X i \<omega> \<in> I) \<ge> 1/2+\<alpha>" 
   shows "\<P>(\<omega> in M. median n (\<lambda>i. X i \<omega>) \<in> I) \<ge> 1-\<epsilon>"
 proof -
   (* The lower bound on n is strictly positive, hence n itself is positive. *)
   have "0 < -ln \<epsilon> / (2 * \<alpha>\<^sup>2)"  
     using assms by (intro divide_pos_pos) auto
   also have "... \<le> real n" using assms by simp
   finally have "real n > 0" by simp
   hence n_ge_0:"n > 0" by simp
 
   have d0: "real_of_int \<lfloor>real n / 2\<rfloor> * 2 / real n \<le> 1"
     using n_ge_0 by simp linarith
 
   (* d1: the threshold n div 2 does not exceed the mean n * (1/2 + \<alpha>), which is the
      second premise of binomial_pmf_tail. The intermediate bound is left unnamed. *)
   hence "real (nat \<lfloor>real n / 2\<rfloor>) \<le> real n * (1 / 2)"
     using n_ge_0 by (simp add:field_simps)
   also have "... \<le> real n * (1 / 2 + \<alpha>)"
     using assms(2) by (intro mult_left_mono) auto
   finally have d1: "real (nat \<lfloor>real n / 2\<rfloor>) \<le> real n * (1 / 2 + \<alpha>)" by simp
 
   (* d2: 1/2 + \<alpha> is bounded by a probability, hence by 1. *)
   have "1/2 + \<alpha> \<le> \<P>(\<omega> in M. X 0 \<omega> \<in> I)" using n_ge_0 by (intro assms(6))
   also have "... \<le> 1" by simp
   finally have d2: "1 / 2 + \<alpha> \<le> 1" by simp
 
   have d3: "nat \<lfloor>real n / 2\<rfloor> = n div 2" by linarith
 
   (* Main calculation from 1 - \<epsilon> to the probability that the median lies in I. *)
   have "1 - \<epsilon> \<le> 1 - exp (- 2 * real n * \<alpha>\<^sup>2)" 
     using assms(2,3,5) by (intro diff_mono order.refl iffD1[OF ln_ge_iff]) (auto simp:field_simps)
   also have "... \<le> 1 - exp (- 2 * real n * ((1/2+\<alpha>) - real (nat \<lfloor>real n/2\<rfloor>) / real n)\<^sup>2)"
     using d0 n_ge_0 assms(2)
     by (intro diff_mono order.refl iffD2[OF exp_le_cancel_iff] mult_left_mono_neg power_mono) auto 
   also have "... \<le> 1 - measure (binomial_pmf n (1/2+\<alpha>)) {..nat \<lfloor>real n/2\<rfloor>}"
     using assms(2) d1 d2 by (intro diff_mono order.refl binomial_pmf_tail) auto
   also have "... = 1 - measure (binomial_pmf n (1/2+\<alpha>)) {..n div 2}" by (simp add:d3)
   also have "... \<le> \<P>(\<omega> in M. median n (\<lambda>i. X i \<omega>) \<in> I)"
     using assms(2) by (intro median_bound_raw n_ge_0 assms(1,4,6) add_nonneg_nonneg) auto
   finally show ?thesis by simp
 qed
 
 text \<open>This is a specialization of the above to closed real intervals.\<close>
 
 (* median_bound instantiated with the closed real interval {a..b}; the interval premise
    is discharged by unfolding interval_def. *)
 corollary (in prob_space) median_bound_1:
   assumes "\<alpha> > 0"
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "indep_vars (\<lambda>_. borel) X {0..<n}"
   assumes "n \<ge> - ln \<epsilon> / (2 * \<alpha>\<^sup>2)"
   assumes "\<forall>i \<in> {0..<n}. \<P>(\<omega> in M. X i \<omega> \<in> ({a..b} :: real set)) \<ge> 1/2+\<alpha>" 
   shows "\<P>(\<omega> in M. median n (\<lambda>i. X i \<omega>) \<in> {a..b}) \<ge> 1-\<epsilon>" 
   using assms(5) by (intro median_bound[OF _ assms(1,2,3,4)]) (auto simp:interval_def)
 
 text \<open>This is a specialization of the above, where $\alpha = \frac{1}{6}$ and the interval is 
 described using a mid point @{term "\<mu>"} and radius @{term "\<delta>"}. The choice of 
 $\alpha = \frac{1}{6}$ implies a success probability per random variable of $\frac{2}{3}$. It is a 
 commonly chosen success probability for Monte-Carlo algorithms 
 (cf. \<^cite>\<open>\<open>\textsection 4\<close> in "baryossef2002"\<close> or \<^cite>\<open>\<open>\textsection 1\<close> in "kane2010"\<close>).\<close>
 
 (* If each X i deviates from \<mu> by more than \<delta> with probability at most 1/3, the X i are
    independent, and n >= -18 * ln \<epsilon>, then the median deviates from \<mu> by at most \<delta> with
    probability at least 1 - \<epsilon>. Obtained from median_bound_1 with \<alpha> = 1/6 and the interval
    {\<mu> - \<delta>..\<mu> + \<delta>}. *)
 corollary (in prob_space) median_bound_2:
   fixes \<mu> \<delta> :: real
   assumes "\<epsilon> \<in> {0<..<1}"
   assumes "indep_vars (\<lambda>_. borel) X {0..<n}"
   assumes "n \<ge> -18 * ln \<epsilon>"
   assumes "\<And>i. i < n \<Longrightarrow> \<P>(\<omega> in M. abs (X i \<omega> - \<mu>) > \<delta>) \<le> 1/3" 
   shows "\<P>(\<omega> in M. abs (median n (\<lambda>i. X i \<omega>) - \<mu>) \<le> \<delta>) \<ge> 1-\<epsilon>"
 proof -
   (* b: the complement of "X i lies in the interval" is "X i deviates by more than \<delta>". *)
   have b:"\<And>i. i < n \<Longrightarrow> space M - {\<omega> \<in> space M. X i \<omega> \<in> {\<mu> - \<delta>..\<mu> + \<delta>}} =  {\<omega> \<in> space M. abs (X i \<omega> - \<mu>) > \<delta>}"
     apply (rule order_antisym, rule subsetI, simp, linarith)
     by (rule subsetI, simp, linarith)
 
   (* Translate the deviation assumption into a statement about the interval event. *)
   have "\<And>i. i < n \<Longrightarrow> 1 - \<P>(\<omega> in M. X i \<omega> \<in> {\<mu>- \<delta>..\<mu>+\<delta>}) \<le> 1/3"
     apply (subst prob_compl[symmetric])
      apply (measurable)
      using assms(2) apply (simp add:indep_vars_def)
     apply (subst b, simp)
     using assms(4) by simp
 
   (* a: each X i lies in the interval with probability at least 2/3 = 1/2 + 1/6. *)
   hence a:"\<And>i. i < n \<Longrightarrow> \<P>(\<omega> in M. X i \<omega> \<in> {\<mu>- \<delta>..\<mu>+\<delta>}) \<ge> 2/3" by simp
   
   have "1-\<epsilon> \<le> \<P>(\<omega> in M. median n (\<lambda>i. X i \<omega>) \<in> {\<mu>-\<delta>..\<mu>+\<delta>})"
     apply (rule median_bound_1[OF _ assms(1) assms(2), where \<alpha>="1/6"], simp) 
      using assms(3) apply (simp add:power2_eq_square)
     using a by simp
   (* Restate membership in the interval as a bound on the absolute deviation. *)
   also have "... = \<P>(\<omega> in M. abs (median n (\<lambda>i. X i \<omega>) - \<mu>) \<le> \<delta>)"
     apply (rule arg_cong2[where f="measure"], simp)
     apply (rule order_antisym, rule subsetI, simp, linarith)
     by (rule subsetI, simp, linarith)
   finally show ?thesis by simp
 qed
 
 section \<open>Some additional results about the median\<close>
 
 (* Mapping a monotone function over a sorted list yields a sorted list. *)
 lemma sorted_mono_map: 
   assumes "sorted xs"
   assumes "mono f"
   shows "sorted (map f xs)"
   using assms apply (simp add:sorted_wrt_map)
   apply (rule sorted_wrt_mono_rel[where P="(\<le>)"])
   by (simp add:mono_def, simp)
 
 text \<open>This could be added to @{theory "HOL.List"}:\<close>
 (* Sorting commutes with mapping a monotone function; sortedness of the right-hand side
    comes from sorted_mono_map. *)
 lemma map_sort:
   assumes "mono f"
   shows "sort (map f xs) = map f (sort xs)"
   using assms by (intro properties_for_sort sorted_mono_map) auto
 
 (* Congruence rule: median n f only depends on the values f i with i < n. *)
 lemma median_cong:
   assumes "\<And>i. i < n \<Longrightarrow> f i = g i"
   shows "median n f = median n g"
   apply (cases "n = 0", simp add:median_def)
   apply (simp add:median_def)
   apply (rule arg_cong2[where f="(!)"])
    apply (rule arg_cong[where f="sort"], rule map_cong, simp, simp add:assms)
   by simp
 
 (* Restricting the sequence to the index set {0..<n} does not change its median. *)
 lemma median_restrict: 
   "median n (\<lambda>i \<in> {0..<n}.f i) = median n f"
   by (rule median_cong, simp)
 
 (* For n > 0, a monotone function g commutes with taking the median. The proof moves g
    through sort (map_sort) and through list indexing (nth_map). *)
 lemma median_commute_mono:
   assumes "n > 0"
   assumes "mono g"
   shows "g (median n f) = median n (g \<circ> f)"
   apply (simp add: median_def del:map_map)
   apply (subst map_map[symmetric])
   apply (subst map_sort[OF assms(2)])
   apply (subst nth_map, simp) using assms apply fastforce
   by simp
 
 (* The embedding real_of_rat commutes with the median (for n > 0); an instance of
    median_commute_mono using monotonicity of real_of_rat. *)
 lemma median_rat:
   assumes "n > 0"
   shows "real_of_rat (median n f) = median n (\<lambda>i. real_of_rat (f i))"
   apply (subst (2) comp_def[where g="f", symmetric])
   apply (rule median_commute_mono[OF assms(1)])
   by (simp add: mono_def of_rat_less_eq)
 
 (* The median of a constant sequence of positive length k is that constant. *)
 lemma median_const:
   assumes "k > 0"
   shows "median k (\<lambda>i \<in> {0..<k}. a) = a"
 proof -
   (* A constant list is sorted, so sorting leaves it unchanged. *)
   have b: "sorted (map (\<lambda>_. a) [0..<k])" 
     by (subst sorted_wrt_map, simp)
   have a: "sort (map (\<lambda>_. a) [0..<k]) = map (\<lambda>_. a) [0..<k]"
     by (subst sorted_sort_id[OF b], simp)
   (* Drop the restriction to {0..<k} before unfolding the definition of median. *)
   have "median k (\<lambda>i \<in> {0..<k}. a) = median k (\<lambda>_. a)"
     by (subst median_restrict, simp)
   also have "... = a" using assms by (simp add:median_def a)
   finally show ?thesis by simp
 qed
 
 end
diff --git a/thys/Universal_Hash_Families/Carter_Wegman_Hash_Family.thy b/thys/Universal_Hash_Families/Carter_Wegman_Hash_Family.thy
--- a/thys/Universal_Hash_Families/Carter_Wegman_Hash_Family.thy
+++ b/thys/Universal_Hash_Families/Carter_Wegman_Hash_Family.thy
@@ -1,293 +1,293 @@
 section \<open>Carter-Wegman Hash Family\label{sec:carter_wegman}\<close>
 
 theory Carter_Wegman_Hash_Family
   imports
     Interpolation_Polynomials_HOL_Algebra.Interpolation_Polynomial_Cardinalities
-    Preliminary_Results
+    Universal_Hash_Families_More_Independent_Families
 begin
 
 text \<open>The Carter-Wegman hash family is a generic method to obtain
 $k$-universal hash families for arbitrary $k$. (There are faster solutions, such as tabulation
 hashing, which are limited to a specific $k$. See for example \<^cite>\<open>"thorup2010"\<close>.)
 
 The construction was described by Wegman and Carter~\<^cite>\<open>"wegman1981"\<close>. It is a hash
 family between the elements of a finite field and works by randomly choosing a polynomial
 over the field with degree less than $k$. The hash function is the evaluation of such a
 polynomial.
 
 Using the property that the fraction of polynomials interpolating a given set of $s \leq k$
 points is @{term "1/(card (carrier R)^s)"}, which is shown in
 \<^cite>\<open>"Interpolation_Polynomials_HOL_Algebra-AFP"\<close>, it is possible to obtain both that
 the hash functions are $k$-wise independent and uniformly distributed.
 
 In the following, two locales are introduced; the main reason for both is to make the statements
 of the theorems and proofs more concise. The first locale @{term "poly_hash_family"} fixes a finite
 ring $R$ and the probability space of the polynomials of degree less than $k$. Because the ring is
 not necessarily a field, the family is not yet $k$-universal, but it is still possible to state a few
 results such as the fact that the range of the hash function is a subset of the carrier of the ring.
 
 The second locale @{term "carter_wegman_hash_family"} is an extension of the former with the
 assumption that $R$ is a field, from which the $k$-universality follows.
 
 The reason for using two separate locales is to support use cases where the ring is only probably
 a field, for example, if it is the set of integers modulo an approximate prime. In such a situation, a
 subset of the properties of an algorithm using approximate primes would need to be verified
 even if $R$ is only a ring.\<close>
 
 (* The hash value of x under the function described by \<omega> is eval \<omega> x. *)
 definition (in ring) "hash x \<omega> = eval \<omega> x"
 
 (* Locale fixing a ring R with finite carrier and a positive number k. *)
 locale poly_hash_family = ring +
   fixes k :: nat
   assumes finite_carrier[simp]: "finite (carrier R)"
   assumes k_ge_0: "k > 0"
 begin
 
 (* space is the set bounded_degree_polynomials R k; M is the uniform distribution on it. *)
 definition space where "space = bounded_degree_polynomials R k"
 definition M where "M = measure_pmf (pmf_of_set space)"
 
 (* space is finite and non-empty; both facts are added to the simp set. *)
 lemma finite_space[simp]:"finite space"
     unfolding space_def using fin_degree_bounded finite_carrier by simp
 
 lemma non_empty_bounded_degree_polynomials[simp]:"space \<noteq> {}"
     unfolding space_def using non_empty_bounded_degree_polynomials by simp
 
 text \<open>This is to add @{thm [source] carrier_not_empty} to the simp set in the context of
 @{locale "poly_hash_family"}:\<close>
 
 lemma non_empty_carrier[simp]: "carrier R \<noteq> {}"
   by (simp add:carrier_not_empty)
 
 (* M is a probability space, so prob_space facts and notation are available below. *)
 sublocale prob_space "M"
   by (simp add:M_def prob_space_measure_pmf)
 
 (* Hash values of carrier elements lie in the carrier again. *)
 lemma hash_range[simp]:
   assumes "\<omega> \<in> space"
   assumes "x \<in> carrier R"
   shows "hash x \<omega> \<in> carrier R"
   using assms unfolding hash_def space_def bounded_degree_polynomials_def
   by (simp, metis eval_in_carrier polynomial_incl univ_poly_carrier)
 
 (* Image formulation of hash_range. *)
 lemma  hash_range_2:
   assumes "\<omega> \<in> space"
   shows "(\<lambda>x. hash x \<omega>) ` carrier R \<subseteq> carrier R"
   using hash_range assms by auto
 
 (* Every function on the sample space is integrable with respect to M (proved with
    integrable_measure_pmf_finite). *)
 lemma integrable_M[simp]:
   fixes f :: "'a list \<Rightarrow> 'c::{banach, second_countable_topology}"
   shows "integrable M f"
     unfolding M_def
     by (rule integrable_measure_pmf_finite, simp)
 
 end
 
 (* Extension of poly_hash_family by the assumption that R is a field. *)
 locale carter_wegman_hash_family = poly_hash_family +
   assumes field_R: "field R"
 begin
 (* Make the facts of the field locale available in this context. *)
 sublocale field
   using field_R by simp
 
 (* Shorthand for the number of elements of the carrier. *)
 abbreviation "field_size \<equiv> card (carrier R)"
 
 (* Number of elements of space that take prescribed carrier values y on a set K of at
    most k carrier points: field_size ^ (k - card K). Derived from
    interpolating_polynomials_card. *)
 lemma poly_cards:
   assumes "K \<subseteq> carrier R"
   assumes "card K \<le> k"
   assumes "y ` K \<subseteq> (carrier R)"
   shows
     "card {\<omega> \<in> space. (\<forall>k \<in> K. eval \<omega> k = y k)} = field_size^(k-card K)"
   unfolding space_def
   using interpolating_polynomials_card[where n="k-card K" and K="K"] assms
   using finite_carrier finite_subset by fastforce
 
 (* Special case of poly_cards for a single point x with prescribed value y. *)
 lemma poly_cards_single:
   assumes "x \<in> carrier R"
   assumes "y \<in> carrier R"
   shows "card {\<omega> \<in> space. eval \<omega> x = y} = field_size^(k-1)"
   using poly_cards[where K="{x}" and y="\<lambda>_. y", simplified] assms k_ge_0 by simp
 
 (* The probability that the hash function takes prescribed carrier values y on a set K of
    at most k carrier points is 1 / field_size ^ card K. *)
 lemma hash_prob:
   assumes "K \<subseteq> carrier R"
   assumes "card K \<le> k"
   assumes "y ` K \<subseteq> carrier R"
   shows
     "prob {\<omega>. (\<forall>x \<in> K. hash x \<omega> = y x)} = 1/(real field_size)^card K"
 proof -
   have "\<zero> \<in> carrier R" by simp
 
   (* a: the carrier is finite and contains \<zero>, so field_size is positive. *)
   hence a:"field_size > 0"
     using finite_carrier card_gt_0_iff by blast
 
   (* b: ratio of the counts given by poly_cards and bounded_degree_polynomials_card. *)
   have b:"real (card {\<omega> \<in> space. \<forall>x\<in>K. eval \<omega> x = y x}) / real (card space) =
     1 / real field_size ^ card K"
     using a assms(2)
     apply (simp add: frac_eq_eq poly_cards[OF assms(1,2,3)] power_add[symmetric])
     by (simp add:space_def bounded_degree_polynomials_card)
 
   (* Under the uniform distribution the probability is that ratio. *)
   show ?thesis
     unfolding M_def
     by (simp add:hash_def measure_pmf_of_set Int_def b)
 qed
 
 (* Single-point case of hash_prob: hash x takes the carrier value y with probability
    1 / field_size. *)
 lemma prob_single:
   assumes "x \<in> carrier R" "y \<in> carrier R"
   shows "prob {\<omega>. hash x \<omega> = y} = 1/(real field_size)"
   using hash_prob[where K="{x}"] assms finite_carrier k_ge_0 by simp
 
 (* The probability that hash x lands in a set A is the fraction of carrier elements that
    belong to A. *)
 lemma prob_range:
   assumes [simp]:"x \<in> carrier R"
   shows "prob {\<omega>. hash x \<omega> \<in> A} = card (A \<inter> carrier R) / field_size"
 proof -
   (* Split the event into the events "hash x \<omega> = a" for a in A \<inter> carrier R and sum the
      probabilities given by prob_single. *)
   have "prob {\<omega>. hash x \<omega> \<in> A} = prob (\<Union>a \<in> A \<inter> carrier R. {\<omega>. hash x \<omega> = a})"
     by (rule measure_pmf_eq, auto simp:M_def)
   also have "... = (\<Sum> a \<in> (A \<inter> carrier R). prob {\<omega>. hash x \<omega> = a})"
     by (rule measure_finite_Union, auto simp:M_def disjoint_family_on_def)
   also have "... = (\<Sum> a \<in> (A \<inter> carrier R). 1/(real field_size))"
     by (rule sum.cong, auto simp:prob_single)
   also have "... = card (A \<inter> carrier R) / field_size"
     by simp
   finally show ?thesis by simp
 qed
 
 (* The hash values at the points of a set J of at most k carrier elements are independent
    random variables. The proof uses indep_vars_pmf, which asks for a product formula for
    every finite J' \<subseteq> J and every assignment a of values. *)
 lemma indep:
   assumes "J \<subseteq> carrier R"
   assumes "card J \<le> k"
   shows "indep_vars (\<lambda>_. discrete) hash J"
 proof -
   have "\<zero> \<in> carrier R" by simp
   hence card_R_ge_0:"field_size > 0"
     using card_gt_0_iff finite_carrier by blast
 
   have fin_J: "finite J"
     using finite_carrier assms(1) finite_subset by blast
 
   show ?thesis
   proof (rule indep_vars_pmf[OF M_def])
     fix a
     fix J'
     assume a: "J' \<subseteq> J" "finite J'"
     have card_J': "card J' \<le> k"
       by (metis card_mono order_trans a(1) assms(2) fin_J)
     have J'_in_carr: "J' \<subseteq> carrier R" by (metis order_trans a(1) assms(1))
 
     show "prob {\<omega>. \<forall>x\<in>J'. hash x \<omega> = a x} = (\<Prod>x\<in>J'. prob  {\<omega>. hash x \<omega> = a x})"
     proof (cases "a ` J' \<subseteq> carrier R")
       (* Case 1: all prescribed values lie in the carrier. Both sides are computed from
          the counts given by poly_cards and poly_cards_single. *)
       case True
       have a_carr: "\<And>x. x \<in> J' \<Longrightarrow> a x \<in> carrier R"  using True by force
       have "prob {\<omega>. \<forall>x\<in>J'. hash x \<omega> = a x} =
         real (card {\<omega> \<in> space. \<forall>x\<in>J'. eval \<omega> x = a x}) / real (card space)"
         by (simp add:M_def measure_pmf_of_set Int_def hash_def)
       also have "... = real (field_size ^ (k - card J')) / real (card space)"
         using True by (simp add: poly_cards[OF J'_in_carr card_J'])
       also have
         "... = real field_size ^ (k - card J') / real field_size ^ k"
         by (simp add:space_def bounded_degree_polynomials_card)
       also have
         "... = real field_size ^ ((k - 1) * card J') / real field_size ^ (k * card J')"
         using card_J' by (simp add:power_add[symmetric] power_mult[symmetric]
             diff_mult_distrib frac_eq_eq add.commute)
       also have
         "... = (real field_size ^ (k - 1)) ^ card J' / (real field_size ^ k) ^ card J'"
         by (simp add:power_add power_mult)
       also have
         "... =  (\<Prod>x\<in>J'. real (card {\<omega> \<in> space. eval \<omega> x = a x}) / real (card space))"
         using a_carr poly_cards_single[OF subsetD[OF J'_in_carr]]
         by (simp add:space_def bounded_degree_polynomials_card power_divide)
       also have "... = (\<Prod>x\<in>J'. prob {\<omega>. hash x \<omega> = a x})"
         by (simp add:measure_pmf_of_set M_def Int_def hash_def)
       finally show ?thesis by simp
     next
       (* Case 2: some prescribed value a j lies outside the carrier. By hash_range no
          element of space attains it, so the set for j and the joint set are both empty. *)
       case False
       then obtain j where j_def: "j \<in> J'" "a j \<notin> carrier R" by blast
       have "{\<omega> \<in> space. hash j \<omega> = a j} \<subseteq> {\<omega> \<in> space. hash j \<omega> \<notin> carrier R}"
         by (rule subsetI, simp add:j_def)
       also have "... \<subseteq> {}" using j_def(1) J'_in_carr hash_range by blast
       finally have b:"{\<omega> \<in> space. hash j \<omega> = a j} = {}" by simp
       hence "real (card ({\<omega> \<in> space. hash j \<omega> = a j})) = 0" by simp
       hence "(\<Prod>x\<in>J'. real (card {\<omega> \<in> space. hash x \<omega> = a x})) = 0"
         using a(2) prod_zero[OF a(2)] j_def(1) by auto
       moreover have
         "{\<omega> \<in> space. \<forall>x\<in>J'. hash x \<omega> = a x} \<subseteq> {\<omega> \<in> space. hash j \<omega> = a j}"
         using j_def by blast
       hence "{\<omega> \<in> space. \<forall>x\<in>J'. hash x \<omega> = a x} = {}" using b by blast
       ultimately show ?thesis
         by (simp add:measure_pmf_of_set M_def Int_def prod_dividef)
     qed
   qed
 qed
 
 (* The hash values over the whole carrier are k-wise independent; follows from indep by
    unfolding k_wise_indep_vars_def. *)
 lemma k_wise_indep:
   "k_wise_indep_vars k (\<lambda>_. discrete) hash (carrier R)"
   unfolding k_wise_indep_vars_def using indep by simp
 
 (* An element of space of degree 1 gives an injective hash function on the carrier;
    follows from eval_inj_if_degree_1. *)
 lemma inj_if_degree_1:
   assumes "\<omega> \<in> space"
   assumes "degree \<omega> = 1"
   shows "inj_on (\<lambda>x. hash x \<omega>) (carrier R)"
   using assms eval_inj_if_degree_1
   by (simp add:M_def space_def bounded_degree_polynomials_def hash_def)
 
 (* For every carrier element i, the random variable hash i satisfies uniform_on with
    respect to the carrier. *)
 lemma uniform:
   assumes "i \<in> carrier R"
   shows "uniform_on (hash i) (carrier R)"
 proof -
   (* a: singleton probabilities, obtained from prob_range. *)
   have a:
     "\<And>a. prob {\<omega>. hash i \<omega> \<in> {a}} = indicat_real (carrier R) a / real field_size"
     by (subst prob_range[OF assms], simp add:indicator_def)
   show ?thesis
     by (rule uniform_onI, use a M_def in auto)
 qed
 
 text \<open>This is the main result of this section - the Carter-Wegman hash family is $k$-universal.\<close>
 
 (* Combines uniform and k_wise_indep via k_universal_def. *)
 theorem k_universal:
   "k_universal k hash (carrier R) (carrier R)"
   using uniform k_wise_indep by (simp add:k_universal_def)
 
 end
 
 (* Introduction rule for the locale predicate poly_hash_family. *)
 lemma poly_hash_familyI:
   assumes "ring R"
   assumes "finite (carrier R)"
   assumes "0 < k"
   shows "poly_hash_family R k"
   using assms
   by (simp add:poly_hash_family_def poly_hash_family_axioms_def)
 
 (* Introduction rule for the locale predicate carter_wegman_hash_family; the ring
    property required by poly_hash_familyI is obtained from field.is_ring. *)
 lemma carter_wegman_hash_familyI:
   assumes "field F"
   assumes "finite (carrier F)"
   assumes "0 < k"
   shows "carter_wegman_hash_family F k"
   using assms field.is_ring[OF assms(1)] poly_hash_familyI
   by (simp add:carter_wegman_hash_family_def carter_wegman_hash_family_axioms_def)
 
 (* Restatement of k_wise_indep outside the locale: for a finite field F and n >= 1, the
    hash values are n-wise independent under the uniform distribution on
    bounded_degree_polynomials F n, with pmf_of_set (carrier F) as target spaces. *)
 lemma hash_k_wise_indep:
   assumes "field F \<and> finite (carrier F)"
   assumes "1 \<le> n"
   shows
     "prob_space.k_wise_indep_vars (pmf_of_set (bounded_degree_polynomials F n)) n
     (\<lambda>_. pmf_of_set (carrier F)) (ring.hash F) (carrier F)"
 proof -
   interpret carter_wegman_hash_family "F" "n"
     using assms carter_wegman_hash_familyI by force
   (* Change the target spaces from discrete to pmf_of_set (carrier F). *)
   have "k_wise_indep_vars n (\<lambda>_. pmf_of_set (carrier F)) hash (carrier F)"
     by (rule k_wise_indep_vars_compose[OF k_wise_indep], simp)
   thus ?thesis
     by (simp add:M_def space_def)
 qed
 
 (* Restatement of prob_single outside the locale: for a finite field F and n >= 1, the
    hash of a carrier element x equals a carrier element y with probability
    1 / card (carrier F). *)
 lemma hash_prob_single:
   assumes "field F \<and> finite (carrier F)"
   assumes "x \<in> carrier F"
   assumes "1 \<le> n"
   assumes "y \<in> carrier F"
   shows
     "\<P>(\<omega> in pmf_of_set (bounded_degree_polynomials F n). ring.hash F x \<omega> = y)
       = 1/(real (card (carrier F)))"
 proof -
   interpret carter_wegman_hash_family "F" "n"
     using assms carter_wegman_hash_familyI by force
   show ?thesis
     using prob_single[OF assms(2,4)] by (simp add:M_def space_def)
 qed
 
 end
diff --git a/thys/Universal_Hash_Families/ROOT b/thys/Universal_Hash_Families/ROOT
--- a/thys/Universal_Hash_Families/ROOT
+++ b/thys/Universal_Hash_Families/ROOT
@@ -1,16 +1,16 @@
 chapter AFP
 
 session Universal_Hash_Families = "HOL-Probability" +
   options [timeout = 600]
   sessions
     "HOL-Algebra"
     "Finite_Fields"
     "Interpolation_Polynomials_HOL_Algebra"
   theories
-    Definitions
-    Preliminary_Results
+    Universal_Hash_Families
+    Universal_Hash_Families_More_Independent_Families
     Carter_Wegman_Hash_Family
-    Field
+    Universal_Hash_Families_More_Finite_Fields
   document_files
     "root.tex"
     "root.bib"
diff --git a/thys/Universal_Hash_Families/Definitions.thy b/thys/Universal_Hash_Families/Universal_Hash_Families.thy
rename from thys/Universal_Hash_Families/Definitions.thy
rename to thys/Universal_Hash_Families/Universal_Hash_Families.thy
--- a/thys/Universal_Hash_Families/Definitions.thy
+++ b/thys/Universal_Hash_Families/Universal_Hash_Families.thy
@@ -1,81 +1,81 @@
 section \<open>Introduction and Definition\<close>
 
-theory Definitions
+theory Universal_Hash_Families
   imports "HOL-Probability.Independent_Family"
 begin
 
 text \<open>Universal hash families are commonly used in randomized algorithms and data structures to
 randomize the input of algorithms, such that probabilistic methods can be employed without requiring
 any assumptions about the input distribution.
 
 If we regard a family of hash functions from a domain $D$ to a finite range $R$ as a uniform probability
 space, then the family is $k$-universal if:
 \begin{itemize}
 \item For each $x \in D$ the evaluation of the functions at $x$ forms a uniformly distributed random variable on $R$.
 \item The evaluation random variables for $k$ or fewer distinct domain elements form an
 independent family of random variables.
 \end{itemize}
 
 This definition closely follows the definition from Vadhan~\<^cite>\<open>\<open>\textsection 3.5.5\<close> in "vadhan2012"\<close>, with the minor
 modification that independence is required not only for exactly $k$, but also for \emph{fewer} than $k$ distinct
 domain elements. The correction is due to the fact that in the corner case where $D$ has fewer than $k$ elements,
 the second part of their definition becomes void. In the formalization this helps avoid an unnecessary assumption in
 the theorems.
 
 The following definition introduces the notion of $k$-wise independent random variables:\<close>
 
 (* X is k-wise independent on the index set I when indep_vars M' X J holds for
    every finite subset J of I with card J <= k. *)
 definition (in prob_space) k_wise_indep_vars where
   "k_wise_indep_vars k M' X I =
     (\<forall>J \<subseteq> I. card J \<le> k \<longrightarrow> finite J \<longrightarrow> indep_vars M' X J)"
 
 (* Destruction rule for k_wise_indep_vars: a finite subset J of I with at most
    k elements is an independent family. Follows directly from the definition. *)
 lemma (in prob_space) k_wise_indep_vars_subset:
   assumes "k_wise_indep_vars k M' X I"
   assumes "J \<subseteq> I"
   assumes "finite J"
   assumes "card J \<le> k"
   shows "indep_vars M' X J"
   using assms
   by (simp add:k_wise_indep_vars_def)
 
 text \<open>Similarly for a finite non-empty set $A$ the predicate @{term "uniform_on X A"} indicates that
 the random variable is uniformly distributed on $A$:\<close>
 
 (* uniform_on X A is the conjunction of four conditions: the distribution of X
    on count_space UNIV equals uniform_measure (count_space UNIV) A; A is
    non-empty; A is finite; and X is a random variable into count_space UNIV. *)
 definition (in prob_space) "uniform_on X A = (
   distr M (count_space UNIV) X = uniform_measure (count_space UNIV) A \<and>
   A \<noteq> {} \<and> finite A \<and> random_variable (count_space UNIV) X)"
 
 (* Consequence of uniform_on: the probability that X takes a value in B is
    card (A Int B) / card A. *)
 lemma (in prob_space) uniform_onD:
   assumes "uniform_on X A"
   shows "prob {\<omega> \<in> space M. X \<omega> \<in> B} = card (A \<inter> B) / card A"
 proof -
   (* Rewrite the event as a preimage under X. *)
   have "prob {\<omega> \<in> space M. X \<omega> \<in> B} = prob (X -` B \<inter> space M)"
     by (subst Int_commute, simp add:vimage_def Int_def)
   (* Express it as the measure of B under the distribution of X. *)
   also have "... = measure (distr M (count_space UNIV) X) B"
     using assms by (subst measure_distr, auto simp:uniform_on_def)
   (* By uniform_on this distribution is the uniform measure on A. *)
   also have "... = measure (uniform_measure (count_space UNIV) A) B"
     using assms by (simp add:uniform_on_def)
   also have "... = card (A \<inter> B) / card A"
     using assms by (subst measure_uniform_measure, auto simp:uniform_on_def)+
   finally show ?thesis by simp
 qed
 
 text \<open>With the two previous definitions it is possible to define the $k$-universality condition for a family
 of hash functions from $D$ to $R$:\<close>
 
 (* k_universal k X D R: the family X, indexed by D, is k-wise independent
    (with target space count_space UNIV) and each X i with i in D is uniformly
    distributed on R. *)
 definition (in prob_space) "k_universal k X D R = (
   k_wise_indep_vars k (\<lambda>_. count_space UNIV) X D \<and>
   (\<forall>i \<in> D. uniform_on (X i) R))"
 
 text \<open>Note: The definition is slightly more generic than the informal specification from above.
 This is because usually a family is formed by a single function with a variable seed parameter. Instead of
 choosing a random function from a probability space, a random seed is chosen from the probability space
 which parameterizes the hash function.
 
 The following section contains some preliminary results about independent families
 of random variables.
 Section~\ref{sec:carter_wegman} introduces the Carter-Wegman hash family, which is an
 explicit construction of $k$-universal families for arbitrary $k$ using polynomials over finite fields.
 The last section contains a proof that the factor ring of the integers modulo a prime ideal is a finite field,
 followed by an isomorphic construction of prime fields over an initial segment of the natural numbers.\<close>
 
 end
diff --git a/thys/Universal_Hash_Families/Field.thy b/thys/Universal_Hash_Families/Universal_Hash_Families_More_Finite_Fields.thy
rename from thys/Universal_Hash_Families/Field.thy
rename to thys/Universal_Hash_Families/Universal_Hash_Families_More_Finite_Fields.thy
--- a/thys/Universal_Hash_Families/Field.thy
+++ b/thys/Universal_Hash_Families/Universal_Hash_Families_More_Finite_Fields.thy
@@ -1,253 +1,253 @@
 section \<open>Finite Fields\<close>
 
-theory Field
+theory Universal_Hash_Families_More_Finite_Fields
   imports
-    "Finite_Fields.Ring_Characteristic"
+    Finite_Fields.Ring_Characteristic
     "HOL-Algebra.Ring_Divisibility"
     "HOL-Algebra.IntRing"
 begin
 
 text \<open>In some applications it is more convenient to work with natural numbers instead of
 @{term "ZFact p"} whose elements are cosets. To support that use case the following definition
 introduces an additive and multiplicative structure on @{term "{..<p}"}. After verifying that
 the function @{term "zfact_iso"} and its inverse are homomorphisms, the ring and field property
 can be transferred from @{term "ZFact p"} to the structure on @{term "{..<p}"}.\<close>
 
 (* For n > 0, zfact_iso n maps 0 to the zero element of ZFact (int n). *)
 lemma zfact_iso_0:
   assumes "n > 0"
   shows "zfact_iso n 0 = \<zero>\<^bsub>ZFact (int n)\<^esub>"
 proof -
   (* ?I is the ideal of the integers generated by int n. *)
   let ?I = "Idl\<^bsub>\<Z>\<^esub> {int n}"
   have ideal_I: "ideal ?I \<Z>"
     by (simp add: int.genideal_ideal)
 
   (* Interpret the ideal and the coset map as a ring homomorphism into
      ZFact (int n); their facts are available to the final simp step. *)
   interpret i:ideal "?I" "\<Z>" using ideal_I by simp
   interpret s:ring_hom_ring "\<Z>" "ZFact (int n)" "(+>\<^bsub>\<Z>\<^esub>) ?I"
    using i.rcos_ring_hom_ring ZFact_def by auto
 
   show ?thesis
     by (simp add:zfact_iso_def ZFact_def)
 qed
 
 (* For a prime natural number p, ZFact (int p) is a field. Obtained from
    zfact_prime_is_finite_field by unfolding finite_field_def. *)
 lemma zfact_prime_is_field:
   assumes "Factorial_Ring.prime (p :: nat)"
   shows "field (ZFact (int p))"
   using zfact_prime_is_finite_field[OF assms] finite_field_def by auto
 
 (* Ring record on the natural numbers below n: the carrier is {..<n},
    multiplication and addition are computed modulo n, and the constants are
    the literals 1 and 0. *)
 definition mod_ring :: "nat => nat ring"
   where "mod_ring n = \<lparr>
     carrier = {..<n},
     mult = (\<lambda> x y. (x * y) mod n),
     one = 1,
     zero = 0,
     add = (\<lambda> x y. (x + y) mod n) \<rparr>"
 
 (* Inverse of zfact_iso p with respect to the domain {..<p}, defined via
    inv_into. *)
 definition zfact_iso_inv :: "nat \<Rightarrow> int set \<Rightarrow> nat" where
   "zfact_iso_inv p = inv_into {..<p} (zfact_iso p)"
 
 (* For n > 0, zfact_iso_inv n maps the zero of ZFact (int n) to 0. The zero is
    first rewritten as zfact_iso n 0 (zfact_iso_0), then inv_into_f_f is applied
    using injectivity of zfact_iso. *)
 lemma zfact_iso_inv_0:
   assumes n_ge_0: "n > 0"
   shows "zfact_iso_inv n \<zero>\<^bsub>ZFact (int n)\<^esub> = 0"
   unfolding zfact_iso_inv_def zfact_iso_0[OF n_ge_0, symmetric] using n_ge_0
   by (rule inv_into_f_f[OF zfact_iso_inj], simp add:mod_ring_def)
 
 (* Every element x of the carrier of ZFact (int n), n > 0, is the coset of the
    ideal I generated by int n with representative int (zfact_iso_inv n x). *)
 lemma zfact_coset:
   assumes n_ge_0: "n > 0"
   assumes "x \<in> carrier (ZFact (int n))"
   defines "I \<equiv> Idl\<^bsub>\<Z>\<^esub> {int n}"
   shows "x = I +>\<^bsub>\<Z>\<^esub> (int (zfact_iso_inv n x))"
 proof -
   (* x lies in the image of zfact_iso n on {..<n} ... *)
   have "x \<in> zfact_iso n ` {..<n}"
     using assms zfact_iso_ran by simp
   (* ... so applying zfact_iso n after its inverse returns x. *)
   hence "zfact_iso n (zfact_iso_inv n x) = x"
     unfolding zfact_iso_inv_def by (rule f_inv_into_f)
   thus ?thesis unfolding zfact_iso_def I_def by blast
 qed
 
 (* For n > 1, zfact_iso_inv n is a ring isomorphism from ZFact (int n) to
    mod_ring n. The proof applies ring_iso_memI and discharges its goals in
    order: carrier closure, compatibility with multiplication, compatibility
    with addition, preservation of one, and bijectivity. *)
 lemma zfact_iso_inv_is_ring_iso:
   assumes n_ge_1: "n > 1"
   shows "zfact_iso_inv n \<in> ring_iso (ZFact (int n)) (mod_ring n)"
 proof (rule ring_iso_memI)
   interpret r:cring "(ZFact (int n))"
     using ZFact_is_cring by simp
 
   (* I is the ideal of the integers generated by int n. *)
   define I where "I = Idl\<^bsub>\<Z>\<^esub> {int n}"
 
   have n_ge_0: "n > 0" using n_ge_1 by simp
 
   interpret i:ideal "I" "\<Z>"
     unfolding I_def using int.genideal_ideal by simp
 
   (* The coset map is a ring homomorphism from the integers to ZFact (int n). *)
   interpret s:ring_hom_ring "\<Z>" "ZFact (int n)" "(+>\<^bsub>\<Z>\<^esub>) I"
    using i.rcos_ring_hom_ring ZFact_def I_def by auto
 
   (* Goal: zfact_iso_inv n maps the carrier of ZFact (int n) into the carrier
      of mod_ring n. *)
   show
     "\<And>x. x \<in> carrier (ZFact (int n)) \<Longrightarrow> zfact_iso_inv n x \<in> carrier (mod_ring n)"
   proof -
     fix x
     assume "x \<in> carrier (ZFact (int n))"
     hence "zfact_iso_inv n x \<in> {..<n}"
       unfolding zfact_iso_inv_def
       using zfact_iso_ran[OF n_ge_0] inv_into_into by metis
 
     thus "zfact_iso_inv n x \<in> carrier (mod_ring n)"
       unfolding mod_ring_def by simp
   qed
 
   (* Goal: compatibility with multiplication. *)
   show "\<And>x y. x \<in> carrier (ZFact (int n)) \<Longrightarrow> y \<in> carrier (ZFact (int n)) \<Longrightarrow>
     zfact_iso_inv n (x \<otimes>\<^bsub>ZFact (int n)\<^esub> y) =
     zfact_iso_inv n x \<otimes>\<^bsub>mod_ring n\<^esub> zfact_iso_inv n y"
   proof -
     fix x y
     assume x_carr: "x \<in> carrier (ZFact (int n))"
     define x' where "x' = zfact_iso_inv n x"
     assume y_carr: "y \<in> carrier (ZFact (int n))"
     define y' where "y' = zfact_iso_inv n y"
     (* Write x and y as cosets with representatives x' and y' (zfact_coset),
        multiply the representatives, and reduce modulo n. *)
     have "x \<otimes>\<^bsub>ZFact (int n)\<^esub> y = (I +>\<^bsub>\<Z>\<^esub> (int x')) \<otimes>\<^bsub>ZFact (int n)\<^esub> (I +>\<^bsub>\<Z>\<^esub> (int y'))"
       unfolding x'_def y'_def
       using x_carr y_carr zfact_coset[OF n_ge_0] I_def by simp
     also have "... = (I +>\<^bsub>\<Z>\<^esub> (int x' * int y'))"
       by simp
     also have "... = (I +>\<^bsub>\<Z>\<^esub> (int ((x' * y') mod n)))"
       unfolding I_def zmod_int by (rule int_cosetI[OF n_ge_0],simp)
     also have "... = (I +>\<^bsub>\<Z>\<^esub> (x' \<otimes>\<^bsub>mod_ring n\<^esub> y'))"
       unfolding mod_ring_def by simp
     also have "... = zfact_iso n (x' \<otimes>\<^bsub>mod_ring n\<^esub> y')"
       unfolding zfact_iso_def I_def by simp
     finally have a:"x \<otimes>\<^bsub>ZFact (int n)\<^esub> y = zfact_iso n (x' \<otimes>\<^bsub>mod_ring n\<^esub> y')"
       by simp
     (* The product in mod_ring n lies in {..<n}, so zfact_iso_inv n undoes
        zfact_iso n on it. *)
     have b:"x' \<otimes>\<^bsub>mod_ring n\<^esub> y' \<in> {..<n}"
       using mod_ring_def n_ge_0 by auto
     have "zfact_iso_inv n (zfact_iso n (x' \<otimes>\<^bsub>mod_ring n\<^esub> y')) = x' \<otimes>\<^bsub>mod_ring n\<^esub> y'"
       unfolding zfact_iso_inv_def
       by (rule inv_into_f_f[OF zfact_iso_inj[OF n_ge_0] b])
     thus
       "zfact_iso_inv n (x \<otimes>\<^bsub>ZFact (int n)\<^esub> y) =
       zfact_iso_inv n x \<otimes>\<^bsub>mod_ring n\<^esub> zfact_iso_inv n y"
       using a x'_def y'_def by simp
   qed
 
   (* Goal: compatibility with addition; same structure as the multiplicative
      case above. *)
   show "\<And>x y. x \<in> carrier (ZFact (int n)) \<Longrightarrow> y \<in> carrier (ZFact (int n)) \<Longrightarrow>
     zfact_iso_inv n (x \<oplus>\<^bsub>ZFact (int n)\<^esub> y) =
     zfact_iso_inv n x \<oplus>\<^bsub>mod_ring n\<^esub> zfact_iso_inv n y"
   proof -
     fix x y
     assume x_carr: "x \<in> carrier (ZFact (int n))"
     define x' where "x' = zfact_iso_inv n x"
     assume y_carr: "y \<in> carrier (ZFact (int n))"
     define y' where "y' = zfact_iso_inv n y"
     have "x \<oplus>\<^bsub>ZFact (int n)\<^esub> y = (I +>\<^bsub>\<Z>\<^esub> (int x')) \<oplus>\<^bsub>ZFact (int n)\<^esub> (I +>\<^bsub>\<Z>\<^esub> (int y'))"
       unfolding x'_def y'_def
       using x_carr y_carr zfact_coset[OF n_ge_0] I_def by simp
     also have "... = (I +>\<^bsub>\<Z>\<^esub> (int x' + int y'))"
       by simp
     also have "... = (I +>\<^bsub>\<Z>\<^esub> (int ((x' + y') mod n)))"
       unfolding I_def zmod_int by (rule int_cosetI[OF n_ge_0],simp)
     also have "... = (I +>\<^bsub>\<Z>\<^esub> (x' \<oplus>\<^bsub>mod_ring n\<^esub> y'))"
       unfolding mod_ring_def by simp
     also have "... = zfact_iso n (x' \<oplus>\<^bsub>mod_ring n\<^esub> y')"
       unfolding zfact_iso_def I_def by simp
     finally have a:"x \<oplus>\<^bsub>ZFact (int n)\<^esub> y = zfact_iso n (x' \<oplus>\<^bsub>mod_ring n\<^esub> y')"
       by simp
     have b:"x' \<oplus>\<^bsub>mod_ring n\<^esub> y' \<in> {..<n}"
       using mod_ring_def n_ge_0 by auto
     have "zfact_iso_inv n (zfact_iso n (x' \<oplus>\<^bsub>mod_ring n\<^esub> y')) = x' \<oplus>\<^bsub>mod_ring n\<^esub> y'"
       unfolding zfact_iso_inv_def
       by (rule inv_into_f_f[OF zfact_iso_inj[OF n_ge_0] b])
     thus
       "zfact_iso_inv n (x \<oplus>\<^bsub>ZFact (int n)\<^esub> y) =
       zfact_iso_inv n x \<oplus>\<^bsub>mod_ring n\<^esub> zfact_iso_inv n y"
       using a x'_def y'_def by simp
   qed
 
   (* Goal: the one of ZFact (int n) is mapped to the one of mod_ring n. The
      one is first expressed as the image of the one of mod_ring n under
      zfact_iso n. *)
   have "\<one>\<^bsub>ZFact (int n)\<^esub> = zfact_iso n (\<one>\<^bsub>mod_ring n\<^esub>)"
     by (simp add:zfact_iso_def ZFact_def I_def[symmetric] mod_ring_def)
 
   thus "zfact_iso_inv n \<one>\<^bsub>ZFact (int n)\<^esub> = \<one>\<^bsub>mod_ring n\<^esub>"
     unfolding zfact_iso_inv_def mod_ring_def
     using inv_into_f_f[OF zfact_iso_inj] n_ge_1 by simp
 
   (* Goal: bijectivity, from zfact_iso_bij and bij_betw_inv_into. *)
   show "bij_betw (zfact_iso_inv n) (carrier (ZFact (int n))) (carrier (mod_ring n))"
     using zfact_iso_inv_def mod_ring_def zfact_iso_bij[OF n_ge_0] bij_betw_inv_into
     by force
 qed
 
 (* The carrier of mod_ring n is finite; immediate from mod_ring_def. *)
 lemma mod_ring_finite:
   "finite (carrier (mod_ring n))"
   by (simp add:mod_ring_def)
 
 (* Membership in the carrier of mod_ring n is equivalent to being below n. *)
 lemma mod_ring_carr:
   "x \<in> carrier (mod_ring n) \<longleftrightarrow>  x < n"
   by (simp add:mod_ring_def)
 
 (* For n > 1, mod_ring n is a commutative ring. The property is transferred
    from ZFact (int n) along the isomorphism zfact_iso_inv n. *)
 lemma mod_ring_is_cring:
   assumes n_ge_1: "n > 1"
   shows "cring (mod_ring n)"
 proof -
   have n_ge_0: "n > 0" using n_ge_1 by simp
 
   interpret cring "ZFact (int n)"
     using ZFact_is_cring by simp
 
   (* ring_iso_imp_img_cring gives the result for mod_ring n with its zero
      field replaced by the image of the zero of ZFact (int n). *)
   have "cring ((mod_ring n) \<lparr> zero := zfact_iso_inv n \<zero>\<^bsub>ZFact (int n)\<^esub> \<rparr>)"
     by (rule ring_iso_imp_img_cring[OF zfact_iso_inv_is_ring_iso[OF n_ge_1]])
   (* By zfact_iso_inv_0 that image is 0, so the record update changes nothing. *)
   moreover have
     "(mod_ring n) \<lparr> zero := zfact_iso_inv n \<zero>\<^bsub>ZFact (int n)\<^esub> \<rparr> = mod_ring n"
     using zfact_iso_inv_0[OF n_ge_0]
     by (simp add:mod_ring_def)
   ultimately show ?thesis by simp
 qed
 
 (* For n > 1, zfact_iso n is a ring isomorphism from mod_ring n to
    ZFact (int n), i.e. the converse direction of zfact_iso_inv_is_ring_iso. *)
 lemma zfact_iso_is_ring_iso:
   assumes n_ge_1: "n > 1"
   shows "zfact_iso n \<in> ring_iso (mod_ring n) (ZFact (int n))"
 proof -
   have r:"ring (ZFact (int n))"
     using ZFact_is_cring cring.axioms(1) by blast
 
   interpret s: ring "(mod_ring n)"
     using mod_ring_is_cring cring.axioms(1) n_ge_1 by blast
   have n_ge_0: "n > 0" using n_ge_1 by linarith
 
   (* The inverse (via inv_into) of the isomorphism zfact_iso_inv n is an
      isomorphism in the opposite direction (ring_iso_set_sym). *)
   have
     "inv_into (carrier (ZFact (int n))) (zfact_iso_inv n)
       \<in> ring_iso (mod_ring n) (ZFact (int n))"
     using ring_iso_set_sym[OF r zfact_iso_inv_is_ring_iso[OF n_ge_1]] by simp
   (* On the carrier of mod_ring n this inverse coincides with zfact_iso n. *)
   moreover have "\<And>x. x \<in> carrier (mod_ring n) \<Longrightarrow>
     inv_into (carrier (ZFact (int n))) (zfact_iso_inv n) x = zfact_iso n x"
   proof -
     fix x
     assume "x \<in> carrier (mod_ring n)"
     hence "x \<in> {..<n}" by (simp add:mod_ring_def)
     thus "inv_into (carrier (ZFact (int n))) (zfact_iso_inv n) x = zfact_iso n x"
       unfolding zfact_iso_inv_def
       by (simp add:inv_into_inv_into_eq[OF zfact_iso_bij[OF n_ge_0]])
   qed
 
   (* Conclude with ring_iso_restrict from the two facts above. *)
   ultimately show ?thesis
     using s.ring_iso_restrict by blast
 qed
 
 text \<open>If @{term "p"} is a prime then @{term "mod_ring p"} is a field:\<close>
 
 (* For a prime p, mod_ring p is a field. The property is transferred from
    ZFact (int p) along the isomorphism zfact_iso_inv p, following the same
    pattern as mod_ring_is_cring. *)
 lemma mod_ring_is_field:
   assumes"Factorial_Ring.prime p"
   shows "field (mod_ring p)"
 proof -
   have p_ge_0: "p > 0" using assms prime_gt_0_nat by blast
   have p_ge_1: "p > 1" using assms prime_gt_1_nat by blast
 
   interpret field "ZFact (int p)"
     using zfact_prime_is_field[OF assms] by simp
 
   (* ring_iso_imp_img_field gives the result for mod_ring p with its zero
      field replaced by the image of the zero of ZFact (int p). *)
   have "field ((mod_ring p) \<lparr> zero := zfact_iso_inv p \<zero>\<^bsub>ZFact (int p)\<^esub> \<rparr>)"
     by (rule ring_iso_imp_img_field[OF zfact_iso_inv_is_ring_iso[OF p_ge_1]])
 
   (* By zfact_iso_inv_0 that image is 0, so the record update changes nothing. *)
   moreover have
     "(mod_ring p) \<lparr> zero := zfact_iso_inv p \<zero>\<^bsub>ZFact (int p)\<^esub> \<rparr> = mod_ring p"
     using zfact_iso_inv_0[OF p_ge_0]
     by (simp add:mod_ring_def)
   ultimately show ?thesis by simp
 qed
 
 end
diff --git a/thys/Universal_Hash_Families/Preliminary_Results.thy b/thys/Universal_Hash_Families/Universal_Hash_Families_More_Independent_Families.thy
rename from thys/Universal_Hash_Families/Preliminary_Results.thy
rename to thys/Universal_Hash_Families/Universal_Hash_Families_More_Independent_Families.thy
--- a/thys/Universal_Hash_Families/Preliminary_Results.thy
+++ b/thys/Universal_Hash_Families/Universal_Hash_Families_More_Independent_Families.thy
@@ -1,348 +1,348 @@
 section \<open>Preliminary Results\<close>
 
-theory Preliminary_Results
+theory Universal_Hash_Families_More_Independent_Families
   imports
-    "Definitions"
+    Universal_Hash_Families
     "HOL-Probability.Stream_Space"
     "HOL-Probability.Probability_Mass_Function"
 begin
 
 (* If f x = h (g x) whenever P x holds, then the set comprehension over f is
    the image under h of the set comprehension over g. *)
 lemma set_comp_image_cong:
   assumes "\<And>x. P x \<Longrightarrow> f x = h (g x)"
   shows "{f x| x. P x} = h ` {g x| x. P x}"
   using assms by (auto simp: setcompr_eq_image)
 
 (* k-wise independence is preserved when each variable X i is post-composed
    with a function Y i that is measurable from M' i to N i. Lifts
    indep_vars_compose2 to the k-wise notion. *)
 lemma (in prob_space) k_wise_indep_vars_compose:
   assumes "k_wise_indep_vars k M' X I"
   assumes "\<And>i. i \<in> I \<Longrightarrow> Y i \<in> measurable (M' i) (N i)"
   shows "k_wise_indep_vars k N (\<lambda>i x. Y i (X i x)) I"
   using indep_vars_compose2[where N="N" and X="X" and Y="Y" and M'="M'"] assms
   by (simp add: k_wise_indep_vars_def subsetD)
 
 text \<open>The following two lemmas are of independent interest; they help infer independence of events
 and random variables on distributions. (Candidates for
 @{theory "HOL-Probability.Independent_Family"}).\<close>
 
 (* Independence of the set families A i under the push-forward measure
    distr M N f follows from independence, under M, of the families F i of
    their preimages under f, provided each A i consists of N-measurable sets. *)
 lemma (in prob_space) indep_sets_distr:
   fixes A
   assumes "random_variable N f"
   defines "F \<equiv> (\<lambda>i. (\<lambda>a. f -` a \<inter> space M) ` A i)"
   assumes indep_F: "indep_sets F I"
   assumes sets_A: "\<And>i. i \<in> I \<Longrightarrow> A i \<subseteq> sets N"
   shows "prob_space.indep_sets (distr M N f) A I"
 proof (rule prob_space.indep_setsI)
   (* Product formula for a finite non-empty J and a choice A' j from A j. *)
   show "\<And>A' J. J \<noteq> {} \<Longrightarrow> J \<subseteq> I \<Longrightarrow> finite J \<Longrightarrow> \<forall>j\<in>J. A' j \<in> A j \<Longrightarrow>
       measure (distr M N f) (\<Inter> (A' ` J)) = (\<Prod>j\<in>J. measure (distr M N f) (A' j))"
   proof -
     fix A' J
     assume a:"J \<subseteq> I" "finite J" "J \<noteq> {}" "\<forall>j \<in> J. A' j \<in> A j"
 
     (* F' j is the preimage of A' j under f, restricted to space M. *)
     define F' where "F' = (\<lambda>i. f -` A' i \<inter> space M)"
 
     (* b: the measure of the intersection under distr equals the M-measure of
        the intersection of the preimages. *)
     have "\<Inter> (F' ` J) = f -` (\<Inter> (A' ` J)) \<inter> space M"
       unfolding  set_eq_iff F'_def using a(3) by simp
     moreover have "\<Inter> (A' ` J) \<in> sets N"
       by (metis a sets_A sets.finite_INT subset_iff)
     ultimately have b:
       "measure (distr M N f) (\<Inter> (A' ` J)) = measure M (\<Inter> (F' ` J))"
       by (metis assms(1) measure_distr)
 
     (* c: the product formula for the preimages, from independence of F. *)
     have "\<And>j. j \<in> J \<Longrightarrow> F' j \<in> F j"
       using a(4) F'_def F_def by blast
     hence c:"measure M (\<Inter> (F' ` J)) = (\<Prod>j\<in> J. measure M (F' j))"
       by (metis indep_F indep_setsD a(1,2,3))
 
     (* d: each factor agrees with the corresponding distr measure. *)
     have "\<And>j. j \<in> J \<Longrightarrow> F' j =  f -` A' j  \<inter> space M"
       by (simp add:F'_def)
     moreover have "\<And>j. j \<in> J \<Longrightarrow> A' j \<in> sets N"
       using a(1,4) sets_A by blast
     ultimately have d:
       "\<And>j. j \<in> J \<Longrightarrow> measure M (F' j) = measure (distr M N f) (A' j)"
       using assms(1) measure_distr by metis
 
     show
       "measure (distr M N f) (\<Inter> (A' ` J)) = (\<Prod>j\<in>J. measure (distr M N f) (A' j))"
       using b c d by auto
   qed
   (* Remaining side conditions of indep_setsI. *)
   show "prob_space (distr M N f)" using prob_space_distr assms by blast
   show "\<And>i. i \<in> I \<Longrightarrow> A i \<subseteq> sets (distr M N f)" using sets_A sets_distr by blast
 qed
 
 (* Independence of the variables X' i under the push-forward measure
    distr M N f follows from independence of the compositions X' i o f under M,
    given measurability of f and of each X' i. *)
 lemma (in prob_space) indep_vars_distr:
   assumes "f \<in> measurable M N"
   assumes "\<And>i. i \<in> I \<Longrightarrow> X' i \<in> measurable N (M' i)"
   assumes "indep_vars M' (\<lambda>i. (X' i) \<circ> f) I"
   shows "prob_space.indep_vars (distr M N f) M' X' I"
 proof -
   interpret D: prob_space "(distr M N f)"
     using prob_space_distr[OF assms(1)] by simp
 
   have a: "f \<in> space M \<rightarrow> space N" using assms(1) by (simp add:measurable_def)
 
   (* Independence of the preimage families of the X' i under distr M N f,
      obtained from indep_sets_distr. *)
   have "D.indep_sets (\<lambda>i. {X' i -` A \<inter> space N |A. A \<in> sets (M' i)}) I"
   proof (rule indep_sets_distr[OF assms(1)])
     (* The preimage family of X' i o f is the image, under preimage by f, of
        the preimage family of X' i. *)
     have "\<And>i. i \<in> I \<Longrightarrow> {(X' i \<circ> f) -` A \<inter> space M |A. A \<in> sets (M' i)} =
       (\<lambda>a. f -` a \<inter> space M) ` {X' i -` A \<inter> space N |A. A \<in> sets (M' i)}"
       by (rule set_comp_image_cong, simp add:set_eq_iff, use a in blast)
     thus "indep_sets (\<lambda>i. (\<lambda>a. f -` a \<inter> space M) `
         {X' i -` A \<inter> space N |A. A \<in> sets (M' i)}) I"
       using assms(3) by (simp add:indep_vars_def2 cong:indep_sets_cong)
   next
     fix i
     assume "i \<in> I"
     thus "{X' i -` A \<inter> space N |A. A \<in> sets (M' i)} \<subseteq> sets N"
       using assms(2) measurable_sets by blast
   qed
   thus ?thesis
     using assms by (simp add:D.indep_vars_def2)
 qed
 
 (* The sets of the form F Int A, for arbitrary A, are exactly the subsets of F. *)
 lemma range_inter: "range ((\<inter>) F) = Pow F"
   unfolding image_def by auto
 
 text \<open>The singletons and the empty set form an intersection stable generator of a countable
 discrete $\sigma$-algebra:\<close>
 
 (* For a countable set M, the sigma-algebra generated by the empty set together
    with all singletons of M is the full power set of M. *)
 lemma sigma_sets_singletons_and_empty:
   assumes "countable M"
   shows "sigma_sets M (insert {} ((\<lambda>k. {k}) ` M)) = Pow M"
 proof -
   (* Inclusion Pow M <= ...: the singletons alone already generate Pow M, and
      adding the empty set to the generator can only enlarge the result. *)
   have "sigma_sets M ((\<lambda>k. {k}) ` M) = Pow M"
     using assms sigma_sets_singletons by auto
   hence "Pow M \<subseteq> sigma_sets M (insert {} ((\<lambda>k. {k}) ` M))"
     by (metis sigma_sets_subseteq subset_insertI)
   (* Inclusion ... <= Pow M: the generator is contained in the sigma-algebra
      Pow M. *)
   moreover have "(insert {} ((\<lambda>k. {k}) ` M)) \<subseteq> Pow M" by blast
   hence "sigma_sets M (insert {} ((\<lambda>k. {k}) ` M)) \<subseteq> Pow M"
     by (meson sigma_algebra.sigma_sets_subset sigma_algebra_Pow)
   ultimately show ?thesis by force
 qed
 
 text \<open>In some of the following theorems, the premise @{term "M = measure_pmf p"} is used. This allows stating
 theorems that hold for pmfs more concisely, for example, instead of
 @{term "measure_pmf.prob p A \<le> measure_pmf.prob p B"} we can
 just write @{term "M = measure_pmf p \<Longrightarrow> prob A \<le> prob B"} in the locale @{locale "prob_space"}.\<close>
 
 (* Restricting the measure of a pmf p to its support set_pmf p again yields a
    probability space. *)
 lemma prob_space_restrict_space:
   assumes [simp]:"M = measure_pmf p"
   shows "prob_space (restrict_space M (set_pmf p))"
   by (rule prob_spaceI, auto simp:emeasure_restrict_space emeasure_pmf)
 
 text \<open>The abbreviation below is used to specify the discrete $\sigma$-algebra on @{term "UNIV"}
 as a measure space. It is used in places where the existing definitions, such as @{term "indep_vars"},
 expect a measure space even though only a \emph{measurable} space is really needed, i.e., in cases
 where the property is invariant with respect to the actual measure.\<close>
 
 (* Hide the short name of any existing constant called discrete, so that the
    abbreviation below can introduce it as shorthand for count_space UNIV. *)
 hide_const (open) discrete
 
 abbreviation "discrete \<equiv> count_space UNIV"
 
 (* For a space given by a pmf p, independence of X (with discrete target
    spaces) on the space restricted to set_pmf p implies independence on the
    whole space M. *)
 lemma (in prob_space) indep_vars_restrict_space:
   assumes [simp]:"M = measure_pmf p"
   assumes
     "prob_space.indep_vars (restrict_space M (set_pmf p)) (\<lambda>_. discrete) X I"
   shows "indep_vars (\<lambda>_. discrete) X I"
 proof -
   (* The identity is measurable from the restricted space into M. *)
   have a: "id \<in> restrict_space M (set_pmf p) \<rightarrow>\<^sub>M M"
     by (simp add:measurable_def range_inter sets_restrict_space)
 
   (* Transfer independence to the push-forward of the restricted space along
      id, using indep_vars_distr. *)
   have "prob_space.indep_vars (distr (restrict_space M (set_pmf p)) M id) (\<lambda>_. discrete) X I"
     using assms a prob_space_restrict_space by (auto intro!:prob_space.indep_vars_distr)
   (* That push-forward has the same emeasure as M on every set, hence equals M. *)
   moreover have
     "\<And>A. emeasure (distr (restrict_space M (set_pmf p)) M id) A = emeasure M A"
     using emeasure_distr[OF a]
     by (auto simp add: emeasure_restrict_space emeasure_Int_set_pmf)
   (* NOTE(review): the next statement writes `p` where the surrounding
      statements write `set_pmf p`; presumably this relies on an implicit
      coercion from pmf to set - confirm. *)
   hence "distr (restrict_space M p) M id = M"
     by (auto intro: measure_eqI)
   ultimately show ?thesis by simp
 qed
 
 (* On a space given by a pmf p, two events that contain the same points of the
    support set_pmf p have the same probability. Proved via almost-everywhere
    equality (measure_eq_AE, AE_pmfI). *)
 lemma (in prob_space) measure_pmf_eq:
   assumes "M = measure_pmf p"
   assumes "\<And>x. x \<in> set_pmf p \<Longrightarrow> (x \<in> P) = (x \<in> Q)"
   shows "prob P = prob Q"
   unfolding assms(1)
   by (rule measure_eq_AE, rule AE_pmfI[OF assms(2)], auto)
 
 text \<open>The following lemma is an intro rule for the independence of random variables defined on pmfs.
 In that case it is possible to check the independence of random variables point-wise.
 
 The proof relies on the fact that the support of a pmf is countable and the $\sigma$-algebra of
 such a set can be generated by singletons.\<close>
 
 (* Introduction rule for independence on a pmf: if, for every finite J <= I and
    every assignment a, the probability that all X i (i in J) equal a i is the
    product of the individual probabilities, then the X i are independent
    (with discrete target spaces). *)
 lemma (in prob_space) indep_vars_pmf:
   assumes [simp]:"M = measure_pmf p"
   assumes "\<And>a J. J \<subseteq> I \<Longrightarrow> finite J \<Longrightarrow>
     prob {\<omega>. \<forall>i \<in> J. X i \<omega> = a i} = (\<Prod>i \<in> J. prob {\<omega>. X i \<omega> = a i})"
   shows "indep_vars (\<lambda>_. discrete) X I"
 proof -
   (* R is the probability space restricted to the support of p. *)
   interpret R:prob_space "(restrict_space M (set_pmf p))"
     using prob_space_restrict_space by auto
 
   have events_eq_pow: "R.events = Pow (set_pmf p)"
     by (simp add:sets_restrict_space range_inter)
 
   (* G i: the empty set together with the singletons of the values X i takes
      on the support. F i: the preimages of the members of G i within the
      support. *)
   define G where "G = (\<lambda>i. {{}} \<union> (\<lambda>x. {x}) ` (X i ` set_pmf p))"
   define F where "F = (\<lambda>i. {X i -` a \<inter> set_pmf p|a. a \<in> G i})"
 
   have sigma_sets_pow:
     "\<And>i. i \<in> I \<Longrightarrow> sigma_sets (X i ` set_pmf p) (G i) = Pow (X i ` set_pmf p)"
     by (simp add:G_def, metis countable_image countable_set_pmf sigma_sets_singletons_and_empty)
 
   have F_in_events: "\<And>i. i \<in> I \<Longrightarrow> F i \<subseteq> Pow (set_pmf p)"
     unfolding F_def by blast
 
   (* The family of all preimages of X i within the support is the
      sigma-algebra generated by F i. *)
   have as_sigma_sets:
     "\<And>i. i \<in> I \<Longrightarrow> {u. \<exists>A. u = X i -` A \<inter> set_pmf p} = sigma_sets (set_pmf p) (F i)"
   proof -
     fix i
     assume a:"i \<in> I"
     have "\<And>A. X i -` A \<inter> set_pmf p = X i -` (A \<inter> X i ` set_pmf p) \<inter> set_pmf p"
       by auto
     hence "{u. \<exists>A. u = X i -` A \<inter> set_pmf p} =
           {X i -` A \<inter> set_pmf p |A. A \<subseteq> X i ` set_pmf p}"
       by (metis (no_types, opaque_lifting) inf_le2)
     also have
       "... = {X i -` A \<inter> set_pmf p |A. A \<in> sigma_sets (X i ` set_pmf p) (G i)}"
       using a by (simp add:sigma_sets_pow)
     also have "... = sigma_sets (set_pmf p) {X i -` a \<inter> set_pmf p |a. a \<in> G i}"
       by (subst sigma_sets_vimage_commute[symmetric], auto)
     also have "... = sigma_sets (set_pmf p) (F i)"
       by (simp add:F_def)
     finally show
       "{u. \<exists>A. u = X i -` A \<inter> set_pmf p} = sigma_sets (set_pmf p) (F i)"
       by simp
   qed
 
   (* Each generator F i is closed under intersection. *)
   have F_Int_stable: "\<And>i. i \<in> I \<Longrightarrow> Int_stable (F i)"
   proof (rule Int_stableI)
     fix i a b
     assume "i \<in> I"  "a \<in> F i"  "b \<in> F i"
     thus "a \<inter> b \<in> (F i)"
       unfolding F_def G_def by (cases "a \<inter> b = {}", auto)
   qed
 
   (* The generators are independent in R; this is where the point-wise
      hypothesis assms(2) is used. *)
   have F_indep_sets:"R.indep_sets F I"
   proof (rule R.indep_setsI)
     fix i
     assume "i \<in> I"
     show "F i \<subseteq> R.events"
       unfolding F_def events_eq_pow by blast
   next
     fix A
     fix J
     assume a:"J \<subseteq> I" "J \<noteq> {}" "finite J" "\<forall>j\<in>J. A j \<in> F j"
     have b: "\<And>j. j \<in> J \<Longrightarrow> A j \<subseteq> set_pmf p"
       by (metis PowD a(1,4) subsetD F_in_events)
     (* Each chosen A j is the preimage of some x j from G j. *)
     obtain x where x_def:"\<And>j. j \<in> J  \<Longrightarrow> A j = X j -` x j \<inter> set_pmf p \<and> x j \<in> G j"
       using a by (simp add:Pi_def F_def, metis)
 
     show "R.prob (\<Inter> (A ` J)) = (\<Prod>j\<in>J. R.prob (A j))"
     proof (cases "\<exists>j \<in> J. A j = {}")
       (* Some A j is empty: the intersection is empty as well. *)
       case True
       hence "\<Inter> (A ` J) = {}" by blast
       then show ?thesis
         using a True by (simp, metis measure_empty)
     next
       (* No A j is empty: every x j is a singleton {y j}, so the hypothesis
          applies with the assignment y. *)
       case False
       then have "\<And>j. j \<in> J \<Longrightarrow> x j \<noteq> {}" using x_def by auto
       hence "\<And>j. j \<in> J \<Longrightarrow> x j \<in> (\<lambda>x. {x}) ` X j ` set_pmf p"
         using x_def by (simp add:G_def)
       then obtain y where y_def: "\<And>j. j \<in> J \<Longrightarrow> x j = {y j}"
         by (simp add:image_def, metis)
 
       have "\<Inter> (A ` J) \<subseteq> set_pmf p" using b a(2) by blast
       hence "R.prob (\<Inter> (A ` J)) = prob (\<Inter> j \<in> J. A j)"
         by (simp add: measure_restrict_space)
       also have "... = prob ({\<omega>. \<forall>j \<in> J. X j \<omega> = y j})"
         using a x_def y_def apply (simp add:vimage_def measure_Int_set_pmf)
         by (rule arg_cong2 [where f="measure"], auto)
       also have "... = (\<Prod> j\<in> J. prob (A j))"
         using x_def y_def a assms(2)
         by (simp add:vimage_def measure_Int_set_pmf)
       also have "... = (\<Prod>j\<in>J. R.prob (A j))"
         using b by (simp add: measure_restrict_space cong:prod.cong)
       finally show ?thesis by blast
     qed
   qed
 
   (* Lift independence from the intersection-stable generators to the
      sigma-algebras they generate. *)
   have "R.indep_sets (\<lambda>i. sigma_sets (set_pmf p) (F i)) I"
     using R.indep_sets_sigma[simplified] F_Int_stable F_indep_sets
     by (auto simp:space_restrict_space)
 
   hence "R.indep_sets (\<lambda>i. {u. \<exists>A. u = X i -` A \<inter> set_pmf p}) I"
     by (simp add: as_sigma_sets cong:R.indep_sets_cong)
 
   hence "R.indep_vars (\<lambda>_. discrete) X I"
     unfolding  R.indep_vars_def2
     by (simp add:measurable_def sets_restrict_space range_inter)
 
   (* Transfer from the restricted space R back to M. *)
   thus ?thesis
     using indep_vars_restrict_space[OF assms(1)] by simp
 qed
 
 (* For independent variables X' on a pmf and a finite K <= I, the probability
    that the predicates P x hold for all X' x (x in K) is the product of the
    individual probabilities. *)
 lemma (in prob_space) split_indep_events:
   assumes "M = measure_pmf p"
   assumes "indep_vars (\<lambda>i. discrete) X' I"
   assumes "K \<subseteq> I" "finite K"
   shows "prob {\<omega>. \<forall>x \<in> K. P x (X' x \<omega>)} = (\<Prod>x \<in> K. prob {\<omega>. P x (X' x \<omega>)})"
 proof -
   (* On a pmf the space and the events are UNIV. *)
   have [simp]: "space M = UNIV"  "events = UNIV"  "prob UNIV = 1"
     by (simp add:assms(1))+
 
   (* Restrict independence to K and turn it into independence of events. *)
   have "indep_vars (\<lambda>_. discrete) X' K"
     using assms(2,3) indep_vars_subset by blast
   hence "indep_events (\<lambda>x. {\<omega> \<in> space M. P x (X' x \<omega>)}) K"
     using indep_eventsI_indep_vars by force
   hence a:"indep_events (\<lambda>x. {\<omega>. P x (X' x \<omega>)}) K"
     by simp
 
   (* Rewrite the universally quantified event as an intersection, then apply
      the product formula; the case K = {} is handled separately. *)
   have "prob  {\<omega>. \<forall>x \<in> K. P x (X' x \<omega>)} = prob (\<Inter>x \<in> K. {\<omega>. P x (X' x \<omega>)})"
     by (simp add: measure_pmf_eq[OF assms(1)])
   also have "... =  (\<Prod> x \<in> K. prob {\<omega>. P x (X' x \<omega>)})"
     using a assms(4) by (cases "K = {}", auto simp: indep_events_def)
   finally show ?thesis by simp
 qed
 
 (* For a finite non-empty set A, the measure of pmf_of_set A coincides with
    uniform_measure discrete A. *)
 lemma pmf_of_set_eq_uniform:
   assumes "finite A" "A \<noteq> {}"
   shows "measure_pmf (pmf_of_set A) = uniform_measure discrete A"
 proof -
   have a:"real (card A) > 0" using assms
     by (simp add: card_gt_0_iff)
 
   (* Both measures assign the same emeasure to every set Y. *)
   have b:
     "\<And>Y. emeasure (pmf_of_set A) Y = emeasure (uniform_measure discrete A) Y"
     using assms a
     by (simp add: emeasure_pmf_of_set divide_ennreal ennreal_of_nat_eq_real_of_nat)
 
   show ?thesis
     by (rule measure_eqI, auto simp add: b)
 qed
 
 (* Introduction rule for uniform_on on a pmf: if A is finite and non-empty and
    the probability that X equals a is indicator A a / card A for every a, then
    X is uniformly distributed on A. *)
 lemma (in prob_space) uniform_onI:
   assumes "M = measure_pmf p"
   assumes "finite A" "A \<noteq> {}"
   assumes "\<And>a. prob {\<omega>. X \<omega> = a} = indicator A a / card A"
   shows "uniform_on X A"
 proof -
   have a:"\<And>a. measure_pmf.prob p {x. X x = a} = indicator A a / card A"
     using assms(1,4) by simp
 
   (* The point-wise hypothesis identifies map_pmf X p with pmf_of_set A. *)
   have b:"map_pmf X p = pmf_of_set A"
     by (rule pmf_eqI, simp add:assms pmf_map vimage_def a)
 
   (* Chain: distr M discrete X = map_pmf X p = pmf_of_set A = uniform measure. *)
   have "distr M discrete X = map_pmf X p"
     by (simp add: map_pmf_rep_eq assms(1))
   also have "... = measure_pmf (pmf_of_set A)"
     using b by simp
   also have "... =  uniform_measure discrete A"
     by (rule pmf_of_set_eq_uniform[OF assms(2,3)])
   finally have "distr M discrete X = uniform_measure discrete A"
     by simp
   moreover have "random_variable discrete X"
     by (simp add: assms(1))
   ultimately show  ?thesis using assms(2,3)
     by (simp add: uniform_on_def)
 qed
 
 end