diff --git a/thys/Concentration_Inequalities/Bennett_Inequality.thy b/thys/Concentration_Inequalities/Bennett_Inequality.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/Bennett_Inequality.thy
@@ -0,0 +1,550 @@
+section \<open>Bennett's Inequality\<close>
+
+text \<open>In this section we verify Bennett's inequality~\cite{bennett1962} and a (weak) version of
+Bernstein's inequality as a corollary. Both inequalities give concentration bounds for sums of
+independent random variables. The statement and proofs follow a summary paper by
+Boucheron et al.~\cite{DBLP:conf/ac/BoucheronLB03}.\<close>
+
+theory Bennett_Inequality
+  imports Concentration_Inequalities_Preliminary
+begin
+
+context prob_space
+begin
+
+(* Chernoff bound restated for a finite family of independent real random
+   variables.  For s >= 0, the probability that the centred sum
+   SUM i:I. (X i - E[X i]) is at least t is bounded by exp (-s*t) times the
+   product over I of the centred exponential moments
+   E[exp (s * (X i - E[X i]))].
+   Assumption int requires every exp (s * X i) to be integrable. *)
+lemma indep_vars_Chernoff_ineq_ge:
+  assumes I: "finite I"
+  assumes ind: "indep_vars (\<lambda> _. borel) X I"
+  assumes sge: "s \<ge> 0"
+  assumes int: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. exp (s * X i x))"
+  shows "prob {x \<in> space M. (\<Sum>i \<in>I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (-s*t) *
+    (\<Prod>i\<in>I. expectation (\<lambda>x. exp(s * (X i x - expectation (X i)))))"
+proof (cases "s = 0")
+  (* Degenerate parameter s = 0: discharged by simp together with prob_space *)
+  case [simp]: True
+  thus ?thesis
+    by (simp add: prob_space)
+next
+  case False
+  then have s: "s > 0" using sge by auto
+
+  (* Measurability of each X i is part of the independence assumption *)
+  have [measurable]: "\<And>i. i \<in> I \<Longrightarrow> random_variable borel (X i)"
+    using ind unfolding indep_vars_def by blast
+
+  (* Independence is kept when each X i is centred, scaled by s and exponentiated *)
+  have indep1: "indep_vars (\<lambda>_. borel)
+     (\<lambda>i \<omega>. exp (s * (X i \<omega> - expectation (X i)))) I"
+    apply (intro indep_vars_compose[OF ind, unfolded o_def])
+    by auto
+
+  (* S abbreviates the centred sum that occurs in the goal *)
+  define S where "S = (\<lambda>x. (\<Sum>i \<in>I. X i x - expectation (X i)))"
+
+  (* Integrability of the centred exponentials follows from assumption int *)
+  have int1: "\<And>i. i \<in> I \<Longrightarrow>
+         integrable M (\<lambda>\<omega>. exp (s * (X i \<omega> - expectation (X i))))"
+    by (auto simp add: algebra_simps exp_diff int)
+
+  (* exp of the scaled sum is the product of the individual exponentials *)
+  have eprod: "\<And>x. exp (s * S x) = (\<Prod>i\<in>I. exp(s * (X i x - expectation (X i))))"
+     unfolding S_def
+     by (simp add: assms(1) exp_sum vector_space_over_itself.scale_sum_right)
+
+  from indep_vars_integrable[OF I indep1 int1]
+  have intS: "integrable M (\<lambda>x. exp (s * S x))"
+    unfolding eprod by auto
+
+  (* Same fact phrased as a set integral over the whole space, the form
+     in which it is passed to Chernoff_ineq_ge below *)
+  then have si: "set_integrable M (space M) (\<lambda>x. exp (s * S x))"
+    unfolding set_integrable_def
+    apply (intro integrable_mult_indicator)
+    by auto
+
+  (* Apply the general Chernoff inequality to S with parameter s > 0 *)
+  from Chernoff_ineq_ge[OF s si]
+  have "prob {x \<in> space M. S x \<ge> t} \<le> exp (- s * t) * (\<integral>x\<in>space M. exp (s * S x)\<partial>M)"
+    by auto
+
+  also have "(\<integral>x\<in>space M. exp (s * S x)\<partial>M) = expectation (\<lambda>x. exp(s * S x))"
+     unfolding set_integral_space[OF intS] by auto
+
+  also have "... = expectation (\<lambda>x. \<Prod>i\<in>I. exp(s * (X i x - expectation (X i))))"
+     unfolding S_def
+     by (simp add: assms(1) exp_sum vector_space_over_itself.scale_sum_right)
+  (* The expectation of the product factorises by independence *)
+  also have "... = (\<Prod>i\<in>I. expectation (\<lambda>x. exp(s * (X i x - expectation (X i)))))"
+     apply (intro indep_vars_lebesgue_integral[OF I indep1 int1]) .
+  finally show ?thesis
+    unfolding S_def
+    by auto
+qed
+
+(* The real function h u = (1 + u) * ln (1 + u) - u; it appears in the
+   exponent of the bounds stated in bennett_inequality_1 and
+   bennett_inequality below. *)
+definition bennett_h::"real \<Rightarrow> real"
+  where "bennett_h u = (1 + u) * ln (1 + u) - u"
+
+(* Series form of exp with its first two Taylor terms removed:
+   exp x - x - 1 equals the infinite sum of x^(n+2) / fact (n+2) over n,
+   and (second conclusion) that series is summable. *)
+lemma exp_sub_two_terms_eq:
+  fixes x :: real
+  shows "exp x - x - 1 = (\<Sum>n. x^(n+2) / fact (n+2))"
+    "summable (\<lambda>n. x^(n+2) / fact (n+2))"
+proof -
+  (* The first two terms of the exponential series add up to 1 + x *)
+  have "(\<Sum>i<2. inverse (fact i) * x ^ i) = 1 + x"
+    by (simp add:numeral_eq_Suc)
+  (* Split those two terms off the series that defines exp *)
+  thus "exp x - x - 1 = (\<Sum>n. x^(n+2) / fact (n+2))"
+    unfolding exp_def
+    apply (subst suminf_split_initial_segment[where k = 2])
+    by (auto simp add: summable_exp divide_inverse_commute)
+  (* Summability: shift the summable exponential series by two indices *)
+  have "summable (\<lambda>n. x^n / fact n)"
+    by (simp add: divide_inverse_commute summable_exp)
+  then have "summable (\<lambda>n. x^(Suc (Suc n)) / fact (Suc (Suc n)))"
+    apply (subst summable_Suc_iff)
+    apply (subst summable_Suc_iff)
+    by auto
+  thus "summable (\<lambda>n. x^(n+2) / fact (n+2))" by auto
+qed
+
+(* Monotonicity of f x = (exp x - x - 1) - x^2 / 2 on the reals:
+   a <= b implies f a <= f b.  Used in psi_inequality. *)
+lemma psi_mono:
+  defines "f \<equiv> (\<lambda>x. (exp x - x - 1) - x^2 / 2)"
+  assumes xy: "a \<le> (b::real)"
+  shows "f a \<le> f b"
+proof -
+  (* The derivative of f at x is exp x - x - 1 *)
+  have 1: "(f has_real_derivative (exp x - x - 1)) (at x)" for x
+    unfolding f_def
+    by (auto intro!: derivative_eq_intros)
+
+  (* That derivative is nonnegative (stated here only on the interval a..b) *)
+  have 2: "\<And>x. x \<in> {a..b} \<Longrightarrow> 0 \<le> exp x - x - 1"
+    by (smt (verit) exp_ge_add_one_self)
+
+  (* A nonnegative derivative on a..b gives f a <= f b *)
+  from deriv_nonneg_imp_mono[OF 1 2 xy]
+  show ?thesis by auto
+qed
+
+(* Comparison of psi u = exp u - u - 1 at two points: for x <= y with
+   y >= 0 we have  y^2 * psi x <= x^2 * psi y.
+   TODO: not sure if this holds for y < 0 too.
+   NOTE(review): the hypothesis y >= 0 is what the two smt steps below are
+   given; the statement presumably extends to all real y (the quotient
+   psi u / u^2 is expected to be nondecreasing), but that is not proved
+   here -- confirm before relaxing the assumption. *)
+lemma psi_inequality:
+  assumes le: "x \<le> (y::real)" "y \<ge> 0"
+  shows "y^2 * (exp x - x - 1) \<le> x^2 * (exp y - y - 1)"
+proof -
+
+  (* Series expansions (and summability) of psi at x and at y *)
+  have x: "exp x - x - 1 = (\<Sum>n. (x^(n+2) / fact (n+2)))"
+    "summable (\<lambda>n. x^(n+2) / fact (n+2))"
+    using exp_sub_two_terms_eq .
+
+  have y: "exp y - y - 1 = (\<Sum>n. (y^(n+2) / fact (n+2)))"
+    "summable (\<lambda>n. y^(n+2) / fact (n+2))"
+    using exp_sub_two_terms_eq .
+
+  (* Simplify the expressions in the inequality *)
+  (* l / ls: left-hand side as a series, and its summability *)
+  have l:"y^2 * (exp x - x - 1) = (\<Sum>n. y^2 * (x^(n+2) / fact (n+2)))"
+    using x
+    apply (subst suminf_mult)
+    by auto
+  have ls: "summable (\<lambda>n. y^2 * (x^(n+2) / fact (n+2)))"
+    by (intro summable_mult[OF x(2)])
+
+  (* r / rs: right-hand side as a series, and its summability *)
+  have r:"x^2 * (exp y - y - 1) = (\<Sum>n. x^2 * (y^(n+2) / fact (n+2)))"
+    using y
+    apply (subst suminf_mult)
+    by auto
+  have rs: "summable (\<lambda>n. x^2 * (y^(n+2) / fact (n+2)))"
+    by (intro summable_mult[OF y(2)])
+
+  (* Case distinction on which of x, y has the larger absolute value *)
+  have "\<bar>x\<bar> \<le> \<bar>y\<bar> \<or> \<bar>y\<bar> < \<bar>x\<bar>" by auto
+  moreover {
+    (* Case 1: compare the two series term by term *)
+    assume "\<bar>x\<bar> \<le> \<bar>y\<bar>"
+    then have "x^ n \<le> y ^n" for n
+    by (smt (verit, ccfv_threshold) bot_nat_0.not_eq_extremum le power_0 real_root_less_mono real_root_power_cancel root_abs_power)
+    then have "(x^2 * y^2) * x^n \<le> (x^2 * y^2) * y^n" for n
+      by (simp add: mult_left_mono)
+    then have "y\<^sup>2 * (x ^ (n + 2)) \<le> x\<^sup>2 * (y ^ (n + 2))" for n
+      by (metis (full_types) ab_semigroup_mult_class.mult_ac(1) mult.commute power_add)
+    then have "y\<^sup>2 * (x ^ (n + 2)) / fact (n+2)\<le> x\<^sup>2 * (y ^ (n + 2)) / fact (n+2)" for n
+      by (meson divide_right_mono fact_ge_zero)
+    then have "(\<Sum>n. y^2 * (x^(n+2) / fact (n+2))) \<le> (\<Sum>n. x^2 * (y^(n+2) / fact (n+2)))"
+      apply (intro suminf_le[OF _ ls rs])
+      by auto
+    then have "y^2 * (exp x - x - 1) \<le> x^2 * (exp y - y - 1)"
+    using l r by presburger
+  }
+  moreover {
+    (* Case 2: use monotonicity of psi u - u^2 / 2 (psi_mono) *)
+    assume ineq: "\<bar>y\<bar> < \<bar>x\<bar>"
+
+    from psi_mono[OF assms(1)]
+    have "(exp x - x - 1) - x^2 /2 \<le> (exp y - y - 1) - y^2/2" .
+
+    then have "y^2 * ((exp x - x - 1) - x^2 /2) \<le> x^2 * ((exp y - y - 1) - y^2/2)"
+      by (smt (verit, best) ineq diff_divide_distrib exp_lower_Taylor_quadratic le(1) le(2) mult_nonneg_nonneg one_less_exp_iff power_zero_numeral prob_space.psi_mono prob_space_completion right_diff_distrib zero_le_power2)
+
+    (* The quadratic correction terms cancel on both sides *)
+    then have "y^2 * (exp x - x - 1) \<le> x^2 * (exp y - y - 1)"
+      by (simp add: mult.commute right_diff_distrib)
+  }
+  ultimately show ?thesis by auto
+qed
+
+(* Helper lemma, starting with normalized variables *)
+(* Bennett's inequality for variables bounded above by 1 almost everywhere:
+   for a finite independent family X with square-integrable members and
+   t >= 0, the probability that the centred sum is at least t is at most
+   exp (-V * bennett_h (t / V)), where V is the sum of the second moments
+   E[(X i)^2].  The general bound B > 0 is handled in bennett_inequality. *)
+lemma bennett_inequality_1:
+  assumes I: "finite I"
+  assumes ind: "indep_vars (\<lambda> _. borel) X I"
+  assumes intsq: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. (X i x)^2)"
+  assumes bnd: "\<And>i. i \<in> I \<Longrightarrow> AE x in M. X i x \<le> 1"
+  assumes t: "t \<ge> 0"
+  defines "V \<equiv> (\<Sum>i \<in> I. expectation(\<lambda>x. X i x^2))"
+  shows "prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (-V * bennett_h (t / V))"
+proof (cases "V = 0")
+  (* V = 0 is closed by auto.  NOTE(review): presumably the right-hand side
+     collapses to exp 0 = 1 in this case -- not spelled out in the proof. *)
+  case True
+  then show ?thesis
+    by auto
+next
+  case f: False
+  have "V \<ge> 0"
+    unfolding V_def
+    apply (intro sum_nonneg  integral_nonneg_AE)
+    by auto
+  then have Vpos: "V > 0" using f by auto
+
+  (* l is the parameter passed as s to indep_vars_Chernoff_ineq_ge below *)
+  define l :: real where "l = ln(1 + t / V)"
+  then have l: "l \<ge> 0"
+    using t Vpos by auto
+  have rv[measurable]: "\<And>i. i \<in> I \<Longrightarrow> random_variable borel (X i)"
+    using ind unfolding indep_vars_def by blast
+
+  (* psi is exp with its constant and linear Taylor terms removed *)
+  define \<psi> where "\<psi> = (\<lambda>x::real. exp(x) - x - 1)"
+
+  have rw: "exp y = 1 + y + \<psi> y" for y
+    unfolding \<psi>_def by auto
+
+  (* Since X i <= 1 a.e. and l >= 0, exp (l * X i) is bounded by exp l a.e. *)
+  have ebnd: "\<And>i. i \<in> I \<Longrightarrow>
+         AE x in M. exp (l * X i x) \<le> exp l"
+     apply (drule bnd)
+     using l by (auto simp add: mult_left_le)
+
+  (* integrability *)
+  have int: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. (X i x))"
+  using rv intsq square_integrable_imp_integrable by blast
+
+  have intl: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. (l * X i x))"
+    using int by blast
+
+  have intexpl: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. exp (l * X i x))"
+    apply (intro integrable_const_bound[where B = "exp l"])
+    using ebnd by auto
+
+  have intpsi: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. \<psi> (l * X i x))"
+    unfolding \<psi>_def
+    using intl intexpl by auto
+
+  (* Key estimate: E[psi (l * X i)] <= psi l * E[(X i)^2], obtained from
+     psi_inequality applied pointwise (a.e.) with x := l * X i and y := l *)
+  have **: "\<And>i. i \<in> I \<Longrightarrow>
+    expectation (\<lambda>x. \<psi> (l * X i x)) \<le> \<psi> l * expectation (\<lambda>x. (X i x)^2)"
+  proof -
+    fix i assume i: "i \<in> I"
+    then have "AE x in M. l * X i x \<le> l"
+      using ebnd by auto
+    then have "AE x in M. l^2 * \<psi> (l * X i x) \<le> (l * X i x)^2 * \<psi> l"
+      using psi_inequality[OF _ l] unfolding \<psi>_def
+      by auto
+    then have "AE x in M. l^2 * \<psi> (l * X i x) \<le> l^2 * (\<psi> l * (X i x)^2)"
+      by (auto simp add: field_simps)
+    (* Cancel the common factor l^2 *)
+    then have "AE x in M. \<psi> (l * X i x) \<le> \<psi> l * (X i x)^2 "
+      by (smt (verit, best) AE_cong \<psi>_def exp_eq_one_iff mult_cancel_left mult_eq_0_iff mult_left_mono zero_eq_power2 zero_le_power2)
+    then have "AE x in M. 0 \<le> \<psi> l * (X i x)^2 - \<psi> (l * X i x) "
+      by auto
+    (* Integrate the a.e. nonnegative difference and split the integral *)
+    then have "expectation (\<lambda>x. \<psi> l * (X i x)^2 + (- \<psi> (l * X i x))) \<ge> 0"
+      by (simp add: integral_nonneg_AE)
+    also have "expectation (\<lambda>x. \<psi> l * (X i x)^2 + (- \<psi> (l * X i x))) =
+        \<psi> l * expectation (\<lambda>x. (X i x)^2) - expectation (\<lambda>x. \<psi> (l * X i x))"
+      apply (subst Bochner_Integration.integral_add)
+      using intpsi[OF i] intsq[OF i] by auto
+    finally show "expectation (\<lambda>x. \<psi> (l * X i x)) \<le> \<psi> l * expectation (\<lambda>x. (X i x)^2)"
+      by auto
+  qed
+
+  (* Analyzing the expectation *)
+  (* Per-index bound on the exponential moment E[exp (l * X i)] *)
+  then have *: "\<And>i. i \<in> I \<Longrightarrow>
+      expectation (\<lambda>x. exp (l * X i x)) \<le>
+      exp (l * expectation (X i)) * exp (\<psi> l * expectation (\<lambda>x. X i x^2))"
+  proof -
+    fix i
+    assume iI: "i \<in> I"
+    (* Expand exp via rw and use linearity of the expectation *)
+    have "expectation (\<lambda>x. exp (l * X i x)) =
+      1 + l * expectation (\<lambda>x. X i x) +
+       expectation (\<lambda>x. \<psi> (l * X i x))"
+      unfolding rw
+      apply (subst Bochner_Integration.integral_add)
+      using iI intl intpsi apply auto[2]
+      apply (subst Bochner_Integration.integral_add)
+      using intl iI prob_space by auto
+    also have "... = l * expectation (X i) + 1 + expectation (\<lambda>x. \<psi> (l * X i x))"
+      by auto
+    (* Insert the key estimate proved above *)
+    also have "... \<le> 1 + l * expectation (X i) + \<psi> l * expectation (\<lambda>x. X i x^2)"
+      using **[OF iI] by auto
+    (* Bound 1 + a + b by exp a * exp b *)
+    also have "... \<le> exp (l * expectation (X i)) * exp (\<psi> l  * expectation (\<lambda>x. X i x^2))"
+      by (simp add: is_num_normalize(1) mult_exp_exp)
+    finally show "expectation (\<lambda>x. exp (l * X i x)) \<le>
+      exp (l * expectation (X i)) * exp (\<psi> l  * expectation (\<lambda>x. X i x^2))" .
+  qed
+
+  (* Multiply the per-index bounds over I; the second factor becomes
+     exp (psi l * V) by the definition of V *)
+  have "(\<Prod>i\<in>I. expectation (\<lambda>x. exp (l * (X i x)))) \<le>
+    (\<Prod>i\<in>I. exp (l * expectation (X i)) * exp (\<psi> l  * expectation (\<lambda>x. X i x^2)))"
+    by (auto intro!: prod_mono simp add: *)
+  also have "... =
+    (\<Prod>i\<in>I. exp (l * expectation (X i))) * (\<Prod>i\<in>I. exp (\<psi> l  * expectation (\<lambda>x. X i x^2)))"
+    by (auto simp add: prod.distrib)
+  (* Note: the fact name used for the key estimate above is rebound here
+     to the product bound *)
+  finally have **:
+    "(\<Prod>i\<in>I. expectation (\<lambda>x. exp (l * (X i x)))) \<le>
+    (\<Prod>i\<in>I. exp (l * expectation (X i))) * exp (\<psi> l * V)"
+    by (simp add: V_def I exp_sum sum_distrib_left)
+
+  (* Chernoff bound with parameter l, then separate the centring factors *)
+  from indep_vars_Chernoff_ineq_ge[OF I ind l intexpl]
+  have "prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (- l * t) *
+     (\<Prod>i\<in>I. expectation (\<lambda>x. exp (l * (X i x - expectation (X i)))))"
+     by auto
+  also have "(\<Prod>i\<in>I. expectation (\<lambda>x. exp (l * (X i x - expectation (X i))))) =
+    (\<Prod>i\<in>I. expectation (\<lambda>x. exp (l * (X i x))) * exp (- l * expectation (X i)))"
+    by (auto intro!: prod.cong simp add: field_simps exp_diff exp_minus_inverse)
+  also have "... =
+     (\<Prod>i\<in>I. exp (- l * expectation (X i))) * (\<Prod>i\<in>I. expectation (\<lambda>x. exp (l * (X i x))))"
+    by (auto simp add: prod.distrib)
+  also have "... \<le>
+     (\<Prod>i\<in>I. exp (- l * expectation (X i))) * ((\<Prod>i\<in>I. exp (l * expectation (X i))) * exp (\<psi> l * V))"
+    apply (intro mult_left_mono[OF **])
+    by (meson exp_ge_zero prod_nonneg)
+  (* The products of exp (- l * E[X i]) and exp (l * E[X i]) cancel *)
+  also have "... = exp (\<psi> l * V)"
+    apply (simp add: prod.distrib [symmetric])
+    by (smt (verit, ccfv_threshold) exp_minus_inverse prod.not_neutral_contains_not_neutral)
+  finally have "
+    prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (\<psi> l * V - l * t)"
+    by (simp add:mult_exp_exp)
+  (* With l = ln (1 + t / V) the exponent equals -V * bennett_h (t / V) *)
+  also have "\<psi> l * V - l * t = -V * bennett_h (t / V)"
+    unfolding \<psi>_def l_def bennett_h_def
+    apply (subst exp_ln)
+    subgoal by (smt (verit) Vpos divide_nonneg_nonneg t)
+    by (auto simp add: algebra_simps)
+  finally show ?thesis .
+qed
+
+(* Almost-everywhere inequalities between real-valued functions can be
+   summed over an index set I: if f i <= g i holds a.e. for every i in I,
+   then the sums over I satisfy the same inequality a.e. *)
+lemma real_AE_le_sum:
+  assumes "\<And>i. i \<in> I \<Longrightarrow> AE x in M. f i x \<le> (g i x::real)"
+  shows "AE x in M. (\<Sum>i\<in>I. f i x) \<le> (\<Sum>i\<in>I. g i x)"
+proof (cases)
+  (* Finite I: combine the finitely many a.e. statements, then use sum_mono *)
+  assume "finite I"
+  with AE_finite_allI[OF this assms] have 0:"AE x in M. (\<forall>i\<in>I. f i x \<le> g i x)" by auto
+  show ?thesis by (intro eventually_mono[OF 0] sum_mono) auto
+  (* The remaining case (I not finite) is closed by simp *)
+qed simp
+
+(* Equality version of real_AE_le_sum: if f i = g i holds a.e. for every
+   i in I, then the sums over I agree a.e.  Proved by applying
+   real_AE_le_sum in both directions. *)
+lemma real_AE_eq_sum:
+  assumes "\<And>i. i \<in> I \<Longrightarrow> AE x in M. f i x = (g i x::real)"
+  shows "AE x in M. (\<Sum>i\<in>I. f i x) = (\<Sum>i\<in>I. g i x)"
+proof -
+  (* Direction <= *)
+  have 1: "AE x in M. (\<Sum>i\<in>I. f i x) \<le> (\<Sum>i\<in>I. g i x)"
+    apply (intro real_AE_le_sum)
+    apply (drule assms)
+    by auto
+  (* Direction >= *)
+  have 2: "AE x in M. (\<Sum>i\<in>I. g i x) \<le> (\<Sum>i\<in>I. f i x)"
+    apply (intro real_AE_le_sum)
+    apply (drule assms)
+    by auto
+  show ?thesis
+    using 1 2
+    by auto
+qed
+
+(* Bennett's inequality for a finite independent family X of
+   square-integrable variables with X i <= B almost everywhere, B > 0:
+   for t >= 0 the probability that the centred sum is at least t is at most
+   exp (- V / B^2 * bennett_h (t * B / V)), with V the sum of the second
+   moments E[(X i)^2].  Proved by rescaling to Y i = X i / B and applying
+   bennett_inequality_1.
+   Original note: B = 0 case trivial.
+   NOTE(review): the theorem itself assumes B > 0; the note presumably
+   explains why B = 0 is left out -- confirm. *)
+theorem bennett_inequality:
+  assumes I: "finite I"
+  assumes ind: "indep_vars (\<lambda> _. borel) X I"
+  assumes intsq: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. (X i x)^2)"
+  assumes bnd: "\<And>i. i \<in> I \<Longrightarrow> AE x in M. X i x \<le> B"
+  assumes t: "t \<ge> 0"
+  assumes B: "B > 0"
+  defines "V \<equiv> (\<Sum>i \<in> I. expectation (\<lambda>x. X i x^2))"
+  shows "prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (- V / B^2 * bennett_h (t * B / V))"
+proof -
+  (* Normalised variables, bounded above by 1 a.e. (fact 3 below) *)
+  define Y where "Y = (\<lambda>i x. X i x / B)"
+
+  (* Facts 1-4 are the hypotheses of bennett_inequality_1 for the family Y
+     and the threshold t / B *)
+  from indep_vars_compose[OF ind, where Y = "\<lambda>i x. x/ B"]
+  have 1: "indep_vars (\<lambda>_. borel) Y I"
+    unfolding Y_def by (auto simp add: o_def)
+  have 2: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. (Y i x)\<^sup>2)"
+    unfolding Y_def apply (drule intsq)
+    by (auto simp add: field_simps)
+  have 3: "\<And>i. i \<in> I \<Longrightarrow> AE x in M. Y i x \<le> 1"
+    unfolding Y_def apply (drule bnd)
+    using B by auto
+  have 4:"0 \<le> t / B" using t B by auto
+
+  (* rw1-rw4 translate the statement about Y back into X, V and B *)
+  have rw1: "(\<Sum>i\<in>I. Y i x - expectation (Y i)) =
+    (\<Sum>i\<in>I. X i x - expectation (X i)) / B" for x
+    unfolding Y_def
+    by (auto simp: diff_divide_distrib sum_divide_distrib)
+
+  have rw2: "expectation (\<lambda>x. (Y i x)\<^sup>2) =
+    expectation (\<lambda>x. (X i x)\<^sup>2) / B^2" for i
+    unfolding Y_def
+    by (simp add: power_divide)
+
+  have rw3:"- (\<Sum>i\<in>I. expectation (\<lambda>x. (X i x)\<^sup>2) / B^2) = - V / B^2"
+    unfolding V_def
+    by (auto simp add: sum_divide_distrib)
+
+  have "t / B / (\<Sum>i\<in>I. expectation (\<lambda>x. (X i x)\<^sup>2) / B^2) =
+    t / B / (V / B^2)"
+    unfolding V_def
+    by (auto simp add: sum_divide_distrib)
+  then have rw4: "t / B / (\<Sum>i\<in>I. expectation (\<lambda>x. (X i x)\<^sup>2) / B^2) =
+      t * B / V"
+      by (simp add: power2_eq_square)
+  (* Dividing both sides of the event's inequality by B > 0 does not change it *)
+  have "prob {x \<in> space M. t \<le> (\<Sum>i\<in>I. X i x - expectation (X i))} =
+    prob{x \<in> space M. t / B \<le> (\<Sum>i\<in>I. X i x - expectation (X i)) / B}"
+    by (smt (verit, best) B Collect_cong divide_cancel_right divide_right_mono)
+  also have "... \<le>
+    exp (- V / B\<^sup>2 *
+          bennett_h (t * B / V))"
+    using bennett_inequality_1[OF I 1 2 3 4]
+    unfolding rw1 rw2 rw3 rw4 .
+  finally show ?thesis .
+qed
+
+(* Lower bound on bennett_h used to derive Bernstein's inequality:
+   for x >= 0,  x^2 / (2 * (1 + x / 3)) <= bennett_h x.
+   Strategy: the difference g has g 0 = 0 and g' 0 = 0, and g'' >= 0 on
+   x >= 0, so g' and then g are nonnegative there. *)
+(* This proof follows https://math.stackexchange.com/a/4066844 *)
+lemma bennett_h_bernstein_bound:
+  assumes "x \<ge> 0"
+  shows "bennett_h x \<ge> x^2 / (2 * (1 + x / 3))"
+proof -
+  (* Rewrite the rational lower bound in a form that is easier to differentiate *)
+  have eq:"x^2 / (2 * (1 + x / 3)) = 3/2 * x - 9/2 * (x / (x+3))"
+    using assms
+    by (sos "(() & ())")
+
+  (* g is bennett_h minus the (rewritten) lower bound *)
+  define g where "g = (\<lambda>x. bennett_h x - (3/2 * x - 9/2 * (x / (x+3))))"
+
+  (* g' and g'' are shown below (facts 1 and 2) to be the first and second
+     derivative of g for x >= 0 *)
+  define g' where "g' = (\<lambda>x::real.
+    ln(1 + x) +  27 / (2 * (x+3)^2) - 3 / 2)"
+  define g'' where "g'' = (\<lambda>x::real.
+      1 / (1 + x) - 27  / (x+3)^3)"
+
+  (* Auxiliary arithmetic identity used by the derivative computation in fact 1 *)
+  have "54 / ((2 * x + 6)^2) = 27 / (2 * (x + 3)\<^sup>2)" (is "?L = ?R") for x :: real
+  proof -
+    have "?L = 54 / (2^2 * (x + 3)^2)"
+      unfolding power_mult_distrib[symmetric] by (simp add:algebra_simps)
+    also have "... = ?R" by simp
+    finally show ?thesis by simp
+  qed
+
+  hence 1: "x \<ge> 0 \<Longrightarrow> (g has_real_derivative (g' x)) (at x)" for x
+    unfolding g_def g'_def bennett_h_def by (auto intro!: derivative_eq_intros simp:power2_eq_square)
+  have 2: "x \<ge> 0 \<Longrightarrow> (g' has_real_derivative (g'' x)) (at x)" for x
+    unfolding g'_def g''_def
+    apply (auto intro!: derivative_eq_intros)[1]
+    by (sos "(() & ())")
+
+  (* Both g and g' vanish at 0 *)
+  have gz: "g 0 = 0"
+    unfolding g_def bennett_h_def by auto
+  have g1z: "g' 0 = 0"
+    unfolding g'_def by auto
+
+  (* g'' is nonnegative for x >= 0, via 27 * (1+x) <= (x+3)^3 *)
+  have p2: "g'' x  \<ge> 0" if "x \<ge> 0" for x
+  proof -
+    have "27 * (1+x) \<le> (x+3)^3"
+      using that unfolding power3_eq_cube by (auto simp:algebra_simps)
+    hence " 27 / (x + 3) ^ 3 \<le> 1 / (1+x)"
+      using that by (subst frac_le_eq) (auto intro!:divide_nonpos_pos)
+    thus ?thesis unfolding g''_def by simp
+  qed
+
+  (* Hence g' is monotone on x >= 0 and, since g' 0 = 0, nonnegative *)
+  from deriv_nonneg_imp_mono[OF 2 p2 _]
+  have "x \<ge> 0 \<Longrightarrow> g' x \<ge> 0" for x using g1z
+    by (metis atLeastAtMost_iff)
+
+  (* The same argument one level up gives g >= 0 on x >= 0 *)
+  from deriv_nonneg_imp_mono[OF 1 this _]
+  have "x \<ge> 0 \<Longrightarrow> g x \<ge> 0" for x using gz
+    by (metis atLeastAtMost_iff)
+
+  thus ?thesis
+  using assms eq g_def by force
+qed
+
+(* If the second moments E[(X j)^2] over a finite index set I sum to 0,
+   then each member X i (i in I, with (X i)^2 integrable) is 0 almost
+   everywhere.  Used for the V = 0 case of bernstein_inequality. *)
+lemma sum_sq_exp_eq_zero_imp_zero:
+  assumes "finite I" "i \<in> I"
+  assumes intsq: "integrable M (\<lambda>x. (X i x)^2)"
+  assumes "(\<Sum>i \<in> I. expectation (\<lambda>x. X i x^2)) = 0"
+  shows "AE x in M. X i x = (0::real)"
+proof -
+  (* A sum of nonnegative terms is 0 only if every term is 0 *)
+  have "(\<forall>i \<in>I. expectation (\<lambda>x. X i x^2) = 0)"
+    using assms
+    apply (subst sum_nonneg_eq_0_iff[symmetric])
+    by auto
+  then have "expectation (\<lambda>x. X i x^2) = 0"
+    using assms(2) by blast
+  (* An integrable nonnegative function with integral 0 vanishes a.e. *)
+  thus ?thesis
+    using integral_nonneg_eq_0_iff_AE[OF intsq]
+    by auto
+qed
+
+(* Bernstein-type inequality derived from bennett_inequality: under the
+   same hypotheses (finite independent family, square-integrable,
+   X i <= B a.e., B > 0, t >= 0), the probability that the centred sum is
+   at least t is at most exp (- (t^2 / (2 * (V + t * B / 3)))), where V is
+   the sum of the second moments E[(X i)^2]. *)
+corollary bernstein_inequality:
+  assumes I: "finite I"
+  assumes ind: "indep_vars (\<lambda> _. borel) X I"
+  assumes intsq: "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>x. (X i x)^2)"
+  assumes bnd: "\<And>i. i \<in> I \<Longrightarrow> AE x in M. X i x \<le> B"
+  assumes t: "t \<ge> 0"
+  assumes B: "B > 0"
+  defines "V \<equiv> (\<Sum>i \<in> I. expectation (\<lambda>x. X i x^2))"
+  shows "prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (- (t^2 / (2 * (V + t * B / 3))))"
+proof (cases "V = 0")
+  (* Case V = 0: every X i is 0 a.e., hence so is the centred sum *)
+  case True
+  then have 1:"\<And>i. i \<in> I \<Longrightarrow> AE x in M. X i x = 0"
+    unfolding V_def
+    using sum_sq_exp_eq_zero_imp_zero
+    by (metis I intsq)
+  then have 2:"\<And>i. i \<in> I \<Longrightarrow> expectation (X i) = 0"
+    using integral_eq_zero_AE by blast
+
+  have "AE x in M. (\<Sum>i \<in> I. X i x - expectation (X i)) = (\<Sum>i \<in> I. 0)"
+      apply (intro real_AE_eq_sum)
+      using 1 2
+      by auto
+  then have *: "AE x in M. (\<Sum>i \<in> I. X i x - expectation (X i)) = 0"
+    by force
+
+  moreover {
+    (* For t > 0 the event has probability 0, so any nonnegative bound works *)
+    assume "t > 0"
+    then have "prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} = 0"
+      apply (intro prob_eq_0_AE)
+      using * by auto
+    then have ?thesis by auto
+  }
+  (* The remaining sub-case t = 0 is closed by auto *)
+  ultimately show ?thesis
+    apply (cases "t = 0") using t by auto
+next
+  (* Case V > 0: combine bennett_inequality with bennett_h_bernstein_bound *)
+  case f: False
+  have "V \<ge> 0"
+    unfolding V_def
+    apply (intro sum_nonneg  integral_nonneg_AE)
+    by auto
+  then have V: "V > 0" using f by auto
+
+  have "t * B / V \<ge> 0" using t B V by auto
+  from bennett_h_bernstein_bound[OF this]
+  have "(t * B / V)\<^sup>2 / (2 * (1 + t * B / V / 3))
+    \<le> bennett_h (t * B / V)" .
+
+  (* Multiplying by the nonpositive factor - V / B^2 reverses the inequality *)
+  then have "(- V / B^2) * bennett_h (t * B / V) \<le>
+    (- V / B^2) * ((t * B / V)\<^sup>2 / (2 * (1 + t * B / V / 3)))"
+    apply (subst mult_left_mono_neg)
+    using B V by auto
+  also have "... =
+     ((- V / B^2) * (t * B / V)\<^sup>2) / (2 * (1 + t * B / V / 3))"
+    by auto
+  also have " ((- V / B^2) * (t * B / V)\<^sup>2) = -(t^2) / V"
+    using V B by (auto simp add: field_simps power2_eq_square)
+  (* Field arithmetic brings the exponent into the form stated in the goal *)
+  finally have *: "(- V / B^2) * bennett_h (t * B / V) \<le>
+     -(t^2)  / (2 * (V + t * B  / 3))"
+    using V by (auto simp add: field_simps)
+
+  from bennett_inequality[OF assms(1-6)]
+  have "prob {x \<in> space M. (\<Sum>i \<in> I. X i x - expectation (X i)) \<ge> t} \<le>
+    exp (- V / B^2 * bennett_h (t * B / V))"
+    using V_def by auto
+  (* exp is monotone, so the exponent bound carries over *)
+  also have "... \<le> exp (- (t^2/ (2 * (V + t * B  / 3))))"
+    using *
+    by auto
+  finally show ?thesis .
+qed
+
+end
+
+end
diff --git a/thys/Concentration_Inequalities/Bienaymes_Identity.thy b/thys/Concentration_Inequalities/Bienaymes_Identity.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/Bienaymes_Identity.thy
@@ -0,0 +1,181 @@
+section \<open>Bienaym\'e's identity\<close>
+
+text \<open>Bienaym\'e's identity~\cite[\S 17]{loeve1977} can be used to deduce the variance of a sum of
+random variables, if their covariance is known. A common use case of the identity is the
+computation of the variance of the mean of pairwise independent variables.\<close>
+
+theory Bienaymes_Identity
+  imports Concentration_Inequalities_Preliminary
+begin
+
+context prob_space
+begin
+
+(* Dividing an integrable real random variable f by a constant r divides
+   its variance by r^2. *)
+lemma variance_divide:
+  fixes f :: "'a \<Rightarrow> real"
+  assumes "integrable M f"
+  shows "variance (\<lambda>\<omega>. f \<omega> / r) = variance f / r^2"
+  using assms
+  by (subst Bochner_Integration.integral_divide[OF assms(1)])
+    (simp add:diff_divide_distrib[symmetric] power2_eq_square algebra_simps)
+
+(* Covariance of f and g: the expectation of the product of the two
+   centred variables (f - E[f]) and (g - E[g]). *)
+definition covariance where
+  "covariance f g = expectation (\<lambda>\<omega>. (f \<omega> - expectation f) * (g \<omega> - expectation g))"
+
+(* Alternative formula for the covariance of two measurable,
+   square-integrable real random variables:
+   covariance f g = E[f * g] - E[f] * E[g]. *)
+lemma covariance_eq:
+  fixes f :: "'a \<Rightarrow> real"
+  assumes "f \<in> borel_measurable M" "g \<in> borel_measurable M"
+  assumes "integrable M (\<lambda>\<omega>. f \<omega>^2)" "integrable M (\<lambda>\<omega>. g \<omega>^2)"
+  shows "covariance f g = expectation (\<lambda>\<omega>. f \<omega> * g \<omega>) - expectation f * expectation g"
+proof -
+  (* Square-integrability gives integrability of f and of g *)
+  have "integrable M f" using square_integrable_imp_integrable assms by auto
+  moreover have "integrable M g" using square_integrable_imp_integrable assms by auto
+  (* NOTE(review): cauchy_schwartz(1) is defined outside this file;
+     presumably it supplies integrability of the product f * g -- confirm *)
+  ultimately show ?thesis
+    using assms cauchy_schwartz(1)[where M="M"]
+    by (simp add:covariance_def algebra_simps prob_space)
+qed
+
+(* The integrand in the definition of covariance, i.e. the product of the
+   centred variables, is integrable when f and g are measurable and
+   square-integrable. *)
+lemma covar_integrable:
+  fixes f g :: "'a \<Rightarrow> real"
+  assumes "f \<in> borel_measurable M" "g \<in> borel_measurable M"
+  assumes "integrable M (\<lambda>\<omega>. f \<omega>^2)" "integrable M (\<lambda>\<omega>. g \<omega>^2)"
+  shows "integrable M (\<lambda>\<omega>. (f \<omega> - expectation f) * (g \<omega> - expectation g))"
+proof -
+  (* Square-integrability gives integrability of f and of g *)
+  have "integrable M f" using square_integrable_imp_integrable assms by auto
+  moreover have "integrable M g" using square_integrable_imp_integrable assms by auto
+  (* After expanding the product (algebra_simps) each summand is integrable *)
+  ultimately show ?thesis using assms cauchy_schwartz(1)[where M="M"] by (simp add: algebra_simps)
+qed
+
+(* The square of a finite sum of measurable, square-integrable real random
+   variables is integrable. *)
+lemma sum_square_int:
+  fixes f :: "'b \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> f i \<in> borel_measurable M"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>\<omega>. f i \<omega>^2)"
+  shows "integrable M (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)\<^sup>2)"
+proof -
+  (* The double sum of pairwise products is integrable term by term *)
+  have " integrable M (\<lambda>\<omega>. \<Sum>i\<in>I. \<Sum>j\<in>I. f j \<omega> * f i \<omega>)"
+    using assms
+    by (intro Bochner_Integration.integrable_sum cauchy_schwartz(1)[where M="M"], auto)
+  (* The squared sum expands into exactly that double sum *)
+  thus ?thesis
+    by (simp add:power2_eq_square sum_distrib_left sum_distrib_right)
+qed
+
+(* Bienayme's identity: for a finite family of measurable, square-integrable
+   real random variables, the variance of the sum equals the double sum of
+   all pairwise covariances (including the diagonal terms i = j). *)
+theorem bienaymes_identity:
+  fixes f :: "'b \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> f i \<in> borel_measurable M"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>\<omega>. f i \<omega>^2)"
+  shows
+    "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) = (\<Sum>i \<in> I. (\<Sum>j \<in> I. covariance (f i) (f j)))"
+proof -
+  (* Every covariance integrand is integrable (covar_integrable) *)
+  have a:"\<And>i j. i \<in> I \<Longrightarrow> j \<in> I \<Longrightarrow>
+    integrable M (\<lambda>\<omega>. (f i \<omega> - expectation (f i)) * (f j \<omega> - expectation (f j)))"
+    using assms covar_integrable by simp
+  (* Move the expectation of the sum inside, giving a sum of centred terms *)
+  have "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) = expectation (\<lambda>\<omega>. (\<Sum>i\<in>I. f i \<omega> - expectation (f i))\<^sup>2)"
+    using square_integrable_imp_integrable[OF assms(2,3)]
+    by (simp add: Bochner_Integration.integral_sum  sum_subtractf)
+  (* Expand the square into a double sum of products *)
+  also have "... = expectation (\<lambda>\<omega>. (\<Sum>i \<in> I. (\<Sum>j \<in> I.
+    (f i \<omega> - expectation (f i)) *  (f j \<omega> - expectation (f j)))))"
+    by (simp add: power2_eq_square sum_distrib_right sum_distrib_left mult.commute)
+  (* Exchange expectation and the finite sums, using fact a *)
+  also have "... = (\<Sum>i \<in> I. (\<Sum>j \<in> I. covariance (f i) (f j)))"
+    using a by (simp add: Bochner_Integration.integral_sum covariance_def)
+  finally show ?thesis by simp
+qed
+
+(* The covariance of a variable with itself is its variance. *)
+lemma covar_self_eq:
+  fixes f :: "'a \<Rightarrow> real"
+  shows "covariance f f = variance f"
+  by (simp add:covariance_def power2_eq_square)
+
+(* Independent integrable real random variables have covariance 0. *)
+lemma covar_indep_eq_zero:
+  fixes f g :: "'a \<Rightarrow> real"
+  assumes "integrable M f"
+  assumes "integrable M g"
+  assumes "indep_var borel f borel g"
+  shows "covariance f g = 0"
+proof -
+  (* Centring each variable preserves independence *)
+  have a:"indep_var borel ((\<lambda>t. t - expectation f) \<circ> f) borel ((\<lambda>t. t - expectation g) \<circ> g)"
+    by (rule indep_var_compose[OF assms(3)], auto)
+
+  (* The expectation of the product factorises by independence
+     (indep_var_lebesgue_integral); the remaining goals are closed by auto *)
+  have b:"expectation (\<lambda>\<omega>. (f \<omega> - expectation f) * (g \<omega> - expectation g)) = 0"
+    using a assms by (subst indep_var_lebesgue_integral, auto simp add:comp_def prob_space)
+
+  thus ?thesis by (simp add:covariance_def)
+qed
+
+(* Variant of bienaymes_identity with the diagonal separated: the variance
+   of the sum is the sum of the variances plus the sum of the covariances
+   over all ordered pairs (i, j) with j different from i. *)
+lemma bienaymes_identity_2:
+  fixes f :: "'b \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> f i \<in> borel_measurable M"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>\<omega>. f i \<omega>^2)"
+  shows "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) =
+      (\<Sum>i \<in> I. variance (f i)) + (\<Sum>i \<in> I. \<Sum>j \<in> I - {i}. covariance (f i) (f j))"
+proof -
+  have "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) = (\<Sum>i\<in>I. \<Sum>j\<in>I. covariance (f i) (f j))"
+    by (simp add: bienaymes_identity[OF assms(1,2,3)])
+  (* Split the term j = i off each inner sum *)
+  also have "... = (\<Sum>i\<in>I. covariance (f i) (f i) + (\<Sum>j\<in>I-{i}. covariance (f i) (f j)))"
+    using assms by (subst sum.insert[symmetric], auto simp add:insert_absorb)
+  (* The diagonal covariances are variances (covar_self_eq) *)
+  also have "... = (\<Sum>i\<in>I. variance (f i)) +  (\<Sum>i \<in> I. (\<Sum>j\<in>I-{i}. covariance (f i) (f j)))"
+    by (simp add: covar_self_eq[symmetric] sum.distrib)
+  finally show ?thesis by simp
+qed
+
+(* For a finite family of measurable, square-integrable real random
+   variables that are pairwise independent (stated with indep_var for
+   every pair of distinct indices), the variance of the sum equals the sum
+   of the variances. *)
+theorem bienaymes_identity_pairwise_indep:
+  fixes f :: "'b \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> f i \<in> borel_measurable M"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>\<omega>. f i \<omega>^2)"
+  assumes "\<And>i j. i \<in> I \<Longrightarrow> j \<in> I \<Longrightarrow> i \<noteq> j \<Longrightarrow> indep_var borel (f i) borel (f j)"
+  shows "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) = (\<Sum>i \<in> I. variance (f i))"
+proof -
+  (* All off-diagonal covariances vanish by covar_indep_eq_zero *)
+  have "\<And>i j. i \<in> I \<Longrightarrow> j \<in> I - {i} \<Longrightarrow> covariance (f i) (f j) = 0"
+    using covar_indep_eq_zero assms(4) square_integrable_imp_integrable[OF assms(2,3)] by auto
+  hence a:"(\<Sum>i \<in> I. \<Sum>j \<in> I - {i}. covariance (f i) (f j)) = 0"
+    by simp
+  (* So only the variance part of bienaymes_identity_2 remains *)
+  thus ?thesis by (simp add: bienaymes_identity_2[OF assms(1,2,3)])
+qed
+
+(* Converts independence of the family f restricted to a two-element index
+   set {i, j} (indep_vars) into the binary notion indep_var for f i and
+   f j.  The proof reindexes the family by bool via case_bool i j. *)
+lemma indep_var_from_indep_vars:
+  assumes "i \<noteq> j"
+  assumes "indep_vars (\<lambda>_. M') f {i, j}"
+  shows "indep_var M' (f i) M' (f j)"
+proof -
+  (* case_bool i j is an injection from bool whose range is {i, j} *)
+  have a:"inj (case_bool i j)" using assms(1)
+    by (simp add: bool.case_eq_if inj_def)
+  have b:"range (case_bool i j) = {i,j}"
+    by (simp add: UNIV_bool insert_commute)
+  have c:"indep_vars (\<lambda>_. M') f (range (case_bool i j))" using assms(2) b by simp
+
+  (* Chain of equalities between propositions, starting from True, that
+     ends in the goal *)
+  have "True = indep_vars (\<lambda>x. M') (\<lambda>x. f (case_bool i j x)) UNIV"
+    using indep_vars_reindex[OF a c]
+    by (simp add:comp_def)
+  also have "... = indep_vars (\<lambda>x. case_bool M' M' x) (\<lambda>x. case_bool (f i) (f j) x) UNIV"
+    by (rule indep_vars_cong, auto simp:bool.case_distrib bool.case_eq_if)
+  (* The bool-indexed statement is the definition of indep_var *)
+  also have "... = ?thesis"
+    by (simp add: indep_var_def)
+  finally show ?thesis by simp
+qed
+
+(* Same conclusion as bienaymes_identity_pairwise_indep, with pairwise
+   independence stated via indep_vars on every two-element subset J of I.
+   Reduced to that theorem through indep_var_from_indep_vars. *)
+lemma bienaymes_identity_pairwise_indep_2:
+  fixes f :: "'b \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> f i \<in> borel_measurable M"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>\<omega>. f i \<omega>^2)"
+  assumes "\<And>J. J \<subseteq> I \<Longrightarrow> card J = 2 \<Longrightarrow> indep_vars (\<lambda> _. borel) f J"
+  shows "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) = (\<Sum>i \<in> I. variance (f i))"
+  using assms(4)
+  by (intro bienaymes_identity_pairwise_indep[OF assms(1,2,3)] indep_var_from_indep_vars, auto)
+
+(* Same conclusion for a fully independent family (indep_vars on all of I):
+   independence restricts to every subset (indep_vars_subset), so
+   bienaymes_identity_pairwise_indep_2 applies. *)
+lemma bienaymes_identity_full_indep:
+  fixes f :: "'b \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> f i \<in> borel_measurable M"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> integrable M (\<lambda>\<omega>. f i \<omega>^2)"
+  assumes "indep_vars (\<lambda> _. borel) f I"
+  shows "variance (\<lambda>\<omega>. (\<Sum>i \<in> I. f i \<omega>)) = (\<Sum>i \<in> I. variance (f i))"
+  by (intro bienaymes_identity_pairwise_indep_2[OF assms(1,2,3)] indep_vars_subset[OF assms(4)])
+    auto
+
+end
+
+end
diff --git a/thys/Concentration_Inequalities/Cantelli_Inequality.thy b/thys/Concentration_Inequalities/Cantelli_Inequality.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/Cantelli_Inequality.thy
@@ -0,0 +1,118 @@
+section \<open>Cantelli's Inequality\<close>
+
+text \<open>Cantelli's inequality~\cite{cantelli1929sui} is an improvement of Chebyshev's inequality for
+one-sided tail bounds.\<close>
+
+theory Cantelli_Inequality
+  imports "HOL-Probability.Probability"
+begin
+
+context prob_space
+begin
+
+lemma cantelli_arith: (* arithmetic identity used for the final step of cantelli_inequality, where it is applied after unfolding u = variance Z / a *)
+  assumes "a > (0::real)"
+  shows "(V + (V / a)^2) / (a + (V / a))^2 = V / (a ^2 + V)" (is "?L = ?R")
+proof -
+  have "?L = ((V * a^2 + V^2) / a^2) / ((a^2 + V)^2/a^2)" (* write numerator and denominator as fractions over a^2 *)
+    using assms by (intro arg_cong2[where f="(/)"]) (simp_all add:field_simps power2_eq_square)
+  also have "... = (V * a\<^sup>2 + V\<^sup>2)/ (a\<^sup>2 + V)\<^sup>2" (* cancel the common a^2 *)
+    using assms unfolding divide_divide_times_eq by simp
+  also have "... = V * (a^2 + V) / (a^2 + V)^2" (* factor V out of the numerator *)
+    by (intro arg_cong2[where f="(/)"]) (simp_all add: algebra_simps power2_eq_square)
+  also have "... = ?R" by (simp add:power2_eq_square) (* cancel one factor of a^2 + V *)
+  finally show ?thesis by simp
+qed
+
+theorem cantelli_inequality: (* upper-tail bound: P(Z - E Z >= a) <= Var Z / (a^2 + Var Z) for a > 0 *)
+  assumes [measurable]: "random_variable borel Z"
+  assumes intZsq: "integrable M (\<lambda>z. Z z^2)"
+  assumes a: "a > 0"
+  shows "prob {z \<in> space M. Z z - expectation Z \<ge> a} \<le>
+    variance Z / (a^2 + variance Z)"
+proof -
+  define u where "u = variance Z / a" (* shift added to both sides of the event below *)
+  have u: "u \<ge> 0"
+    unfolding u_def
+    by (simp add: a divide_nonneg_pos)
+  define Y where "Y = (\<lambda>z. Z z + (-expectation Z))" (* centred variable Z - E Z *)
+  have "random_variable borel (\<lambda>z. \<bar>Y z + u\<bar>)"
+    unfolding Y_def
+    by auto
+  then have ev: "{z \<in> space M. a + u \<le> \<bar>Y z + u\<bar>} \<in> events" (* measurability of the enlarged event used below *)
+    by auto
+
+  have intZ:"integrable M Z" (* square-integrable implies integrable *)
+    apply (subst square_integrable_imp_integrable[OF _ intZsq])
+    by auto
+  then have i1: "integrable M (\<lambda>z. (Z z - expectation Z + u)\<^sup>2)"
+    unfolding power2_sum power2_diff using intZsq
+    by auto
+
+  have intY:"integrable M Y"
+    unfolding Y_def using intZ by auto
+  have intYsq:"integrable M (\<lambda>z. Y z^2)"
+    unfolding Y_def power2_sum using intZsq intZ by auto
+
+  have "expectation Y = 0" (* Y has mean zero *)
+    unfolding Y_def
+    apply (subst Bochner_Integration.integral_add[OF intZ])
+    using prob_space by auto
+
+  then have "expectation (\<lambda>z. (Y z + u)^2) =
+    expectation (\<lambda>z. (Y z)^2) + u^2" (* expand the square via power2_sum and integrate termwise *)
+    unfolding power2_sum
+    apply (subst Bochner_Integration.integral_add[OF _ _])
+    using intY intYsq apply auto[2]
+    apply (subst Bochner_Integration.integral_add[OF _ _])
+    using intY intYsq apply auto[2]
+    using prob_space by auto
+  then have *: "expectation (\<lambda>z. (Y z + u)^2) = variance Z + u^2"
+    unfolding Y_def by auto
+
+  have "
+    prob {z \<in> space M. Z z - expectation Z \<ge> a} =
+    prob {z \<in> space M. Y z + u \<ge> a + u}" (* same event, with u added on both sides *)
+    apply (intro arg_cong[where f = prob])
+    using Y_def by auto
+  also have "... \<le> prob {z \<in> space M. a + u \<le> \<bar>Y z + u\<bar>}" (* enlarge the event by taking absolute values *)
+    apply (intro finite_measure_mono[OF _ ev])
+    by auto
+
+  also have "... \<le> expectation (\<lambda>z. (Y z + u)^2) / (a + u)^2" (* second_moment_method applied to Y + u with threshold a + u *)
+    apply (intro second_moment_method)
+    unfolding Y_def using a u i1 by auto
+  also have "... = ((variance Z) + u^2)  / (a + u)^2"
+    using * by auto
+  also have "... = variance Z / (a ^2 + variance Z)" (* arithmetic simplification via cantelli_arith *)
+    unfolding u_def using a by (auto intro!: cantelli_arith)
+  finally show ?thesis .
+qed
+
+(* the left sided (negative) version of the inequality *)
+corollary cantelli_inequality_neg: (* lower-tail bound, obtained by applying cantelli_inequality to -Z *)
+  assumes [measurable]: "random_variable borel Z"
+  assumes intZsq: "integrable M (\<lambda>z. Z z^2)"
+  assumes a: "a > 0"
+  shows "prob {z \<in> space M. Z z - expectation Z \<le> -a} \<le>
+    variance Z / (a^2 + variance Z)"
+proof -
+  define nZ where [simp]: "nZ = (\<lambda>z. -Z z)" (* negated variable *)
+  have vnZ: "variance nZ = variance Z" (* the variance is unchanged by negation *)
+    unfolding nZ_def
+    by (auto simp add: power2_commute)
+
+  have 1: "random_variable borel nZ" by auto
+  have 2: "integrable M (\<lambda>z. (nZ z)\<^sup>2) "
+    using intZsq by auto
+  from cantelli_inequality[OF 1 2 a]
+  have "prob {z \<in> space M. a \<le> nZ z - expectation nZ} \<le>
+    variance nZ / (a^2 + variance nZ)"
+    by auto
+  thus ?thesis unfolding vnZ apply auto[1] (* rewrite the event for nZ into the event for Z *)
+    by (smt (verit, del_insts) Collect_cong)
+qed
+
+end
+
+end
\ No newline at end of file
diff --git a/thys/Concentration_Inequalities/Concentration_Inequalities_Preliminary.thy b/thys/Concentration_Inequalities/Concentration_Inequalities_Preliminary.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/Concentration_Inequalities_Preliminary.thy
@@ -0,0 +1,247 @@
+section \<open>Preliminary results\<close>
+
+theory Concentration_Inequalities_Preliminary
+  imports Lp.Lp
+begin
+
+text \<open>Version of the Cauchy-Schwarz inequality for the Lebesgue integral:\<close>
+lemma cauchy_schwartz: (* two conclusions: (1) f * g is integrable, (2) bound on its integral; both obtained from Holder_inequality *)
+  fixes f g :: "_ \<Rightarrow> real"
+  assumes "f \<in> borel_measurable M" "g \<in> borel_measurable M"
+  assumes "integrable M (\<lambda>x. (f x) ^2)" "integrable M (\<lambda>x. (g x) ^2)"
+  shows "integrable M (\<lambda>x. f x * g x)" (is "?A")
+        "(\<integral>x. f x * g x \<partial>M) \<le> (\<integral>x. (f x)^2 \<partial>M) powr (1/2) * (\<integral>x. (g x)^ 2 \<partial>M) powr (1/2)"
+        (is "?L \<le> ?R")
+proof -
+  show 0:"?A" (* Holder_inequality(1) with exponents p = q = 2 *)
+    using assms by (intro Holder_inequality(1)[where p="2" and q="2"]) auto
+
+  have "?L \<le> (\<integral>x. \<bar>f x * g x\<bar> \<partial>M)" (* bound the integral by the integral of the absolute value *)
+    using 0 by (intro integral_mono) auto
+  also have "... \<le> (\<integral>x. \<bar>f x\<bar> powr 2 \<partial>M) powr (1/2) * (\<integral>x. \<bar>g x\<bar> powr 2 \<partial>M) powr (1/2)"
+    using assms by (intro Holder_inequality(2)) auto
+  also have "... = ?R" by simp (* rewrite the powr 2 of absolute values back to squares *)
+  finally show "?L \<le> ?R" by simp
+qed
+
+text \<open>Generalization of @{thm [source] prob_space.indep_vars_iff_distr_eq_PiM'}:\<close>
+
+lemma (in prob_space) indep_vars_iff_distr_eq_PiM'': (* independence <-> joint distribution is the product of the marginals; I = {} is proved directly, I ~= {} is delegated to indep_vars_iff_distr_eq_PiM' *)
+  fixes I :: "'i set" and X :: "'i \<Rightarrow> 'a \<Rightarrow> 'b"
+  assumes rv: "\<And>i. i \<in> I \<Longrightarrow> random_variable (M' i) (X i)"
+  shows "indep_vars M' X I \<longleftrightarrow>
+           distr M (\<Pi>\<^sub>M i\<in>I. M' i) (\<lambda>x. \<lambda>i\<in>I. X i x) = (\<Pi>\<^sub>M i\<in>I. distr M (M' i) (X i))"
+proof (cases "I = {}")
+  case True
+  have 0: " indicator A (\<lambda>_. undefined) = emeasure (count_space {\<lambda>_. undefined}) A" (is "?L = ?R")
+    if "A \<subseteq> {\<lambda>_. undefined}" for A :: "('i \<Rightarrow> 'b) set" (* on subsets of the singleton, the indicator at its element equals the counting measure *)
+  proof -
+    have 1:"A \<noteq> {} \<Longrightarrow> A = {\<lambda>_. undefined}"
+      using that by auto
+
+    have "?R = of_nat (card A)"
+      using finite_subset that by (intro emeasure_count_space_finite that) auto
+    also have "... = ?L"
+      using 1 by (cases "A = {}") auto
+    finally show ?thesis by simp
+  qed
+
+  have "distr M (\<Pi>\<^sub>M i\<in>I. M' i) (\<lambda>x. \<lambda>i\<in>I. X i x) =
+    distr M (count_space {\<lambda>_. undefined}) (\<lambda>_. (\<lambda>_. undefined))" (* with I = {}, PiM_empty turns the product into a count_space on a singleton *)
+    unfolding True PiM_empty by (intro distr_cong) (auto simp:restrict_def)
+  also have "... = return (count_space {\<lambda>_. undefined}) (\<lambda>_. undefined)"
+    by (intro distr_const) auto
+  also have "... = count_space ({\<lambda>_. undefined} :: ('i \<Rightarrow> 'b) set) "
+    by (intro measure_eqI) (auto simp:0)
+  also have "... = (\<Pi>\<^sub>M i\<in>I. distr M (M' i) (X i))"
+    unfolding True PiM_empty by simp
+  finally have "distr M (\<Pi>\<^sub>M i\<in>I. M' i) (\<lambda>x. \<lambda>i\<in>I. X i x)=(\<Pi>\<^sub>M i\<in>I. distr M (M' i) (X i)) \<longleftrightarrow> True"
+    by simp
+  also have "... \<longleftrightarrow> indep_vars M' X I" (* for I = {} the independence statement is itself equivalent to True *)
+    unfolding indep_vars_def by (auto simp add: space_PiM indep_sets_def) (auto simp add:True)
+  finally show ?thesis by simp
+next
+  case False
+  thus ?thesis (* non-empty index set: use the existing lemma *)
+    by (intro indep_vars_iff_distr_eq_PiM' assms) auto
+qed
+
+lemma proj_indep: (* the coordinate projections on a product of probability spaces are independent *)
+  assumes "\<And>i. i \<in> I \<Longrightarrow> prob_space (M i)"
+  shows "prob_space.indep_vars (PiM I M) M (\<lambda>i \<omega>. \<omega> i) I"
+proof -
+  interpret prob_space "(PiM I M)" (* work inside the product probability space *)
+    by (intro prob_space_PiM assms)
+
+  have "distr (Pi\<^sub>M I M) (Pi\<^sub>M I M) (\<lambda>x. restrict x I) = PiM I M"
+    by (intro distr_PiM_reindex assms) auto
+  also have "... =  Pi\<^sub>M I (\<lambda>i. distr (Pi\<^sub>M I M) (M i) (\<lambda>\<omega>. \<omega> i))" (* each factor is the distribution of its coordinate projection *)
+    by (intro PiM_cong refl distr_PiM_component[symmetric] assms)
+  finally have
+    "distr (Pi\<^sub>M I M) (Pi\<^sub>M I M) (\<lambda>x. restrict x I) = Pi\<^sub>M I (\<lambda>i. distr (Pi\<^sub>M I M) (M i) (\<lambda>\<omega>. \<omega> i))"
+    by simp
+  thus "indep_vars M (\<lambda>i \<omega>. \<omega> i) I" (* conclude with the distribution characterisation of independence *)
+    by (intro iffD2[OF indep_vars_iff_distr_eq_PiM'']) simp_all
+qed
+
+lemma forall_Pi_to_PiE: (* if P only depends on restrict x I, quantifying over Pi I A and over PiE I A is the same *)
+  assumes "\<And>x. P x = P (restrict x I)"
+  shows "(\<forall>x \<in> Pi I A. P x) = (\<forall>x \<in> PiE I A. P x)"
+  using assms by (simp add:PiE_def Pi_def set_eq_iff, force)
+
+lemma PiE_reindex: (* reindexing an extensional product along a function f that is injective on I *)
+  assumes "inj_on f I"
+  shows "PiE I (A \<circ> f) = (\<lambda>a. restrict (a \<circ> f) I) ` PiE (f ` I) A" (is "?lhs = ?g ` ?rhs")
+proof -
+  have "?lhs \<subseteq> ?g` ?rhs"
+  proof (rule subsetI)
+    fix x
+    assume a:"x \<in> Pi\<^sub>E I (A \<circ> f)"
+    define y where y_def: "y = (\<lambda>k. if k \<in> f ` I then x (the_inv_into I f k) else undefined)" (* candidate preimage of x, built with the inverse of f on I *)
+    have b:"y \<in> PiE (f ` I) A"
+      using a assms the_inv_into_f_eq[OF assms]
+      by (simp add: y_def PiE_iff extensional_def)
+    have c: "x = (\<lambda>a. restrict (a \<circ> f) I) y" (* y is mapped back to x *)
+      using a assms the_inv_into_f_eq extensional_arb
+      by (intro ext, simp add:y_def PiE_iff, fastforce)
+    show "x \<in> ?g ` ?rhs" using b c by blast
+  qed
+  moreover have "?g ` ?rhs \<subseteq> ?lhs" (* reverse inclusion *)
+    by (rule image_subsetI, simp add:Pi_def PiE_def)
+  ultimately show ?thesis by blast
+qed
+
+context prob_space
+begin
+
+lemma indep_sets_reindex: (* indep_sets over the image f ` I equals indep_sets of the reindexed family over I, for f injective on I *)
+  assumes "inj_on f I"
+  shows "indep_sets A (f ` I) = indep_sets (\<lambda>i. A (f i)) I"
+proof -
+  have a: "\<And>J g. J \<subseteq> I \<Longrightarrow> (\<Prod>j \<in> f ` J. g j) = (\<Prod>j \<in> J. g (f j))" (* products over f ` J can be reindexed over J *)
+    by (metis assms prod.reindex_cong subset_inj_on)
+
+  have b:"J \<subseteq> I \<Longrightarrow> (\<Pi>\<^sub>E i \<in> J. A (f i)) = (\<lambda>a. restrict (a \<circ> f) J) ` PiE (f ` J) A" for J (* PiE_reindex specialised to subsets of I *)
+    using assms inj_on_subset
+    by (subst PiE_reindex[symmetric]) auto
+
+  have c:"\<And>J. J \<subseteq> I \<Longrightarrow> finite (f ` J) = finite J" (* finiteness is preserved under the injective image *)
+    by (meson assms finite_image_iff inj_on_subset)
+
+  show ?thesis
+    by (simp add:indep_sets_def all_subset_image a c) (simp_all add:forall_Pi_to_PiE b)
+qed
+
+lemma indep_vars_reindex: (* independence over f ` I yields independence of the reindexed family over I, for f injective on I *)
+  assumes "inj_on f I"
+  assumes "indep_vars M' X' (f ` I)"
+  shows "indep_vars (M' \<circ> f) (\<lambda>k \<omega>. X' (f k) \<omega>) I"
+  using assms by (simp add:indep_vars_def2 indep_sets_reindex) (* follows from indep_sets_reindex after unfolding indep_vars_def2 *)
+
+lemma indep_vars_cong_AE: (* independence carries over to a measurable family Y' that agrees with X' almost everywhere *)
+  assumes "AE x in M. (\<forall>i \<in> I. X' i x = Y' i x)"
+  assumes "indep_vars M' X' I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> random_variable (M' i) (Y' i)"
+  shows "indep_vars M' Y' I"
+proof -
+  have a: "AE x in M. (\<lambda>i\<in>I. Y' i x) = (\<lambda>i\<in>I. X' i x)" (* the joint maps agree almost everywhere *)
+    by (rule AE_mp[OF assms(1)], rule AE_I2, simp cong:restrict_cong)
+  have b: "\<And>i. i \<in> I \<Longrightarrow> random_variable (M' i) (X' i)"
+    using assms(2) by (simp add:indep_vars_def2)
+  have c: "\<And>x. x \<in> I \<Longrightarrow> AE xa in M. X' x xa = Y' x xa" (* componentwise agreement almost everywhere *)
+    by (rule AE_mp[OF assms(1)], rule AE_I2, simp)
+
+  have "distr M (Pi\<^sub>M I M') (\<lambda>x. \<lambda>i\<in>I. Y' i x) = distr M (Pi\<^sub>M I M') (\<lambda>x. \<lambda>i\<in>I. X' i x)" (* equal joint distributions *)
+    by (intro distr_cong_AE measurable_restrict a b assms(3)) auto
+  also have "... =  Pi\<^sub>M I (\<lambda>i. distr M (M' i) (X' i))" (* independence of X' *)
+    using assms b by (subst indep_vars_iff_distr_eq_PiM''[symmetric]) auto
+  also have "... =  Pi\<^sub>M I (\<lambda>i. distr M (M' i) (Y' i))" (* equal marginal distributions *)
+    by (intro PiM_cong distr_cong_AE c assms(3) b) auto
+  finally have "distr M (Pi\<^sub>M I M') (\<lambda>x. \<lambda>i\<in>I. Y' i x) = Pi\<^sub>M I (\<lambda>i. distr M (M' i) (Y' i))"
+    by simp
+
+  thus ?thesis
+    using assms(3)
+    by (subst indep_vars_iff_distr_eq_PiM'') auto
+qed
+
+end
+
+text \<open>Integrability of bounded functions on finite measure spaces:\<close>
+
+lemma bounded_const: "bounded ((\<lambda>x. (c::real)) ` T)" (* the image of a constant real function is bounded, with bound norm c *)
+  by (intro boundedI[where B="norm c"]) auto
+
+lemma bounded_exp: (* exp of a function with bounded image on T has bounded image on T *)
+  fixes f :: "'a \<Rightarrow> real"
+  assumes "bounded ((\<lambda>x. f x) ` T)"
+  shows "bounded ((\<lambda>x. exp (f x)) ` T)"
+proof -
+  obtain m where "norm (f x) \<le> m" if "x \<in> T" for x (* bound on f over T *)
+    using assms unfolding bounded_iff by auto
+
+  thus ?thesis
+    by (intro boundedI[where B="exp m"]) fastforce (* exp m then bounds exp (f x) *)
+qed
+
+lemma bounded_mult_comp: (* the pointwise product of two real functions with bounded image on T has bounded image on T *)
+  fixes f :: "'a \<Rightarrow> real"
+  assumes "bounded (f ` T)" "bounded (g ` T)"
+  shows "bounded ((\<lambda>x. (f x) * (g x)) ` T)"
+proof -
+  obtain m1 where "norm (f x) \<le> m1" "m1 \<ge>0" if "x \<in> T" for x (* non-negative bound for f *)
+    using assms unfolding bounded_iff by fastforce
+  moreover obtain m2 where "norm (g x) \<le> m2" "m2 \<ge>0" if "x \<in> T" for x (* non-negative bound for g *)
+    using assms unfolding bounded_iff by fastforce
+
+  ultimately show ?thesis
+    by (intro boundedI[where B="m1 * m2"]) (auto intro!: mult_mono simp:abs_mult) (* the product of the two bounds works *)
+qed
+
+lemma bounded_sum: (* a finite sum of functions with bounded image on T has bounded image on T *)
+  fixes f :: "'i \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> bounded (f i ` T)"
+  shows "bounded ((\<lambda>x. (\<Sum>i \<in> I. f i x)) ` T)"
+  using assms by (induction I) (auto intro:bounded_plus_comp bounded_const) (* induction over the finite index set *)
+
+lemma (in finite_measure) bounded_int: (* if f is bounded on T x space M, then the integral of f x over M is bounded as x ranges over T *)
+  fixes f :: "'i \<Rightarrow> 'a \<Rightarrow> real"
+  assumes "bounded ((\<lambda> x. f (fst x) (snd x)) ` (T \<times> space M))"
+  shows "bounded ((\<lambda>x. (\<integral>\<omega>. (f x \<omega>) \<partial>M)) ` T)"
+proof -
+  obtain m where "\<And>x y. x \<in> T \<Longrightarrow> y \<in> space M \<Longrightarrow> norm (f x y) \<le> m"
+    using assms unfolding bounded_iff by auto
+  hence m:"\<And>x y. x \<in> T \<Longrightarrow> y \<in> space M \<Longrightarrow> norm (f x y) \<le> max m 0" (* weaken to the non-negative bound max m 0 *)
+    by fastforce
+
+  have "norm (\<integral>\<omega>. (f x \<omega>) \<partial>M) \<le> max m 0 * measure M (space M)" (is "?L \<le> ?R") if "x \<in> T" for x
+  proof -
+    have "?L \<le> (\<integral>\<omega>. norm (f x \<omega>) \<partial>M)" by simp (* norm of the integral is at most the integral of the norm *)
+    also have "... \<le> (\<integral>\<omega>. max m 0 \<partial>M)"
+      using that m by (intro integral_mono') auto
+    also have "... = ?R" (* integral of a constant *)
+      by simp
+    finally show ?thesis by simp
+  qed
+  thus ?thesis
+    by (intro boundedI[where B="max m 0 * measure M (space M)"]) auto
+qed
+
+lemmas bounded_intros = (* collection of boundedness rules bundled under one name *)
+  bounded_minus_comp bounded_plus_comp bounded_mult_comp bounded_sum finite_measure.bounded_int
+  bounded_const bounded_exp
+
+lemma (in prob_space) integrable_bounded: (* a measurable function with bounded image on space M is integrable *)
+  fixes f :: "_ \<Rightarrow> ('b :: {banach,second_countable_topology})"
+  assumes "bounded (f ` space M)"
+  assumes "f \<in> M \<rightarrow>\<^sub>M borel"
+  shows "integrable M f"
+proof -
+  obtain m where "norm (f x) \<le> m" if "x \<in> space M" for x (* uniform bound on the norm of f *)
+    using assms(1) unfolding bounded_iff by auto
+  thus ?thesis
+    by (intro integrable_const_bound[where B="m"] AE_I2 assms(2)) (* integrability from the constant bound *)
+qed
+
+end
\ No newline at end of file
diff --git a/thys/Concentration_Inequalities/Efron_Stein_Inequality.thy b/thys/Concentration_Inequalities/Efron_Stein_Inequality.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/Efron_Stein_Inequality.thy
@@ -0,0 +1,300 @@
+section \<open>Efron-Stein Inequality\<close>
+
+text \<open>In this section we verify the Efron-Stein inequality. The verified theorem is stated as the
+Efron-Stein inequality for non-symmetric functions by Steele~\cite{steele1986}. However, most
+textbooks refer to this version as ``the Efron-Stein inequality''. The original result that was shown
+by Efron and Stein is a tail bound for the variance of symmetric functions of i.i.d.
+random variables~\cite{efron1981}.\<close>
+
+theory Efron_Stein_Inequality
+  imports Concentration_Inequalities_Preliminary
+begin
+
+theorem efron_stein_inequality_distr: (* Efron-Stein inequality on a product measure PiM I M; the right-hand side integrates over a product indexed by I x bool *)
+  fixes f :: "_ \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> prob_space (M i)"
+  assumes "integrable (PiM I M) (\<lambda>x. f x^2)" and f_meas: "f \<in> borel_measurable (PiM I M)"
+  shows "prob_space.variance (PiM I M) f \<le>
+    (\<Sum>i\<in>I. (\<integral>x. (f (\<lambda>j. x (j,False)) - f (\<lambda>j. x (j, j=i)))^2 \<partial>PiM (I\<times>UNIV) (M \<circ> fst))) / 2"
+    (is "?L \<le> ?R")
+proof -
+  let ?M = "PiM (I\<times>(UNIV::bool set)) (M \<circ> fst)" (* product space with two coordinates, tagged False and True, per index in I *)
+
+  have prob: "prob_space (PiM I M)"
+    using assms(2) by (intro prob_space_PiM) auto
+
+  interpret prob_space "?M"
+    using assms(2) by (intro prob_space_PiM) auto
+
+  define n where "n = card I"
+
+  obtain q :: "_ \<Rightarrow> nat" where q:"bij_betw q I {..<n}" (* enumerate I by a bijection onto {..<n} *)
+    unfolding n_def using ex_bij_betw_finite_nat[OF assms(1)] atLeast0LessThan by auto
+
+  let ?\<phi> = "(\<lambda>n x. f (\<lambda>j. x (j, q j < n)))" (* f on the True coordinate where q j < n, the False coordinate elsewhere *)
+  let ?\<tau> = "(\<lambda>n x. f (\<lambda>j. x (j, q j = n)))" (* f on the True coordinate exactly where q j = n *)
+  let ?\<sigma> = "(\<lambda>x. f (\<lambda>j. x (j, False)))" (* f on the False coordinates only *)
+  let ?\<chi> = "(\<lambda>x. f (\<lambda>j. x (j, True)))" (* f on the True coordinates only *)
+
+  have meas_1: "(\<lambda>\<omega>. f (g \<omega>)) \<in> borel_measurable ?M" (* composing f with a measurable map into PiM I M is measurable *)
+    if "g \<in> Pi\<^sub>M (I \<times> UNIV) (M \<circ> fst) \<rightarrow>\<^sub>M Pi\<^sub>M I M" for g
+    using that by (intro measurable_compose[OF _ f_meas])
+
+  have meas_2: "(\<lambda>x j. x (j, h j)) \<in> ?M \<rightarrow>\<^sub>M Pi\<^sub>M I M" for h (* selecting coordinate (j, h j) for each j is measurable *)
+  proof -
+    have "?thesis \<longleftrightarrow> (\<lambda>x. (\<lambda>j \<in> I. x (j, h j))) \<in> ?M \<rightarrow>\<^sub>M Pi\<^sub>M I M"
+      by (intro measurable_cong) (auto simp:space_PiM PiE_def extensional_def)
+    also have "... \<longleftrightarrow> True"
+      unfolding eq_True
+      by (intro measurable_restrict measurable_PiM_component_rev) auto
+    finally show ?thesis by simp
+  qed
+
+  have int_1: "integrable ?M (\<lambda>x. (g x - h x)^2)" (* the difference of two square-integrable functions is square-integrable *)
+    if "integrable ?M (\<lambda>x. (g x)^2)"  "integrable ?M (\<lambda>x. (h x)^2)"
+    and "g \<in> borel_measurable ?M" "h \<in> borel_measurable ?M"
+    for g h :: "_ \<Rightarrow> real"
+  proof -
+    have "integrable ?M (\<lambda>x. (g x)^2 + (h x)^2 - 2 * (g x * h x))"
+      using that by (intro Bochner_Integration.integrable_add Bochner_Integration.integrable_diff
+          integrable_mult_right cauchy_schwartz(1))
+    thus ?thesis by (simp add:algebra_simps power2_eq_square)
+  qed
+
+  note meas_rules = borel_measurable_add borel_measurable_times borel_measurable_diff
+    borel_measurable_power meas_1 meas_2
+
+  have f_int: "integrable (Pi\<^sub>M I M) f"
+    by (intro finite_measure.square_integrable_imp_integrable[OF _ f_meas assms(3)]
+        prob_space.finite_measure prob)
+  moreover have "integrable (Pi\<^sub>M I M) (\<lambda>x. f (restrict x I)) = integrable (Pi\<^sub>M I M) f"
+    by (intro  Bochner_Integration.integrable_cong) (auto simp:space_PiM)
+  ultimately have f_int_2: "integrable (Pi\<^sub>M I M) (\<lambda>x. f (restrict x I))" by simp
+
+  have cong: "(\<integral>x. g (\<lambda>j\<in>I. x (j, h j)) \<partial>?M) = (\<integral>x. g (\<lambda>j. x (j, h j)) \<partial>?M)" (is "?L1 = ?R1")
+    for g :: "_ \<Rightarrow> real" and h (* restricting the argument of g to I does not change the integral *)
+    by (intro Bochner_Integration.integral_cong arg_cong[where f="g"] refl)
+       (auto simp add:space_PiM PiE_def extensional_def restrict_def)
+
+  have lift: "(\<integral>x. g x \<partial>PiM I M) = (\<integral>x. g (\<lambda>j. x (j, h j)) \<partial>?M)" (is "?L1 = ?R1")
+    if "g \<in> borel_measurable (Pi\<^sub>M I M)"
+    for g :: "_ \<Rightarrow> real" and h (* an integral over PiM I M equals the integral over ?M after selecting coordinate (j, h j) for each j *)
+  proof -
+    let ?J = "(\<lambda>i. (i, h i)) ` I"
+    have "?R1 = (\<integral>x. g (\<lambda>j \<in> I. x (j, h j)) \<partial>?M)"
+      by (intro cong[symmetric])
+    also have "... = (\<integral>x. g x \<partial>distr ?M (PiM I (\<lambda>i. (M\<circ>fst) (i, h i))) (\<lambda>x. (\<lambda>j \<in> I. x (j, h j))))"
+      using that
+      by (intro integral_distr[symmetric] measurable_restrict measurable_component_singleton) auto
+    also have "... = (\<integral>x. g x \<partial>PiM I (\<lambda>i. (M \<circ> fst) (i, h i)))"
+      using assms(2)
+      by (intro arg_cong2[where f="integral\<^sup>L"] refl distr_PiM_reindex inj_onI) auto
+    also have "... = ?L1"
+      by auto
+    finally show ?thesis
+      by simp
+  qed
+
+  have lift_int: "integrable ?M (\<lambda>x. g (\<lambda>j. x (j, h j)))" if "integrable (Pi\<^sub>M I M) g"
+    for g :: "_ \<Rightarrow> real" and h (* integrability counterpart of lift *)
+  proof -
+    have 0:"integrable (distr ?M (PiM I (\<lambda>i. (M\<circ>fst) (i, h i))) (\<lambda>x. (\<lambda>j \<in> I. x (j, h j)))) g"
+      using that assms(2) by (subst distr_PiM_reindex) (auto intro:inj_onI)
+    have "integrable ?M (\<lambda>x. g (\<lambda>j\<in>I. x (j, h j)))"
+      by (intro integrable_distr[OF _ 0] measurable_restrict measurable_component_singleton) auto
+    moreover have "integrable ?M (\<lambda>x. g (\<lambda>j\<in>I. x (j, h j))) \<longleftrightarrow> ?thesis"
+      by (intro Bochner_Integration.integrable_cong refl arg_cong[where f="g"] ext)
+       (auto simp:PiE_def space_PiM extensional_def)
+    ultimately show ?thesis
+      by simp
+  qed
+
+  note int_rules = cauchy_schwartz(1) int_1 lift_int assms(3) f_int f_int_2
+
+  have "(\<integral>x. g x \<partial>?M) = (\<integral>x. g (\<lambda>(j,v). x (j, v \<noteq> h j)) \<partial>?M)" (is "?L1 = ?R1")
+    if "g \<in> borel_measurable ?M" for g :: "_ \<Rightarrow> real" and h (* exchanging the False and True coordinates at every j with h j leaves the integral unchanged *)
+  proof -
+    have "?L1 = (\<integral>x. g x \<partial>distr ?M (PiM (I\<times>UNIV) (\<lambda>i. (M \<circ> fst) (fst i, snd i \<noteq> h (fst i))))
+      (\<lambda>x.(\<lambda>i \<in> I\<times>UNIV. x (fst i, snd i \<noteq> h (fst i))) ))"
+      by (subst distr_PiM_reindex) (auto intro:inj_onI assms(2) simp:comp_def)
+    also have "... = (\<integral>x. g (\<lambda>i \<in> I\<times>UNIV. x (fst i, snd i \<noteq> h (fst i))) \<partial>?M)"
+      using that by (intro integral_distr measurable_restrict measurable_component_singleton)
+        (auto simp:comp_def)
+    also have "... = ?R1"
+      by (intro Bochner_Integration.integral_cong refl arg_cong[where f="g"] ext)
+       (auto simp add:space_PiM PiE_def extensional_def restrict_def)
+    finally show ?thesis
+      by simp
+  qed
+
+  hence switch: "(\<integral>x. g x \<partial>?M) = (\<integral>x. h x \<partial>?M)" (* the same fact, in a form convenient for intro *)
+    if "\<And>x. h x = g (\<lambda>(j,v). x (j, v \<noteq> u j))" "g \<in> borel_measurable ?M"
+    for g h :: "_ \<Rightarrow> real" and u
+    using that by simp
+
+  have 1: "(\<integral>x. (?\<sigma> x) * (?\<phi> i x - ?\<phi> (i+1) x) \<partial>?M) \<le> (\<integral>x. (?\<sigma> x - ?\<tau> i x)^2 \<partial>?M) / 2"
+    (is "?L1 \<le> ?R1")
+    if "i < n" for i (* estimate for a single summand of the telescoping sum below *)
+  proof -
+    have "?L1 = (\<integral>x. (?\<tau> i x) * (?\<phi> (i+1) x - ?\<phi> i x) \<partial>?M)" (* exchange the two coordinates at the index j with q j = i *)
+      by (intro switch[of _ _ "(\<lambda>j. q j = i)"] arg_cong2[where f="(*)"]
+            arg_cong2[where f="(-)"] arg_cong[where f="f"] ext meas_rules) (auto intro:arg_cong)
+    hence "?L1 = (?L1 + (\<integral>x. (?\<tau> i x) * (?\<phi> (i+1) x - ?\<phi> i x) \<partial>?M)) / 2" (* average the two equal expressions *)
+      by simp
+    also have "... = (\<integral>x. (?\<sigma> x) * (?\<phi> i x - ?\<phi>(i+1) x) + (?\<tau> i x) * (?\<phi>(i+1) x - ?\<phi> i x) \<partial>?M)/2"
+      by (intro Bochner_Integration.integral_add[symmetric] arg_cong2[where f="(/)"] refl
+          int_rules meas_rules)
+    also have "... = (\<integral>x. (?\<sigma> x - ?\<tau> i x) * (?\<phi> i x - ?\<phi>(i+1) x) \<partial>?M)/2"
+      by (intro arg_cong2[where f="(/)"] Bochner_Integration.integral_cong)
+        (auto simp:algebra_simps)
+    also have "...\<le>((\<integral>x. (?\<sigma> x-?\<tau> i x)^2 \<partial>?M)powr(1/2)*(\<integral>x.(?\<phi> i x-?\<phi>(i+1)x)^2 \<partial>?M) powr (1/2))/2" (* apply cauchy_schwartz *)
+      by (intro divide_right_mono cauchy_schwartz meas_rules int_rules) auto
+    also have "...=((\<integral>x. (?\<sigma> x-?\<tau> i x)^2 \<partial>?M)powr(1/2)*(\<integral>x.(?\<sigma> x-?\<tau> i x)^2 \<partial>?M) powr (1/2))/2" (* exchange coordinates where q j < i so that both factors coincide *)
+      by (intro arg_cong2[where f="(/)"] arg_cong2[where f="(*)"] arg_cong2[where f="(powr)"] refl
+         switch[of _ _ "(\<lambda>j. q j < i)"] arg_cong2[where f="power"] arg_cong2[where f="(-)"]
+         arg_cong[where f="f"] ext meas_rules) (auto intro:arg_cong)
+    also have "... = (\<integral>x. (?\<sigma> x-?\<tau> i x)^2 \<partial>?M)/2"
+      by (simp add:powr_add[symmetric])
+    finally show ?thesis by simp
+  qed
+
+  have "indep_vars (M \<circ> fst) (\<lambda>i \<omega>. \<omega> i) (I \<times> UNIV)" (* all coordinate projections on ?M are independent *)
+    using assms(2) by (intro proj_indep) auto
+  hence 2:"indep_var (Pi\<^sub>M (I\<times>{False}) (M\<circ>fst)) (\<lambda>x. \<lambda>j\<in>I\<times>{False}. x j)
+    (Pi\<^sub>M (I\<times>{True}) (M\<circ>fst)) (\<lambda>x. \<lambda>j\<in>I\<times>{True}. x j)" (* hence the block of False coordinates is independent of the block of True coordinates *)
+    by (intro indep_var_restrict[where I="I \<times> UNIV"]) auto
+  have "indep_var
+    (Pi\<^sub>M I M) ((\<lambda>x. (\<lambda>i \<in> I. x (i, False))) \<circ> (\<lambda>x. (\<lambda>j \<in> I\<times>{False}. x j)))
+    (Pi\<^sub>M I M) ((\<lambda>x. (\<lambda>i \<in> I. x (i, True))) \<circ> (\<lambda>x. (\<lambda>j \<in> I\<times>{True}. x j)))"
+    by (intro indep_var_compose[OF 2] measurable_restrict measurable_PiM_component_rev) auto
+  hence "indep_var (Pi\<^sub>M I M) (\<lambda>x. (\<lambda>j\<in>I. x (j, False))) (Pi\<^sub>M I M) (\<lambda>x. (\<lambda>j\<in>I. x (j, True)))"
+    unfolding comp_def by (simp add:restrict_def cong:if_cong)
+
+  hence "indep_var borel (f \<circ> (\<lambda>x. (\<lambda>j\<in>I. x (j, False)))) borel (f \<circ> (\<lambda>x. (\<lambda>j \<in> I. x (j, True))))"
+    by (intro indep_var_compose[OF _ assms(4,4)]) auto
+  hence indep:"indep_var borel (\<lambda>x. f (\<lambda>j\<in>I. x (j, False))) borel (\<lambda>x. f (\<lambda>j\<in>I. x (j, True)))" (* f of the False block is independent of f of the True block *)
+    by (simp add:comp_def)
+
+  have 3: "\<omega> (j, q j = q i) = \<omega> (j, j = i)" if
+    "\<omega> \<in> PiE (I \<times> UNIV) (\<lambda>i. space (M (fst i)))" "i \<in> I" for i j \<omega> (* on the product space, the test q j = q i may be replaced by j = i *)
+  proof (cases "j \<in> I")
+    case True
+    hence "(q j = q i) = (j = i)" (* q is injective on I *)
+      using that inj_onD[OF bij_betw_imp_inj_on[OF q]] by blast
+    thus ?thesis by simp
+  next
+    case False
+    hence "\<omega> (j, a) = undefined" for a (* outside I the extensional function is undefined for both tags *)
+      using that unfolding PiE_def extensional_def by simp
+    thus ?thesis by simp
+  qed
+
+  have "?L = (\<integral>x. (f x)^2 \<partial>PiM I M) - (\<integral>x. (f x) \<partial>PiM I M)^2" (* variance as second moment minus squared mean *)
+    by (intro prob_space.variance_eq f_int assms(3) prob)
+  also have "... = (\<integral>x. (f x)^2 \<partial>PiM I M) - (\<integral>x. f x \<partial>PiM I M) * (\<integral>x. f x \<partial>PiM I M)"
+    by (simp add:power2_eq_square)
+  also have "... = (\<integral>x. (?\<sigma> x)^2 \<partial>?M) - (\<integral>x. ?\<sigma> x \<partial>?M) * (\<integral>x. ?\<chi> x \<partial>?M)" (* move all integrals to ?M via lift; the second mean uses the True coordinates *)
+    by (intro arg_cong2[where f="(-)"] lift  arg_cong2[where f="(*)"] meas_rules f_meas)
+  also have "... = (\<integral>x. (?\<sigma> x)^2 \<partial>?M)-(\<integral>x. f (\<lambda>j\<in>I. x (j,False)) \<partial>?M)*(\<integral>x. f(\<lambda>j\<in>I. x(j,True)) \<partial>?M)"
+    by (intro arg_cong2[where f="(-)"] arg_cong2[where f="(*)"] cong[symmetric] refl)
+  also have "... = (\<integral>x. (?\<sigma> x)^2 \<partial>?M) - (\<integral>x. f (\<lambda>j\<in>I. x (j,False))* f(\<lambda>j\<in>I. x(j,True))  \<partial>?M)" (* product of the means = mean of the product, by independence *)
+    by (intro arg_cong2[where f="(-)"] indep_var_lebesgue_integral[symmetric] refl int_rules indep)
+  also have "... = (\<integral>x. (?\<sigma> x) * (?\<phi> 0 x) \<partial>?M) - (\<integral>x. (?\<sigma> x) * (?\<phi> n x)  \<partial>?M)" (* rewrite both terms using ?phi at 0 and at n *)
+    using bij_betw_apply[OF q] by (intro arg_cong2[where f="(-)"] arg_cong2[where f="(*)"] ext
+        arg_cong[where f="f"] Bochner_Integration.integral_cong)
+     (auto simp:space_PiM power2_eq_square PiE_def extensional_def)
+  also have "... = (\<Sum>i < n. (\<integral>x. (?\<sigma> x) *  (?\<phi> i x)  \<partial>?M) -  (\<integral>x. (?\<sigma> x) *  (?\<phi> (Suc i) x) \<partial>?M))" (* telescoping sum *)
+    unfolding power2_eq_square by (intro sum_lessThan_telescope'[symmetric])
+  also have "... = (\<Sum>i < n. (\<integral>x. (?\<sigma> x) *  (?\<phi> i x) - (?\<sigma> x) *  (?\<phi> (Suc i) x) \<partial>?M))"
+    by (intro sum.cong Bochner_Integration.integral_diff[symmetric] int_rules meas_rules) auto
+  also have "... = (\<Sum>i < n. (\<integral>x. (?\<sigma> x) * (?\<phi> i x - ?\<phi> (i+1) x) \<partial>?M))"
+    by (simp_all add:power2_eq_square algebra_simps)
+  also have "... \<le> (\<Sum>i< n. ((\<integral>x. (?\<sigma> x - ?\<tau> i x)^2 \<partial>?M)) / 2)" (* apply estimate 1 to every summand *)
+    by (intro sum_mono 1) auto
+  also have "... = (\<Sum>i \<in> I. ((\<integral>x. (f (\<lambda>j. x (j,False)) - f (\<lambda>j. x (j,q j=q i)))^2 \<partial>?M))/ 2)" (* reindex the sum from {..<n} to I along q *)
+    by (intro sum.reindex_bij_betw[OF q, symmetric])
+  also have "... = (\<Sum>i \<in> I. ((\<integral>x. (f (\<lambda>j. x (j,False)) -  f (\<lambda>j. x (j,q j=q i)))^2 \<partial>?M)))/2"
+    unfolding sum_divide_distrib[symmetric] by simp
+  also have "... = ?R" (* replace q j = q i by j = i using fact 3 *)
+    using inj_onD[OF bij_betw_imp_inj_on[OF q]]
+    by (intro arg_cong2[where f="(/)"] arg_cong2[where f="(-)"]  arg_cong2[where f="power"]
+          arg_cong[where f="f"] Bochner_Integration.integral_cong sum.cong refl ext 3)
+     (auto  simp add:space_PiM )
+  finally show ?thesis
+    by simp
+qed
+
+theorem (in prob_space) efron_stein_inequality_classic: (* Efron-Stein inequality for random variables X (i, b) on M; derived from efron_stein_inequality_distr *)
+  fixes f :: "_ \<Rightarrow> real"
+  assumes "finite I"
+  assumes "indep_vars (M' \<circ> fst) X (I \<times> (UNIV :: bool set))" (* all variables X (i, b), for i in I and both tags b, are independent *)
+  assumes "f \<in> borel_measurable (PiM I M')"
+  assumes "integrable M (\<lambda>\<omega>. f (\<lambda>i\<in>I. X (i,False) \<omega>)^2)"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> distr M (M' i) (X (i, True)) = distr M (M' i) (X (i, False))" (* X (i, True) has the same distribution as X (i, False) *)
+  shows "variance (\<lambda>\<omega>. f (\<lambda>i\<in>I. X (i,False) \<omega>)) \<le>
+    (\<Sum>j \<in> I. expectation (\<lambda>\<omega>. (f (\<lambda>i\<in>I. X (i,False) \<omega>) - f (\<lambda>i\<in>I. X (i, i=j) \<omega>))^2))/2"
+    (is "?L \<le> ?R")
+proof -
+  let ?D = "distr M (PiM I M') (\<lambda>\<omega>. \<lambda>i\<in>I. X (i, False) \<omega>)" (* joint distribution of the variables tagged False *)
+
+  let ?M = "PiM I (\<lambda>i. distr M (M' i) (X (i,False)))" (* product of their marginal distributions *)
+  let ?N = "PiM (I \<times> (UNIV::bool set)) ((\<lambda>i. distr M (M' i) (X (i,False))) \<circ> fst)" (* the same marginals, indexed by I x bool *)
+
+  have rv: "random_variable (M' i) (X (i, j))" if "i \<in> I" for i j
+    using assms(2) that unfolding indep_vars_def by auto
+
+  have proj_meas: "(\<lambda>x j. x (j, h j)) \<in> Pi\<^sub>M (I \<times> UNIV) (M' \<circ> fst) \<rightarrow>\<^sub>M Pi\<^sub>M I M'"
+    for h :: " _ \<Rightarrow> bool" (* selecting coordinate (j, h j) for each j is measurable *)
+  proof -
+    have "?thesis \<longleftrightarrow> (\<lambda>x. (\<lambda>j \<in> I. x (j, h j))) \<in> Pi\<^sub>M (I \<times> UNIV) (M' \<circ> fst) \<rightarrow>\<^sub>M Pi\<^sub>M I M'"
+      by (intro measurable_cong) (auto simp:space_PiM PiE_def extensional_def)
+    also have "... \<longleftrightarrow> True"
+      unfolding eq_True
+      by (intro measurable_restrict measurable_PiM_component_rev) auto
+    finally show ?thesis by simp
+  qed
+
+  note meas_rules = borel_measurable_add borel_measurable_times borel_measurable_diff proj_meas
+    borel_measurable_power assms(3) measurable_restrict measurable_compose[OF _ assms(3)]
+
+  have "indep_vars ((M' \<circ> fst) \<circ> (\<lambda>i. (i, False))) (\<lambda>i. X (i, False)) I" (* independence of the variables tagged False, by reindexing *)
+    by (intro indep_vars_reindex indep_vars_subset[OF assms(2)] inj_onI) auto
+  hence "indep_vars M' (\<lambda>i. X (i, False)) I" by (simp add: comp_def)
+  hence 0:"?D = PiM I (\<lambda>i. distr M (M' i) (X (i,False)))" (* so their joint distribution is the product of the marginals *)
+    by (intro iffD1[OF indep_vars_iff_distr_eq_PiM''] rv)
+
+  have "distr M (M' (fst x)) (X (fst x, False)) = distr M (M' (fst x)) (X x)"
+    if "x \<in> I \<times> UNIV" for x (* for either tag, X x has the distribution of the variable tagged False *)
+    using that assms(5) by (cases x, cases "snd x") auto
+
+  hence 1: "?N = PiM (I \<times> UNIV) (\<lambda>i. distr M ((M' \<circ> fst) i) (X i))"
+    using assms(3) by (intro PiM_cong refl) (simp add:comp_def)
+  also have "... = distr M (PiM (I \<times> UNIV) (M' \<circ> fst)) (\<lambda>x. \<lambda>i\<in>I \<times> UNIV. X i x)"
+    using rv by (intro iffD1[OF indep_vars_iff_distr_eq_PiM'', symmetric] assms(2)) auto
+  finally have 2:"?N = distr M (PiM (I \<times> UNIV) (M' \<circ> fst)) (\<lambda>x. \<lambda>i\<in>I \<times> UNIV. X i x)" (* ?N is the joint distribution of all X *)
+    by simp
+
+  have 3: "integrable (Pi\<^sub>M I (\<lambda>i. distr M (M' i) (X (i, False)))) (\<lambda>x. (f x)\<^sup>2)"
+    unfolding 0[symmetric] by (intro iffD2[OF integrable_distr_eq] meas_rules assms rv)
+
+  have "?L = (\<integral>x. (f x - expectation (\<lambda>\<omega>. f (\<lambda>i\<in>I. X (i,False) \<omega>)))^2 \<partial>?D)" (* write the variance as an integral over ?D *)
+    using rv by (intro integral_distr[symmetric] meas_rules measurable_restrict) auto
+  also have "... = prob_space.variance ?D f"
+    by (intro arg_cong[where f="integral\<^sup>L ?D"] arg_cong2[where f="(-)"] arg_cong2[where f="power"]
+        refl ext integral_distr[symmetric] measurable_restrict rv assms(3))
+  also have "... = prob_space.variance ?M f"
+    unfolding 0 by simp
+  also have "... \<le> (\<Sum>i\<in>I. (\<integral>x. (f (\<lambda>j. x (j, False)) - f (\<lambda>j. x (j, j = i)))^2 \<partial>?N)) / 2" (* the product-measure version of the inequality *)
+    using assms(3) by (intro efron_stein_inequality_distr prob_space_distr rv assms(1) 3) auto
+  also have "... = (\<Sum>i\<in>I. expectation (\<lambda>\<omega>. (f (\<lambda>j. (\<lambda>i\<in>I\<times>UNIV. X i \<omega>) (j, False)) -
+    f (\<lambda>j. (\<lambda>i\<in>I\<times>UNIV. X i \<omega>) (j, j=i)))\<^sup>2)) / 2" (* rewrite the integrals over ?N as expectations over M, using fact 2 *)
+    using rv unfolding 2
+    by (intro sum.cong arg_cong2[where f="(/)"] integral_distr refl meas_rules) auto
+  also have "... = ?R"
+    by (simp add:restrict_def)
+  finally show ?thesis
+    by simp
+qed
+
+end
\ No newline at end of file
diff --git a/thys/Concentration_Inequalities/McDiarmid_Inequality.thy b/thys/Concentration_Inequalities/McDiarmid_Inequality.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/McDiarmid_Inequality.thy
@@ -0,0 +1,777 @@
+section \<open>McDiarmid's inequality\<close>
+
+text \<open>In this section we verify McDiarmid's inequality \cite[Lemma 1.2]{mcdiarmid1989}. The
+source, as well as further sources, sometimes refer to the result as the ``independent bounded
+differences'' inequality.\<close>
+
+theory McDiarmid_Inequality
+  imports Concentration_Inequalities_Preliminary
+begin
+
+lemma Collect_restr_cong: (* congruence rule for set comprehensions restricted to a carrier set *)
+  assumes "A = B" (* the carrier sets coincide *)
+  assumes "\<And>x. x \<in> A \<Longrightarrow> P x = Q x" (* the predicates only have to agree on members of A *)
+  shows "{x \<in> A. P x} = {x \<in> B. Q x}"
+  using assms by auto
+
+lemma ineq_chain: (* chains n single-step inequalities into one inequality between h n and h 0 *)
+  fixes h :: "nat \<Rightarrow> real"
+  assumes "\<And>i. i < n \<Longrightarrow> h (i+1) \<le> h i" (* only the steps with i < n are required *)
+  shows "h n \<le> h 0"
+  using assms by (induction n) force+ (* induction on the chain length n *)
+
+lemma restrict_subset_eq: (* equal restrictions to B stay equal when restricting to a subset A *)
+  assumes "A \<subseteq> B"
+  assumes "restrict f B = restrict g B" (* f and g agree after restriction to the larger set B *)
+  shows "restrict f A = restrict g A"
+  using assms unfolding restrict_def by (meson subsetD)
+
+text \<open>Bochner Integral version of Hoeffding's Lemma using
+  @{thm [source] interval_bounded_random_variable.Hoeffdings_lemma_nn_integral_0}\<close>
+
+lemma (in prob_space) Hoeffdings_lemma_bochner: (* Hoeffding's lemma stated for the Bochner integral *)
+  assumes "l > 0" and E0: "expectation f = 0" (* positive parameter l and centered f *)
+  assumes "random_variable borel f"
+  assumes "AE x in M. f x \<in> {a..b::real}" (* f lies in the interval from a to b almost everywhere *)
+  shows   "expectation (\<lambda>x. exp (l * f x)) \<le> exp (l\<^sup>2 * (b - a)\<^sup>2 / 8)" (is "?L \<le> ?R")
+proof -
+  interpret interval_bounded_random_variable M f a b (* Hoeffdings_lemma_nn_integral_0 is used below *)
+    using assms by (unfold_locales) auto
+
+  have "integrable M (\<lambda>x. exp (l * f x))" (* integrable because of the constant bound B given below *)
+    using assms(1,3,4) by (intro integrable_const_bound[where B="exp (l * b)"]) simp_all
+
+  hence "ennreal (?L) = (\<integral>\<^sup>+ x. exp (l * f x) \<partial>M)" (* rewrite ?L as a non-negative integral *)
+    by (intro nn_integral_eq_integral[symmetric]) auto
+  also have "... \<le> ennreal (?R)" (* the non-negative integral version of the lemma *)
+    by (intro Hoeffdings_lemma_nn_integral_0 assms)
+  finally have 0:"ennreal (?L) \<le> ennreal ?R"
+    by simp
+  show ?thesis
+  proof (cases "?L \<ge> 0") (* fact 0 is only used for non-negative ?L *)
+    case True
+    thus ?thesis using 0 by simp
+  next
+    case False (* a negative ?L is at most 0, which is at most ?R *)
+    hence "?L \<le> 0" by simp
+    also have "... \<le> ?R" by simp
+    finally show ?thesis by simp
+  qed
+qed
+
+lemma (in prob_space) Hoeffdings_lemma_bochner_2: (* variant with an oscillation bound c instead of an interval *)
+  assumes "l > 0" and E0: "expectation f = 0"
+  assumes "random_variable borel f"
+  assumes "\<And>x y. {x,y} \<subseteq> space M \<Longrightarrow> \<bar>f x - f y\<bar> \<le> (c::real)" (* any two values of f differ by at most c *)
+  shows   "expectation (\<lambda>x. exp (l * f x)) \<le> exp (l^2 * c^2 / 8)" (is "?L \<le> ?R")
+proof -
+  define a :: real where "a = (INF x \<in> space M. f x)" (* infimum of f over the sample space *)
+  define b :: real where "b = a+c" (* shown below to be an upper bound of f *)
+
+  obtain \<omega> where \<omega>:"\<omega> \<in> space M" using not_empty by auto (* some point of the sample space *)
+  hence 0:"f ` space M \<noteq> {}" by auto
+  have 1: "c = b - a" unfolding b_def by simp
+
+  have "bdd_below (f ` space M)" (* the value of f at the chosen point minus c is a lower bound *)
+    using \<omega> assms(4) unfolding abs_le_iff
+    by (intro bdd_belowI[where m="f \<omega> - c"]) (auto simp add:algebra_simps)
+  hence "f x \<ge> a" if "x \<in> space M" for x unfolding a_def by (intro cINF_lower that)
+  moreover have "f x \<le> b" if x_space: "x \<in> space M" for x
+  proof (rule ccontr) (* if f x exceeded a + c, then f x - c would be a lower bound above the infimum a *)
+    assume "\<not>(f x \<le> b)"
+    hence a:"f x > a + c" unfolding b_def by simp
+    have "f y \<ge> f x - c" if "y \<in> space M" for y
+      using that x_space assms(4) unfolding abs_le_iff by (simp add:algebra_simps)
+    hence "f x - c \<le> a" unfolding a_def using cInf_greatest[OF 0] by auto
+    thus "False" using a by simp
+  qed
+  ultimately have "f x \<in> {a..b}" if "x \<in> space M" for x using that by auto
+  hence "AE x in M. f x \<in> {a..b}" by simp
+  thus ?thesis unfolding 1 by (intro Hoeffdings_lemma_bochner assms(1,2,3)) (* c is rewritten as b - a *)
+qed
+
+lemma (in prob_space) Hoeffdings_lemma_bochner_3: (* Hoeffdings_lemma_bochner_2 without the assumption l > 0 *)
+  assumes "expectation f = 0"
+  assumes "random_variable borel f"
+  assumes "\<And>x y. {x,y} \<subseteq> space M \<Longrightarrow> \<bar>f x - f y\<bar> \<le> (c::real)"
+  shows   "expectation (\<lambda>x. exp (l * f x)) \<le> exp (l^2 * c^2 / 8)" (is "?L \<le> ?R")
+proof -
+  consider (a) "l > 0" | (b) "l = 0" | (c) "l < 0" (* case split on the sign of l *)
+    by argo
+  then show ?thesis
+  proof (cases)
+    case a thus ?thesis by (intro Hoeffdings_lemma_bochner_2 assms) auto
+  next
+    case b thus ?thesis by simp
+  next
+    case c (* negative l: apply the positive case to the negated parameter and the negated function *)
+    have "?L = expectation (\<lambda>x. exp ((-l) * (-f x)))" by simp
+    also have "... \<le> exp ((-l)^2 * c\<^sup>2/8)" using c assms by (intro Hoeffdings_lemma_bochner_2) auto
+    also have "... = ?R" by simp
+    finally show ?thesis by simp
+  qed
+qed
+
+text \<open>Version of @{thm [source] product_sigma_finite.product_integral_singleton} that only
+requires @{term "M i"} to be sigma finite for the index @{term "i"} of the singleton set:\<close>
+
+lemma product_integral_singleton: (* integral over the one-index product reduces to the integral over M i *)
+  fixes f :: "_ \<Rightarrow> _::{banach, second_countable_topology}"
+  assumes "sigma_finite_measure (M i)" (* sigma-finiteness is assumed for the single index i only *)
+  assumes "f \<in> borel_measurable (M i)"
+  shows "(\<integral>x. f (x i) \<partial>(PiM {i} M)) = (\<integral>x. f x \<partial>(M i))" (is "?L = ?R")
+proof -
+  define M' where "M' j = (if j=i then M i else count_space {undefined})" for j (* equals M at index i *)
+
+  interpret product_sigma_finite "M'" (* every component of M' is sigma finite *)
+    using assms(1) unfolding product_sigma_finite_def M'_def
+    by (auto intro!:sigma_finite_measure_count_space_finite)
+
+  have "?L = \<integral>x. f (x i) \<partial>(PiM {i} M')" (* replace M by M' *)
+    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
+  also have "... = (\<integral>x. f x \<partial>(M' i))" (* presumably the fact of the same name from the interpretation *)
+    using assms(2) by (intro product_integral_singleton) (simp add:M'_def)
+  also have "... = ?R" (* replace M' by M again *)
+    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
+  finally show ?thesis by simp
+qed
+
+text \<open>Version of @{thm [source] product_sigma_finite.product_integral_fold} that only
+requires @{term "M i"} to be sigma finite for the indices @{term "i"} in the two index sets:\<close>
+
+lemma product_integral_fold: (* iterated integration over a product indexed by two disjoint finite sets *)
+  fixes f :: "_ \<Rightarrow> _::{banach, second_countable_topology}"
+  assumes "\<And>i. i \<in> I \<union> J \<Longrightarrow> sigma_finite_measure (M i)" (* only indices in the two sets matter *)
+  assumes "I \<inter> J = {}"
+  assumes "finite I"
+  assumes "finite J"
+  assumes "integrable (PiM (I \<union> J) M) f"
+  shows "(\<integral>x. f x \<partial>PiM (I \<union> J) M) = (\<integral>x. (\<integral>y. f (merge I J(x,y)) \<partial>PiM J M) \<partial>PiM I M)" (is "?L = ?R")
+    and "integrable (PiM I M) (\<lambda>x. (\<integral>y. f (merge I J(x,y)) \<partial>PiM J M))" (is "?I")
+    and "AE x in PiM I M. integrable (PiM J M) (\<lambda>y. f (merge I J(x,y)))" (is "?T")
+proof -
+  define M' where "M' i = (if i \<in> I \<union> J then M i else count_space {undefined})" for i (* equals M on both sets *)
+
+  interpret product_sigma_finite "M'" (* every component of M' is sigma finite *)
+    using assms(1) unfolding product_sigma_finite_def M'_def
+    by (auto intro!:sigma_finite_measure_count_space_finite)
+
+  interpret pair_sigma_finite "Pi\<^sub>M I M'" "Pi\<^sub>M J M'" (* needed for integrable_fst' and AE_integrable_fst' below *)
+    using assms(3,4) sigma_finite unfolding pair_sigma_finite_def by blast
+
+  have 0: "integrable (Pi\<^sub>M (I \<union> J) M') f = integrable (Pi\<^sub>M (I \<union> J) M) f" (* M' and M are interchangeable here *)
+    by (intro Bochner_Integration.integrable_cong PiM_cong) (simp_all add:M'_def)
+
+  have "?L = (\<integral>x. f x \<partial>PiM (I \<union> J) M')" (* first conclusion: replace M by M' *)
+    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
+  also have "... = (\<integral>x. (\<integral>y. f (merge I J (x,y)) \<partial>PiM J M') \<partial>PiM I M')" (* presumably the interpreted locale fact *)
+    using assms(5) by (intro product_integral_fold assms(2,3,4)) (simp add:0)
+  also have "... = ?R" (* replace M' by M again *)
+    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
+  finally show "?L = ?R" by simp
+
+  have "integrable (Pi\<^sub>M (I \<union> J) M') f = integrable (PiM I M' \<Otimes>\<^sub>M PiM J M') (\<lambda>x. f (merge I J x))"
+    using assms(5) apply (subst distr_merge[OF assms(2,3,4),symmetric])
+    by (intro integrable_distr_eq) (simp_all add:0[symmetric])
+  hence 1:"integrable (PiM I M' \<Otimes>\<^sub>M PiM J M') (\<lambda>x. f (merge I J x))" (* integrability on the pair measure *)
+    using assms(5) 0 by simp
+
+  hence "integrable (PiM I M') (\<lambda>x. (\<integral>y. f (merge I J(x,y)) \<partial>PiM J M'))" (is "?I'") (* second conclusion for M' *)
+    by (intro integrable_fst') auto
+  moreover have "?I' = ?I"
+    by (intro Bochner_Integration.integrable_cong PiM_cong ext Bochner_Integration.integral_cong)
+     (simp_all add:M'_def)
+  ultimately show "?I"
+    by simp
+
+  have "AE x in Pi\<^sub>M I M'. integrable (Pi\<^sub>M J M') (\<lambda>y. f (merge I J (x, y)))" (is "?T'") (* third conclusion for M' *)
+    by (intro AE_integrable_fst'[OF 1])
+  moreover have "?T' = ?T"
+    by (intro arg_cong2[where f="almost_everywhere"] PiM_cong ext Bochner_Integration.integrable_cong)
+     (simp_all add:M'_def)
+  ultimately show  "?T"
+    by simp
+qed
+
+lemma product_integral_insert: (* splits off the index i; the outer integral is taken over M i *)
+  fixes f :: "_ \<Rightarrow> _::{banach, second_countable_topology}"
+  assumes "\<And>k. k \<in> {i} \<union> J \<Longrightarrow> sigma_finite_measure (M k)"
+  assumes "i \<notin> J"
+  assumes "finite J"
+  assumes "integrable (PiM (insert i J) M) f"
+  shows "(\<integral>x. f x \<partial>PiM (insert i J) M) = (\<integral>x. (\<integral>y. f (y(i := x)) \<partial>PiM J M) \<partial>M i)" (is "?L = ?R")
+proof -
+  note meas_cong = iffD1[OF measurable_cong] (* transfers measurability between functions equal on the space *)
+
+  have "integrable (PiM {i} M) (\<lambda>x. (\<integral>y. f (merge {i} J (x,y)) \<partial>PiM J M))"
+    using assms by (intro product_integral_fold) auto
+  hence 0:"(\<lambda>x. (\<integral>y. f (merge {i} J (x,y)) \<partial>PiM J M)) \<in> borel_measurable (PiM {i} M)"
+    using borel_measurable_integrable by simp
+  have 1:"(\<lambda>x. (\<integral>y. f (y(i := (x i))) \<partial>PiM J M)) \<in> borel_measurable (PiM {i} M)" (* merge written as update *)
+    by (intro meas_cong[OF _ 0] Bochner_Integration.integral_cong arg_cong[where f="f"])
+     (auto simp add:space_PiM merge_def fun_upd_def PiE_def extensional_def)
+  have "(\<lambda>x. (\<integral>y. f (y(i := (\<lambda>i\<in>{i}. x) i)) \<partial>PiM J M)) \<in> borel_measurable (M i)"
+    by (intro measurable_compose[OF _ 1, where f="(\<lambda>x. (\<lambda>i\<in>{i}. x))"] measurable_restrict) auto
+  hence 2:"(\<lambda>x. (\<integral>y. f (y(i := x )) \<partial>PiM J M)) \<in> borel_measurable (M i)" by simp (* used in the last step *)
+
+  have "?L = (\<integral>x. f x \<partial>PiM ({i} \<union> J) M)" by simp
+  also have "... = (\<integral>x. (\<integral>y. f (merge {i} J (x,y)) \<partial>PiM J M) \<partial>PiM {i} M)" (* fold with index sets {i} and J *)
+    using assms(2,4) by (intro product_integral_fold assms(1,3)) auto
+  also have "... = (\<integral>x. (\<integral>y. f (y(i := (x i))) \<partial>PiM J M) \<partial>PiM {i} M)"
+    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"])
+     (auto simp add:space_PiM merge_def fun_upd_def PiE_def extensional_def)
+  also have "... = ?R" (* the outer one-index product collapses to M i *)
+    using assms(1,4) by (intro product_integral_singleton assms(1) 2) auto
+  finally show ?thesis by simp
+qed
+
+lemma product_integral_insert_rev: (* splits off the index i; here the inner integral is taken over M i *)
+  fixes f :: "_ \<Rightarrow> _::{banach, second_countable_topology}"
+  assumes "\<And>k. k \<in> {i} \<union> J \<Longrightarrow> sigma_finite_measure (M k)"
+  assumes "i \<notin> J"
+  assumes "finite J"
+  assumes "integrable (PiM (insert i J) M) f"
+  shows "(\<integral>x. f x \<partial>PiM (insert i J) M) = (\<integral>y. (\<integral>x. f (y(i := x)) \<partial>M i) \<partial>PiM J M)" (is "?L = ?R")
+proof -
+  have "?L = (\<integral>x. f x \<partial>PiM (J \<union> {i}) M)" by simp
+  also have "... = (\<integral>x. (\<integral>y. f (merge J {i} (x,y)) \<partial>PiM {i} M) \<partial>PiM J M)" (* fold with index sets J and {i} *)
+    using assms(2,4) by (intro product_integral_fold assms(1,3)) auto
+  also have "... = (\<integral>x. (\<integral>y. f (x(i := (y i))) \<partial>PiM {i} M) \<partial>PiM J M)" (* merge written as update *)
+    unfolding merge_singleton[OF assms(2)]
+    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"])
+     (metis PiE_restrict assms(2) restrict_upd space_PiM)
+  also have "... = ?R" (* the inner one-index product collapses to M i *)
+    using assms(1,4) by (intro Bochner_Integration.integral_cong product_integral_singleton) auto
+  finally show ?thesis by simp
+qed
+
+lemma merge_empty[simp]: (* merge with one empty index set is restriction of the other component *)
+  "merge {} I (y,x) = restrict x I"
+  "merge I {} (y,x) = restrict y I"
+  unfolding merge_def restrict_def by auto
+
+lemma merge_cong: (* merge depends on its two components only through their restrictions to I and J *)
+  assumes "restrict x1 I = restrict x2 I"
+  assumes "restrict y1 J = restrict y2 J"
+  shows "merge I J (x1,y1) = merge I J (x2,y2)"
+  using assms unfolding merge_def restrict_def
+  by (intro ext) (smt (verit, best) case_prod_conv)
+
+lemma restrict_merge: (* restricting a merge to K equals merging over both index sets intersected with K *)
+  "restrict (merge I J x) K = merge (I \<inter> K) (J \<inter> K) x"
+  unfolding restrict_def merge_def by (intro ext) (auto simp:case_prod_beta)
+
+lemma map_prod_measurable: (* map_prod of two measurable maps is measurable between the pair measures *)
+  assumes "f \<in> M \<rightarrow>\<^sub>M M'"
+  assumes "g \<in> N \<rightarrow>\<^sub>M N'"
+  shows "map_prod f g \<in> M \<Otimes>\<^sub>M N \<rightarrow>\<^sub>M M' \<Otimes>\<^sub>M N'"
+  using assms by (subst measurable_pair_iff) simp
+
+lemma mc_diarmid_inequality_aux:
+  fixes f :: "(nat \<Rightarrow> 'a) \<Rightarrow> real"
+  fixes n :: nat
+  assumes "\<And>i. i < n \<Longrightarrow> prob_space (M i)"
+  assumes "\<And>i x y. i<n \<Longrightarrow> {x,y} \<subseteq> space (PiM {..<n} M) \<Longrightarrow> (\<forall>j\<in>{..<n}-{i}. x j=y j) \<Longrightarrow> \<bar>f x-f y\<bar>\<le>c i"
+  assumes f_meas: "f \<in> borel_measurable (PiM {..<n} M)" and \<epsilon>_gt_0: "\<epsilon> >0"
+  shows "\<P>(\<omega> in PiM {..<n} M. f \<omega> - (\<integral>\<xi>. f \<xi> \<partial>PiM {..<n} M) \<ge> \<epsilon>) \<le> exp (-(2*\<epsilon>^2)/(\<Sum>i<n. (c i)^2))"
+    (is "?L \<le> ?R")
+proof -
+  define h where "h k = (\<lambda>\<xi>. (\<integral>\<omega>. f (merge {..<k} {k..<n} (\<xi>, \<omega>)) \<partial>PiM {k..<n} M))" for k
+
+  define t :: real where "t = 4 * \<epsilon> / (\<Sum>i<n. (c i)^2)"
+
+  define V where "V i \<xi> = h (Suc i) \<xi> - h i \<xi>" for i \<xi>
+
+  obtain x0 where x0:"x0 \<in> space (PiM {..<n} M)"
+    using prob_space.not_empty[OF prob_space_PiM] assms(1) by fastforce
+
+  have delta: "\<bar>f x - f y\<bar> \<le> c i" if "i < n"
+    "x \<in> PiE {..<n} (\<lambda>i. space (M i))" "y \<in> PiE {..<n} (\<lambda>i. space (M i))"
+    "restrict x ({..<n}-{i}) = restrict y ({..<n}-{i})"
+  for x y i
+  proof (rule assms(2)[OF that(1)], goal_cases)
+    case 1
+    then show ?case using that(2,3) unfolding space_PiM by auto
+  next
+    case 2
+    then show ?case using that(4) by (intro ballI) (metis restrict_apply')
+  qed
+
+  have c_ge_0: "c j \<ge> 0" if "j < n" for j
+  proof -
+    have "0 \<le> \<bar>f x0 - f x0\<bar>" by simp
+    also have "... \<le> c j" using x0 unfolding space_PiM by (intro delta that) auto
+    finally show ?thesis by simp
+  qed
+  hence sum_c_ge_0: "(\<Sum>i<n. (c i)^2) \<ge> 0" by (meson sum_nonneg zero_le_power2)
+
+  hence t_ge_0: "t \<ge> 0" using \<epsilon>_gt_0 unfolding t_def by simp
+
+  note borel_rules =
+    borel_measurable_sum measurable_compose[OF _ borel_measurable_exp]
+    borel_measurable_times
+
+  note int_rules =
+    prob_space_PiM assms(1) borel_rules
+    prob_space.integrable_bounded bounded_intros
+  have h_n: "h n \<xi> = f \<xi>" if "\<xi> \<in> space (PiM {..<n} M)" for \<xi>
+  proof -
+    have "h n \<xi> = (\<integral>\<omega>. f (\<lambda>i\<in>{..<n}. \<xi> i) \<partial>PiM {} M)"
+      unfolding h_def using leD
+      by (intro Bochner_Integration.integral_cong PiM_cong arg_cong[where f="f"] restrict_cong)
+       auto
+    also have "... = f (restrict \<xi> {..<n})"
+      unfolding PiM_empty by simp
+    also have "... = f \<xi>"
+      using that unfolding space_PiM PiE_def
+      by (simp add: extensional_restrict)
+    finally show ?thesis
+      by simp
+  qed
+
+  have h_0: "h 0 \<xi> = (\<integral>\<omega>. f \<omega> \<partial>PiM {..<n} M)" for \<xi>
+    unfolding h_def by (intro Bochner_Integration.integral_cong PiM_cong refl)
+     (simp_all add:space_PiM atLeast0LessThan)
+
+  have h_cong: "h j \<omega> = h j \<xi>" if "restrict \<omega> {..<j} = restrict \<xi> {..<j}" for j \<omega> \<xi>
+    using that unfolding h_def
+    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"] merge_cong) auto
+
+  have h_meas: "h i \<in> borel_measurable (PiM I M)" if "i \<le> n" "{..<i} \<subseteq> I" for i I
+  proof -
+    have 0: "{..<n} = {..<i} \<union> {i..<n}"
+      using that(1) by auto
+
+    have 1: "merge {..<i} {i..<n} = merge {..<i} {i..<n} \<circ> map_prod (\<lambda>x. restrict x {..<i}) id"
+      unfolding merge_def map_prod_def restrict_def comp_def
+      by (intro ext) (auto simp:case_prod_beta')
+
+    have "merge {..<i} {i..<n} \<in> Pi\<^sub>M I M \<Otimes>\<^sub>M Pi\<^sub>M {i..<n} M \<rightarrow>\<^sub>M Pi\<^sub>M {..<n} M"
+      unfolding 0 by (subst 1) (intro measurable_comp[OF _ measurable_merge] map_prod_measurable
+          measurable_ident measurable_restrict_subset that(2))
+    hence "(\<lambda>x. f (merge {..<i} {i..<n} x)) \<in> borel_measurable (Pi\<^sub>M I M \<Otimes>\<^sub>M Pi\<^sub>M {i..<n} M)"
+      by (intro measurable_compose[OF _ f_meas])
+    thus ?thesis
+      unfolding h_def by (intro sigma_finite_measure.borel_measurable_lebesgue_integral
+            prob_space_imp_sigma_finite prob_space_PiM assms(1)) (auto simp:case_prod_beta')
+  qed
+
+  have merge_space_aux:"merge {..<j} {j..<n} u \<in> (\<Pi>\<^sub>E i\<in>{..<n}. space (M i))"
+    if "j \<le> n" "fst u \<in> Pi {..<j} (\<lambda>i. space (M i))" "snd u \<in> Pi {j..<n} (\<lambda>i. space (M i))"
+    for u  j
+  proof -
+    have "merge {..<j} {j..<n} (fst u, snd u) \<in> (PiE ({..<j} \<union> {j..<n}) (\<lambda>i. space (M i)))"
+      using that by (intro iffD2[OF PiE_cancel_merge]) auto
+    also have "... =  (\<Pi>\<^sub>E i\<in>{..<n}. space (M i))"
+      using that by (intro arg_cong2[where f="PiE"] refl) auto
+    finally show ?thesis by simp
+  qed
+
+  have merge_space:"merge {..<j} {j..<n} (u, v) \<in> (\<Pi>\<^sub>E i\<in>{..<n}. space (M i))"
+    if "j \<le> n" "u \<in> PiE {..<j} (\<lambda>i. space (M i))" "v \<in> PiE {j..<n} (\<lambda>i. space (M i))"
+    for u v j
+    using that by (intro merge_space_aux) (simp_all add:PiE_def)
+
+  have delta': "\<bar>f x - f y\<bar> \<le> (\<Sum>i<n. c i)"
+    if "x \<in> PiE {..<n} (\<lambda>i. space (M i))" "y \<in> PiE {..<n} (\<lambda>i. space (M i))" for x y
+  proof -
+    define m where "m i = merge {..<i} {i..<n} (x,y)" for i
+
+    have 0: "z \<in> Pi I (\<lambda>i. space (M i))" if "z \<in> PiE {..<n} (\<lambda>i. space (M i))"
+       "I \<subseteq> {..<n}" for z I
+      using that unfolding PiE_def by auto
+
+    have 3: "{..<Suc i} \<inter> ({..<n} - {i}) = {..<i}"
+      "{Suc i..<n} \<inter> ({..<n} - {i}) = {Suc i..<n}"
+      "{..<i} \<inter> ({..<n} - {i}) = {..<i}"
+      "{i..<n} \<inter> ({..<n} - {i}) = {Suc i..<n}"
+      if "i < n" for i
+      using that by auto
+
+    have "\<bar>f x - f y\<bar> = \<bar>f (m n) - f(m 0)\<bar>"
+      using that unfolding m_def by (simp add:atLeast0LessThan)
+    also have "... = \<bar>\<Sum>i < n. f (m (Suc i)) - f (m i)\<bar>"
+      by (subst sum_lessThan_telescope) simp
+    also have "... \<le> (\<Sum>i < n. \<bar>f (m (Suc i)) - f (m i)\<bar>)"
+      by simp
+    also have "... \<le> (\<Sum>i < n. c i)"
+      using that unfolding m_def by (intro delta sum_mono merge_space_aux 0 subsetI)
+       (simp_all add:restrict_merge 3)
+    finally show ?thesis
+      by simp
+  qed
+
+  have "norm (f x) \<le> norm (f x0) + sum c {..<n}" if "x \<in> space (Pi\<^sub>M {..<n} M)" for x
+  proof -
+    have "\<bar>f x - f x0\<bar> \<le> sum c {..<n}"
+      using x0 that unfolding space_PiM by (intro delta') auto
+    thus ?thesis
+      by simp
+  qed
+  hence f_bounded: "bounded (f ` space (PiM {..<n} M))"
+    by (intro boundedI[where B="norm (f x0) + (\<Sum>i<n. c i)"]) auto
+
+  have f_merge_bounded:
+    "bounded ((\<lambda>\<omega>. (f (merge {..<j} {j..<n} (u, \<omega>)))) ` space (Pi\<^sub>M {j..<n} M))"
+    if "j \<le> n" "u \<in> PiE {..<j} (\<lambda>i. space (M i))" for u j
+  proof -
+    have "(\<lambda>\<omega>. merge {..<j} {j..<n} (u, \<omega>)) ` space (Pi\<^sub>M {j..<n} M) \<subseteq> space (Pi\<^sub>M {..<n} M)"
+      using that  unfolding space_PiM
+      by (intro image_subsetI merge_space) auto
+    thus ?thesis
+      by (subst image_image[of "f",symmetric]) (intro bounded_subset[OF f_bounded] image_mono)
+  qed
+
+  have f_merge_meas_aux:
+    "(\<lambda>\<omega>. f (merge {..<j} {j..<n} (u, \<omega>))) \<in> borel_measurable (Pi\<^sub>M {j..<n} M)"
+    if "j \<le> n" "u \<in> Pi {..<j} (\<lambda>i. space (M i))" for j u
+  proof -
+
+    have 0: "{..<n} = {..<j } \<union> {j ..<n}"
+      using that(1) by auto
+
+    have 1: "merge {..<j} {j..<n} (u,\<omega>) = merge {..<j} {j..<n} (restrict u {..<j},\<omega>)" for \<omega>
+      by (intro merge_cong) auto
+
+    have "(\<lambda>\<omega>. merge {..<j} {j..<n} (u, \<omega>)) \<in> Pi\<^sub>M {j..<n} M \<rightarrow>\<^sub>M Pi\<^sub>M {..<n} M"
+      using that unfolding 0 1
+      by (intro measurable_compose[OF _ measurable_merge] measurable_Pair1')
+       (simp add:space_PiM)
+    thus ?thesis
+      by (intro measurable_compose[OF _ f_meas])
+  qed
+
+  have f_merge_meas: "(\<lambda>\<omega>. f (merge {..<j} {j..<n} (u, \<omega>))) \<in> borel_measurable (Pi\<^sub>M {j..<n} M)"
+    if "j \<le> n" "u \<in> PiE {..<j} (\<lambda>i. space (M i))" for j u
+    using that unfolding PiE_def by (intro f_merge_meas_aux) auto
+
+  have h_bounded: "bounded (h i ` space (PiM I M))"
+    if h_bounded_assms: "i \<le> n" "{..<i} \<subseteq> I" for i I
+  proof -
+    have "merge {..<i} {i..<n} x \<in> space (Pi\<^sub>M {..<n} M)"
+      if "x \<in> (\<Pi>\<^sub>E i\<in>I. space (M i)) \<times> (\<Pi>\<^sub>E i\<in>{i..<n}. space (M i))" for x
+      using that h_bounded_assms unfolding space_PiM by (intro merge_space_aux)
+        (auto simp: PiE_def mem_Times_iff)
+    hence "bounded ((\<lambda>x. f (merge {..<i} {i..<n} x)) `
+      ((\<Pi>\<^sub>E i\<in>I. space (M i)) \<times> (\<Pi>\<^sub>E i\<in>{i..<n}. space (M i))))"
+      by (subst image_image[of "f",symmetric])
+       (intro bounded_subset[OF f_bounded] image_mono image_subsetI)
+    thus ?thesis
+      using that unfolding h_def
+      by (intro prob_space.finite_measure finite_measure.bounded_int int_rules)
+        (auto simp:space_PiM PiE_def)
+  qed
+
+  have V_bounded: "bounded (V i ` space (PiM I M))"
+    if "i < n" "{..<i+1} \<subseteq> I" for i I
+    using that unfolding V_def by (intro bounded_intros h_bounded) auto
+
+  have V_upd_bounded: "bounded ((\<lambda>x. V j (\<xi>(j := x))) ` space (M j))"
+    if V_upd_bounded_assms: "\<xi> \<in> space (Pi\<^sub>M {..<j} M)" "j < n" for j \<xi>
+  proof -
+    have "\<xi>(j := v) \<in> space (Pi\<^sub>M {..<j + 1} M)" if "v \<in> space (M j)" for v
+      using V_upd_bounded_assms that unfolding space_PiM PiE_def extensional_def Pi_def by auto
+    thus ?thesis
+        using that unfolding image_image[of "V j" "(\<lambda>x. (\<xi>(j := x)))",symmetric]
+        by (intro bounded_subset[OF V_bounded[of "j" "{..<j+1}"]] that image_mono) auto
+  qed
+
+  have h_step: "h j \<omega> = \<integral>\<tau>. h (j+1) (\<omega>(j := \<tau>)) \<partial> M j" (is "?L1 = ?R1")
+    if "\<omega> \<in> space (PiM {..<j} M)" "j < n" for j \<omega>
+  proof -
+    have 0: "(\<lambda>x. f (merge {..<j} {j..<n} (\<omega>, x))) \<in> borel_measurable (Pi\<^sub>M {j..<n} M)"
+      using that unfolding space_PiM by (intro f_merge_meas) auto
+
+    have 1: "insert j {Suc j..<n} = {j..<n}"
+      using that by auto
+
+    have 2: "bounded ((\<lambda>x.(f (merge {..<j} {j..<n} (\<omega>, x)))) ` space (Pi\<^sub>M {j..<n} M))"
+      using that by (intro f_merge_bounded) (simp_all add: space_PiM)
+
+    have "?L1 = (\<integral>\<xi>. f (merge {..<j} {j..<n} (\<omega>, \<xi>)) \<partial>PiM (insert j {j+1..<n}) M)"
+      unfolding h_def using that by (intro Bochner_Integration.integral_cong refl PiM_cong) auto
+    also have "...=(\<integral>\<tau>.(\<integral>\<xi>. f (merge {..<j} {j..<n} (\<omega>, (\<xi>(j := \<tau>)))) \<partial>PiM {j+1..<n} M)\<partial>M j)"
+      using that(1,2) 0 1 2 by (intro product_integral_insert prob_space_imp_sigma_finite assms(1)
+          int_rules f_merge_meas) (simp_all)
+    also have "... = ?R1"
+      using that(2) unfolding h_def
+      by (intro Bochner_Integration.integral_cong arg_cong[where f="f"] ext) (auto simp:merge_def)
+    finally show ?thesis
+      by simp
+  qed
+
+  have V_meas: "V i \<in> borel_measurable (PiM I M)" if "i < n" "{..<i+1} \<subseteq> I" for i I
+    unfolding V_def using that by (intro borel_measurable_diff h_meas) auto
+
+  have V_upd_meas: "(\<lambda>x. V j (\<xi>(j := x))) \<in> borel_measurable (M j)"
+    if "j < n" "\<xi> \<in> space (Pi\<^sub>M {..<j} M)" for j \<xi>
+    using that by (intro measurable_compose[OF _ V_meas[where I="insert j {..<j}"]]
+          measurable_component_update) auto
+
+  have V_cong:
+    "V j \<omega> = V j \<xi>" if "restrict \<omega> {..<(j+1)} = restrict \<xi> {..<(j+1)}" for j \<omega> \<xi>
+    using that restrict_subset_eq[OF _ that] unfolding V_def
+    by (intro arg_cong2[where f="(-)"] h_cong) simp_all
+
+  have exp_V: "(\<integral>\<omega>. V j (\<xi>(j := \<omega>)) \<partial>M j) = 0" (is "?L1 = 0")
+    if "j < n" "\<xi> \<in> space (PiM {..<j} M)" for j \<xi>
+  proof -
+
+    have "fun_upd \<xi> j ` space (M j) \<subseteq> space (Pi\<^sub>M (insert j {..<j}) M)"
+      using that unfolding space_PiM by (intro image_subsetI PiE_fun_upd) auto
+    hence 0:"bounded ((\<lambda>x. h (Suc j) (\<xi>(j := x))) ` space (M j))"
+      unfolding image_image[of "h (Suc j)" "\<lambda>x. \<xi>(j := x)",symmetric] using that
+      by (intro bounded_subset[OF h_bounded[where i="j+1" and I="{..<j+1}"]] image_mono)
+        (auto simp:lessThan_Suc)
+
+    have 1:"(\<lambda>x. h (Suc j) (\<xi>(j := x))) \<in> borel_measurable (M j)"
+      using h_meas that by (intro measurable_compose[OF _ h_meas[where I="insert j {..<j}"]]
+          measurable_component_update) auto
+
+    have "?L1 =(\<integral>\<omega>. h (Suc j) (\<xi>(j := \<omega>)) - h j \<xi> \<partial>M j)"
+      unfolding V_def
+      by (intro Bochner_Integration.integral_cong arg_cong2[where f="(-)"] refl h_cong) auto
+    also have "... = (\<integral>\<omega>. h (Suc j) (\<xi>(j := \<omega>)) \<partial>M j) - (\<integral>\<omega>. h j \<xi> \<partial>M j)"
+      using that by (intro Bochner_Integration.integral_diff int_rules 0 1) auto
+    also have "... = 0"
+      using that(1) assms(1) prob_space.prob_space unfolding h_step[OF that(2,1)] by auto
+    finally show ?thesis
+      by simp
+  qed
+
+  have var_V: "\<bar>V j x - V j y\<bar> \<le> c j" (is "?L1 \<le> ?R1")
+    if var_V_assms: "j < n" "{x,y} \<subseteq> space (PiM {..<j+1} M)"
+       "restrict x {..<j} = restrict y {..<j}"  for x y j
+  proof -
+    have x_ran: "x \<in> PiE {..<j+1} (\<lambda>i. space (M i))" and y_ran: "y \<in> PiE {..<j+1} (\<lambda>i. space (M i))"
+      using that(2) by (simp_all add:space_PiM)
+
+    have 0: "j+1 \<le> n"
+      using that by simp
+
+    have "?L1 = \<bar>h (Suc j) x - h j y - (h (Suc j) y - h j y)\<bar>"
+      unfolding V_def by (intro arg_cong[where f="abs"] arg_cong2[where f="(-)"] refl h_cong that)
+    also have "... = \<bar>h (j+1) x - h (j+1) y\<bar>"
+      by simp
+    also have "... =
+      \<bar>(\<integral>\<omega>. f(merge {..<j+1} {j+1..<n} (x,\<omega>))-f(merge {..<j+1} {j+1..<n} (y,\<omega>)) \<partial>PiM {j+1..<n} M)\<bar>"
+      using that unfolding h_def by (intro arg_cong[where f="abs"] f_merge_meas[OF 0] x_ran
+          Bochner_Integration.integral_diff[symmetric] int_rules f_merge_bounded[OF 0] y_ran) auto
+    also have "... \<le>
+      (\<integral>\<omega>. \<bar>f(merge {..<j+1} {j+1..<n} (x,\<omega>))-f(merge {..<j+1} {j+1..<n} (y,\<omega>))\<bar> \<partial>PiM {j+1..<n} M)"
+      by (intro integral_abs_bound)
+    also have "... \<le> (\<integral>\<omega>. c j \<partial>PiM {j+1..<n} M)"
+    proof (intro Bochner_Integration.integral_mono' delta int_rules c_ge_0 ballI merge_space 0)
+      fix \<omega> assume "\<omega> \<in> space (Pi\<^sub>M {j + 1..<n} M)"
+      have "{..<j + 1} \<inter> ({..<n} - {j}) = {..<j}"
+        using that by auto
+      thus "restrict (merge {..<j+1} {j+1..<n} (x, \<omega>)) ({..<n}-{j}) =
+            restrict (merge {..<j+1} {j+1..<n} (y, \<omega>)) ({..<n}-{j})"
+        using that(1,3) less_antisym unfolding restrict_merge by (intro merge_cong refl) auto
+    qed (simp_all add: space_PiM that(1) x_ran[simplified] y_ran[simplified])
+    also have "... = c j"
+      by (auto intro!:prob_space.prob_space prob_space_PiM assms(1))
+    finally show ?thesis by simp
+  qed
+
+  have "f \<xi> - (\<integral>\<omega>. f \<omega> \<partial>(PiM {..<n} M)) = (\<Sum>i < n. V i \<xi>)" if "\<xi> \<in> space (PiM {..<n} M)" for \<xi>
+    using that unfolding V_def by (subst sum_lessThan_telescope) (simp add: h_0 h_n)
+  hence "?L = \<P>(\<xi> in PiM {..<n} M. (\<Sum>i < n. V i \<xi>) \<ge> \<epsilon>)"
+    by (intro arg_cong2[where f="measure"] refl Collect_restr_cong arg_cong2[where f="(\<le>)"]) auto
+  also have "... \<le> \<P>(\<xi> in PiM {..<n} M. exp( t * (\<Sum>i < n. V i \<xi>) ) \<ge> exp (t * \<epsilon>))"
+  proof (intro finite_measure.finite_measure_mono subsetI prob_space.finite_measure int_rules)
+    show "{\<xi> \<in> space (Pi\<^sub>M {..<n} M). exp (t * \<epsilon>) \<le> exp (t * (\<Sum>i<n. V i \<xi>))} \<in> sets (Pi\<^sub>M {..<n} M)"
+      using V_meas by measurable
+  qed  (auto intro!:mult_left_mono[OF _ t_ge_0])
+  also have "... \<le> (\<integral>\<xi>. exp(t*(\<Sum>i < n. V i \<xi>)) \<partial>PiM {..<n} M)/ exp (t*\<epsilon>)"
+    by (intro integral_Markov_inequality_measure[where A="{}"] int_rules V_bounded V_meas) auto
+  also have "... = exp(t^2 * (\<Sum>i\<in>{n..<n}. c i^2)/8-t*\<epsilon>)*(\<integral>\<xi>. exp(t*(\<Sum>i < n. V i \<xi>)) \<partial>PiM {..<n} M)"
+    by (simp add:exp_minus inverse_eq_divide)
+  also have "... \<le> exp(t^2 * (\<Sum>i\<in>{0..<n}. c i^2)/8-t*\<epsilon>)*(\<integral>\<xi>. exp(t*(\<Sum>i < 0. V i \<xi>)) \<partial>PiM {..<0} M)"
+  proof (rule ineq_chain)
+    fix j assume a:"j < n"
+    let ?L1 = "exp (t\<^sup>2*(\<Sum>i=j+1..<n. (c i)\<^sup>2)/8-t*\<epsilon>)"
+    let ?L2 = "?L1 * (\<integral>\<xi>. exp (t * (\<Sum>i<j+1. V i \<xi>)) \<partial>PiM {..<j+1} M)"
+
+    note V_upd_meas = V_upd_meas[OF a]
+
+    have "?L2 = ?L1 * (\<integral>\<xi>. exp (t * (\<Sum>i<j. V i \<xi>)) * exp(t * V j \<xi>) \<partial>PiM (insert j {..<j}) M)"
+      by (simp add:algebra_simps exp_add lessThan_Suc)
+    also have "... = ?L1 *
+      (\<integral>\<xi>. (\<integral>\<omega>. exp (t * (\<Sum>i<j. V i (\<xi>(j := \<omega>)))) * exp(t * V j (\<xi>(j := \<omega>))) \<partial>M j) \<partial>PiM {..<j} M)"
+      using a by (intro product_integral_insert_rev arg_cong2[where f="(*)"] int_rules
+          prob_space_imp_sigma_finite V_bounded V_meas) auto
+    also have "... =?L1*(\<integral>\<xi>.(\<integral>\<omega>. exp (t*(\<Sum>i<j. V i \<xi>))*exp(t*V j (\<xi>(j := \<omega>))) \<partial>M j) \<partial>PiM {..<j} M)"
+      by (intro arg_cong2[where f="(*)"] Bochner_Integration.integral_cong
+          arg_cong[where f="exp"] sum.cong V_cong restrict_fupd) auto
+    also have "... =?L1*(\<integral>\<xi>. exp (t*(\<Sum>i<j. V i \<xi>))*(\<integral>\<omega>. exp(t*V j (\<xi>(j := \<omega>))) \<partial>M j) \<partial>PiM {..<j} M)"
+      using a by (intro arg_cong2[where f="(*)"] Bochner_Integration.integral_cong refl
+          Bochner_Integration.integral_mult_right V_upd_meas V_upd_bounded int_rules) auto
+    also have "... \<le> ?L1 * \<integral>\<xi>. exp (t*(\<Sum>i<j. V i \<xi>))* exp (t^2 * c j^2/8) \<partial>PiM {..<j} M"
+    proof (intro mult_left_mono integral_mono')
+      fix \<xi> assume c:"\<xi> \<in> space (Pi\<^sub>M {..<j} M)"
+      hence b:"\<xi> \<in> PiE {..<j} (\<lambda>i. space (M i))"
+        unfolding space_PiM by simp
+      moreover have "\<xi>(j := v) \<in> PiE {..<j+1} (\<lambda>i. space (M i))" if "v \<in> space (M j)" for v
+        using b that unfolding PiE_def extensional_def Pi_def by auto
+      ultimately show "LINT \<omega>|M j. exp (t * V j (\<xi>(j := \<omega>))) \<le> exp (t\<^sup>2 * (c j)\<^sup>2 / 8)"
+        using V_upd_meas[OF c]
+        by (intro prob_space.Hoeffdings_lemma_bochner_3 exp_V var_V a int_rules)
+          (auto simp: space_PiM)
+    next
+      show "integrable (Pi\<^sub>M {..<j} M) (\<lambda>x. exp (t * (\<Sum>i<j. V i x)) * exp (t\<^sup>2 * (c j)\<^sup>2 / 8))"
+        using a by (intro int_rules V_bounded V_meas) auto
+    qed auto
+    also have "... = ?L1 * ((\<integral>\<xi>. exp (t*(\<Sum>i<j. V i \<xi>)) \<partial>PiM {..<j} M) * exp (t^2 * c j^2/8))"
+    proof (subst Bochner_Integration.integral_mult_left)
+      show "integrable (Pi\<^sub>M {..<j} M) (\<lambda>\<xi>. exp (t * (\<Sum>i<j. V i \<xi>)))"
+        using a by (intro int_rules V_bounded V_meas) auto
+    qed auto
+    also have "... =
+      exp (t\<^sup>2*(\<Sum>i\<in>insert j {j+1..<n}. (c i)\<^sup>2)/8-t*\<epsilon>) * (\<integral>\<xi>. exp (t * (\<Sum>i<j. V i \<xi>))\<partial>PiM {..<j} M)"
+      by (simp_all add:exp_add[symmetric] field_simps)
+    also have "...=exp (t\<^sup>2*(\<Sum>i=j..<n. (c i)\<^sup>2)/8-t*\<epsilon>) * (\<integral>\<xi>. exp (t * (\<Sum>i<j. V i \<xi>))\<partial>PiM {..<j} M)"
+      using a by (intro arg_cong2[where f="(*)"] arg_cong[where f="exp"] refl arg_cong2
+          [where f="(-)"] arg_cong2[where f="(/)"] sum.cong) auto
+    finally show "?L2\<le>exp(t\<^sup>2*(\<Sum>i=j..<n. (c i)\<^sup>2)/8-t*\<epsilon>)*(\<integral>\<xi>. exp (t*(\<Sum>i<j. V i \<xi>))\<partial>PiM {..<j} M)"
+      by simp
+  qed
+  also have "... = exp(t^2 * (\<Sum>i<n. c i^2)/8-t*\<epsilon>)" by (simp add:PiM_empty atLeast0LessThan)
+  also have "... = exp(t * ((t * (\<Sum>i<n. c i^2)/8)-\<epsilon>))" by (simp add:algebra_simps power2_eq_square)
+  also have "... = exp(t * (-\<epsilon>/2))" using sum_c_ge_0 by (auto simp add:divide_simps t_def)
+  also have "... = ?R" unfolding t_def by (simp add:field_simps power2_eq_square)
+  finally show ?thesis by simp
+qed
+
+theorem mc_diarmid_inequality_distr: (* McDiarmid's inequality stated on a product measure PiM I M over a finite index set I of arbitrary type *)
+  fixes f :: "('i \<Rightarrow> 'a) \<Rightarrow> real"
+  assumes "finite I"
+  assumes "\<And>i. i \<in> I \<Longrightarrow> prob_space (M i)"
+  assumes "\<And>i x y. i \<in> I \<Longrightarrow> {x,y} \<subseteq> space (PiM I M) \<Longrightarrow> (\<forall>j\<in>I-{i}. x j=y j) \<Longrightarrow> \<bar>f x-f y\<bar>\<le>c i" (* bounded differences: altering only coordinate i changes f by at most c i *)
+  assumes f_meas: "f \<in> borel_measurable (PiM I M)" and \<epsilon>_gt_0: "\<epsilon> > 0"
+  shows "\<P>(\<omega> in PiM I M. f \<omega> - (\<integral>\<xi>. f \<xi> \<partial>PiM I M) \<ge> \<epsilon>) \<le> exp (-(2*\<epsilon>^2)/(\<Sum>i\<in>I. (c i)^2))"
+    (is "?L \<le> ?R")
+proof -
+  define n where "n = card I" (* the proof reindexes I by the naturals below n *)
+  let ?q = "from_nat_into I" (* ?q: enumeration of I; fact q below shows it is a bijection from {..<n} to I *)
+  let ?r = "to_nat_on I" (* ?r: the opposite direction; fact r below shows it is a bijection from I to {..<n} *)
+  let ?f = "(\<lambda>\<xi>. f (\<lambda>i\<in>I. \<xi> (?r i)))" (* ?f: f applied to a nat-indexed tuple after pulling it back to an I-indexed one *)
+
+  have q: "bij_betw ?q {..<n} I" unfolding n_def by (intro bij_betw_from_nat_into_finite assms(1))
+  have r: "bij_betw ?r I {..<n}" unfolding n_def by (intro to_nat_on_finite assms(1))
+
+  have [simp]: "?q (?r x) = x" if "x \<in> I" for x
+    by (intro from_nat_into_to_nat_on that countable_finite assms(1))
+
+  have [simp]: "?r (?q x) = x" if "x < n" for x
+    using bij_betw_imp_surj_on[OF r] that by (intro to_nat_on_from_nat_into) auto
+
+  have a: "\<And>i. i \<in> {..<n} \<Longrightarrow> prob_space ((M \<circ> ?q) i)" (* a: every reindexed factor is again a probability space *)
+    unfolding comp_def by (intro assms(2) bij_betw_apply[OF q])
+
+  have b:"PiM I M = PiM I (\<lambda>i. (M \<circ> ?q) (?r i))" by (intro PiM_cong) (simp_all add:comp_def)
+  also have "... = distr (PiM {..<n} (M \<circ> ?q)) (PiM I (\<lambda>i. (M \<circ> ?q) (?r i))) (\<lambda>\<omega>. \<lambda>n\<in>I. \<omega> (?r n))"
+    using r unfolding bij_betw_def by (intro distr_PiM_reindex[symmetric] a) auto
+  finally have c: "PiM I M = distr (PiM{..<n}(M\<circ>?q)) (PiM I (\<lambda>i.(M\<circ>?q)(?r i))) (\<lambda>\<omega>. \<lambda>n\<in>I. \<omega> (?r n))" (* c: PiM I M is the image of the nat-indexed product measure under the reindexing map *)
+    by simp
+
+  have d: "(\<lambda>n\<in>I. x (?r n)) \<in> space (Pi\<^sub>M I M)" if 4:"x \<in> space (Pi\<^sub>M {..<n} (M \<circ> ?q))" for x (* d: the reindexing map lands in space (PiM I M) *)
+  proof -
+    have "x (?r i) \<in> space (M i)" if "i \<in> I" for i
+    proof -
+      have "?r i \<in> {..<n}" using bij_betw_apply[OF r] that by simp
+      hence "x (?r i) \<in> space ((M \<circ> ?q) (?r i))" using that 4 PiE_mem unfolding space_PiM by blast
+      thus ?thesis using that unfolding comp_def by simp
+    qed
+    thus ?thesis unfolding space_PiM PiE_def by auto
+  qed
+
+  have "?L = \<P>(\<omega> in PiM {..<n} (M \<circ> ?q). ?f \<omega> - (\<integral>\<xi>. f \<xi> \<partial>PiM I M) \<ge> \<epsilon>)" (* transport the probability to the nat-indexed product, using c and measure_distr *)
+  proof (subst c, subst measure_distr, goal_cases)
+    case 1 thus ?case
+      by (intro measurable_restrict measurable_component_singleton bij_betw_apply[OF r])
+  next
+    case 2 thus ?case unfolding b[symmetric] by (intro measurable_sets_Collect[OF f_meas]) auto
+  next
+    case 3 thus ?case using d by (intro arg_cong2[where f="measure"] refl) (auto simp:vimage_def)
+  qed
+  also have "... = \<P>(\<omega> in PiM {..<n} (M \<circ> ?q). ?f \<omega> - (\<integral>\<xi>. ?f \<xi> \<partial>PiM {..<n} (M \<circ> ?q)) \<ge> \<epsilon>)" (* transport the expectation as well, using c and integral_distr *)
+  proof (subst c, subst integral_distr, goal_cases)
+    case (1 \<omega>) thus ?case
+      by (intro measurable_restrict measurable_component_singleton bij_betw_apply[OF r])
+  next
+    case (2 \<omega>) thus ?case unfolding b[symmetric] by (rule f_meas)
+  next
+    case 3 thus ?case by simp
+  qed
+  also have "... \<le> exp (-(2*\<epsilon>^2)/(\<Sum>i<n. (c (?q i))^2))" (* apply the auxiliary lemma mc_diarmid_inequality_aux to ?f over the index set {..<n} *)
+  proof (intro mc_diarmid_inequality_aux \<epsilon>_gt_0, goal_cases)
+    case (1 i) thus ?case by (intro a) auto
+  next
+    case (2 i x y) (* bounded differences of ?f at index i, obtained from those of f at index ?q i *)
+    have "x (?r j) = y (?r j)" if "j \<in> I - {?q i}" for j
+    proof -
+      have "?r j \<in> {..<n} - {i}" using that bij_betw_apply[OF r] by auto
+      thus ?thesis using 2 by simp
+    qed
+    hence "\<forall>j\<in>I - {?q i}. (\<lambda>i\<in>I. x (?r i)) j = (\<lambda>i\<in>I. y (?r i)) j" by auto
+    thus ?case using 2 d by (intro assms(3) bij_betw_apply[OF q]) auto
+  next
+    case 3 (* measurability of ?f on the nat-indexed product *)
+    have "(\<lambda>x. x (?r i)) \<in> Pi\<^sub>M {..<n} (M \<circ> ?q) \<rightarrow>\<^sub>M M i" if "i \<in> I" for i
+    proof -
+      have 0:"M i = (M \<circ> ?q) (?r i)" using that by (simp add: comp_def)
+      show ?thesis unfolding 0 by (intro measurable_component_singleton bij_betw_apply[OF r] that)
+    qed
+    thus ?case by (intro measurable_compose[OF _ f_meas] measurable_restrict)
+  qed
+  also have "... = ?R" by (subst sum.reindex_bij_betw[OF q]) simp (* turn the sum over {..<n} back into a sum over I via the bijection q *)
+  finally show ?thesis by simp
+qed
+
+lemma (in prob_space) mc_diarmid_inequality_classic: (* McDiarmid's inequality for a function f of independent random variables X i defined on M *)
+  fixes f :: "('i \<Rightarrow> 'a) \<Rightarrow> real"
+  assumes "finite I"
+  assumes "indep_vars N X I"
+  assumes "\<And>i x y. i \<in> I \<Longrightarrow> {x,y} \<subseteq> space (PiM I N) \<Longrightarrow> (\<forall>j\<in>I-{i}. x j=y j) \<Longrightarrow> \<bar>f x-f y\<bar>\<le>c i" (* bounded differences: altering only coordinate i changes f by at most c i *)
+  assumes f_meas: "f \<in> borel_measurable (PiM I N)" and \<epsilon>_gt_0: "\<epsilon> > 0"
+  shows "\<P>(\<omega> in M. f (\<lambda>i\<in>I. X i \<omega>) - (\<integral>\<xi>. f (\<lambda>i\<in>I. X i \<xi>) \<partial>M) \<ge> \<epsilon>) \<le> exp (-(2*\<epsilon>^2)/(\<Sum>i\<in>I. (c i)^2))"
+    (is "?L \<le> ?R")
+proof -
+  note indep_imp = iffD1[OF indep_vars_iff_distr_eq_PiM'']
+  let ?O = "\<lambda>i. distr M (N i) (X i)" (* ?O i: the distribution of X i, as a measure on N i *)
+  have a:"distr M (Pi\<^sub>M I N) (\<lambda>x. \<lambda>i\<in>I. X i x) = Pi\<^sub>M I ?O" (* a: by independence the joint distribution of the X i is the product of the marginals ?O *)
+    using assms(2) unfolding indep_vars_def by (intro indep_imp[OF _ assms(2)]) auto
+
+  have b: "space (PiM I ?O) = space (PiM I N)" (* b: both product measures have the same underlying space *)
+    by (metis (no_types, lifting) a space_distr)
+
+  have "(\<lambda>i\<in>I. X i \<omega>) \<in> space (Pi\<^sub>M I N)" if "\<omega> \<in> space M" for \<omega>
+    using assms(2) that unfolding indep_vars_def measurable_def space_PiM by auto
+
+  hence "?L = \<P>(\<omega> in M. (\<lambda>i\<in>I. X i \<omega>)\<in> space (Pi\<^sub>M I N)\<and> f (\<lambda>i\<in>I. X i \<omega>)-(\<integral>\<xi>. f (\<lambda>i\<in>I. X i \<xi>) \<partial>M)\<ge>\<epsilon>)" (* add the membership condition just shown, so the event has the shape of a preimage under the tuple map *)
+    by (intro arg_cong2[where f="measure"] Collect_restr_cong refl) auto
+  also have "... = \<P>(\<omega> in distr M (Pi\<^sub>M I N) (\<lambda>x. \<lambda>i\<in>I. X i x). f \<omega> - (\<integral>\<xi>. f (\<lambda>i\<in>I. X i \<xi>) \<partial>M) \<ge> \<epsilon>)" (* rewrite as a probability under the push-forward measure, via measure_distr *)
+  proof (subst measure_distr, goal_cases)
+    case 1 thus ?case using assms(2) unfolding indep_vars_def by (intro measurable_restrict) auto
+  next
+    case 2 thus ?case unfolding space_distr by (intro measurable_sets_Collect[OF f_meas]) auto
+  next
+    case 3 thus ?case by (simp_all add:Int_def conj_commute)
+  qed
+  also have "... = \<P>(\<omega> in PiM I ?O. f \<omega> - (\<integral>\<xi>. f (\<lambda>i\<in>I. X i \<xi>) \<partial>M) \<ge> \<epsilon>)"
+    unfolding a by simp
+  also have "... = \<P>(\<omega> in PiM I ?O. f \<omega> - (\<integral>\<xi>. f \<xi> \<partial> distr M (Pi\<^sub>M I N) (\<lambda>x. \<lambda>i\<in>I. X i x)) \<ge> \<epsilon>)" (* rewrite the expectation as an integral against the push-forward measure, via integral_distr *)
+  proof (subst integral_distr[OF _ f_meas], goal_cases)
+    case (1 \<omega>) thus ?case using assms(2) unfolding indep_vars_def by (intro measurable_restrict)auto
+  next
+    case 2 thus ?case by simp
+  qed
+  also have "... = \<P>(\<omega> in PiM I ?O. f \<omega> - (\<integral>\<xi>. f \<xi> \<partial> Pi\<^sub>M I ?O) \<ge> \<epsilon>)" unfolding a by simp
+  also have "... \<le> ?R" (* conclude with the product-measure version mc_diarmid_inequality_distr *)
+    using f_meas assms(2) b unfolding indep_vars_def
+    by (intro mc_diarmid_inequality_distr prob_space_distr assms(1) \<epsilon>_gt_0 assms(3)) auto
+  finally show ?thesis by simp
+qed
+
+end
\ No newline at end of file
diff --git a/thys/Concentration_Inequalities/Paley_Zygmund_Inequality.thy b/thys/Concentration_Inequalities/Paley_Zygmund_Inequality.thy
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/Paley_Zygmund_Inequality.thy
@@ -0,0 +1,204 @@
+section \<open>Paley-Zygmund Inequality\<close>
+
+text \<open>This section proves slight improvements of the Paley-Zygmund Inequality~\cite{paley1932note}.
+Unfortunately, the improved versions are only stated on Wikipedia, without a citation.\<close>
+
+theory Paley_Zygmund_Inequality
+  imports Lp.Lp
+begin
+
+context prob_space
+begin
+
+theorem paley_zygmund_inequality_holder: (* Paley-Zygmund-type bound using a p-th absolute moment, proved via Hoelder's inequality *)
+  assumes p: "1 < (p::real)"
+  assumes rv: "random_variable borel Z"
+  assumes intZp: "integrable M (\<lambda>z. \<bar>Z z\<bar> powr p)"
+  assumes t: "\<theta> \<le> 1"
+  assumes ZAEpos: "AE z in M. Z z \<ge> 0"
+  shows "
+    (expectation (\<lambda>x. \<bar>Z x - \<theta> * expectation Z\<bar> powr p) powr (1 / (p-1))) *
+    prob {z \<in> space M. Z z > \<theta> * expectation Z}
+      \<ge> ((1-\<theta>) powr (p / (p-1)) * expectation Z powr (p / (p-1))) "
+proof -
+  have intZ: "integrable M Z" (* integrability of Z, derived from intZp via bound_L1_Lp *)
+    apply (subst bound_L1_Lp[OF _ rv intZp])
+    using p by auto
+
+  define eZ where "eZ = expectation Z"
+  have "eZ \<ge> 0"
+    unfolding eZ_def
+    using ZAEpos intZ integral_ge_const prob_Collect_eq_1 by auto
+
+  have ezp: "expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) \<ge> 0" (* NOTE(review): ezp is not referenced by name later in this proof *)
+    by (meson Bochner_Integration.integral_nonneg powr_ge_pzero)
+
+  have "expectation (\<lambda>z. Z z - \<theta> * eZ) = expectation (\<lambda>z. Z z + (- \<theta> * eZ))"
+    by auto
+  moreover have "... = expectation Z + expectation (\<lambda>z. - \<theta> * eZ)"
+    apply (subst Bochner_Integration.integral_add)
+    using intZ by auto
+  moreover have "... = eZ + (- \<theta> * eZ)"
+    apply (subst lebesgue_integral_const)
+    using eZ_def prob_space by auto
+  ultimately have *: "expectation (\<lambda>z. Z z - \<theta> * eZ) = eZ - \<theta> * eZ" (* expectation of the shifted variable *)
+    by linarith
+
+  have ev: "{z \<in> space M. \<theta> * eZ < Z z} \<in> events" (* the set whose probability is bounded is measurable *)
+    using rv unfolding borel_measurable_iff_greater
+    by auto
+
+  define q where "q = p / (p-1)" (* q: conjugate exponent of p; fact pq below shows 1/p + 1/q = 1 *)
+
+  have sqI:"(indicat_real E x) powr q = indicat_real E (x::'a)" for E x (* an indicator is 0 or 1, so raising it to the power q leaves it unchanged *)
+    unfolding q_def
+    by (metis indicator_simps(1) indicator_simps(2) powr_0 powr_one_eq_one)
+
+  have bm1: "(\<lambda>z. (Z z - \<theta> * eZ)) \<in> borel_measurable M"
+    using borel_measurable_const borel_measurable_diff rv by blast
+  have bm2: "(\<lambda>z. indicat_real {z \<in> space M. Z z > \<theta> * eZ} z) \<in> borel_measurable M"
+    using borel_measurable_indicator ev by blast
+  have "integrable M (\<lambda>x. \<bar>Z x + (-\<theta> * eZ)\<bar> powr p)" (* p-th moment of the shifted variable is integrable, via Minkowski_inequality *)
+    apply (intro Minkowski_inequality[OF _ rv _ intZp])
+    using p by auto
+  then have int1: "integrable M (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p)"
+     by auto
+
+  have "integrable M
+   (\<lambda>x. 1 * indicat_real {z \<in> space M. \<theta> * eZ < Z z} x)"
+    apply (intro integrable_real_mult_indicator[OF ev])
+    by auto
+
+  then have int2: " integrable M
+     (\<lambda>x. \<bar>indicat_real {z \<in> space M. \<theta> * eZ < Z z} x\<bar> powr q)"
+     by (auto simp add: sqI )
+
+  have pq:"p > (0::real)" "q > 0" "1/p + 1/q = 1"
+    unfolding q_def using p by (auto simp:divide_simps)
+  from Holder_inequality[OF pq bm1 bm2 int1 int2] (* Hoelder's inequality applied to the shifted variable and the indicator of the event *)
+  have hi: "expectation (\<lambda>x. (Z x - \<theta> * eZ) * indicat_real {z \<in> space M. \<theta> * eZ < Z z} x)
+    \<le> expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / p) *
+      expectation (\<lambda>x. \<bar>indicat_real {z \<in> space M. \<theta> * eZ < Z z} x\<bar> powr q) powr (1 / q)"
+    by auto
+
+  have "eZ - \<theta> * eZ \<le>
+    expectation (\<lambda>z. (Z z - \<theta> * eZ) * indicat_real {z \<in> space M. Z z > \<theta> * eZ} z)" (* outside the event the integrand Z z - theta * eZ is nonpositive, so restricting to the event cannot decrease the integral *)
+    unfolding *[symmetric]
+    apply (intro integral_mono)
+    using intZ ev apply auto[1]
+    apply (auto intro!: integrable_real_mult_indicator simp add: intZ ev)[1]
+    unfolding indicator_def of_bool_def
+    by (auto simp add: mult_nonneg_nonpos2)
+
+  also have "... \<le>
+      expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / p) *
+      expectation (\<lambda>x. indicat_real {z \<in> space M. \<theta> * eZ < Z z} x) powr (1 / q)"
+    using hi by (auto simp add: sqI)
+
+  finally have "eZ - \<theta> * eZ \<le>
+     expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / p) *
+     expectation (\<lambda>x. indicat_real {z \<in> space M. \<theta> * eZ < Z z} x) powr (1 / q)"
+    by auto
+
+  then have "(eZ - \<theta> * eZ) powr q \<le>
+     (expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / p) *
+     expectation (\<lambda>x. indicat_real {z \<in> space M. \<theta> * eZ < Z z} x) powr (1 / q)) powr q" (* raise both sides to the power q; the left side is nonnegative because eZ >= 0 and theta <= 1 *)
+    by (smt (verit, ccfv_SIG) \<open>0 \<le> eZ\<close> mult_left_le_one_le powr_mono2 pq(2) right_diff_distrib' t zero_le_mult_iff)
+
+  also have "... =
+     (expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / p)) powr q *
+     (expectation (\<lambda>x. indicat_real {z \<in> space M. \<theta> * eZ < Z z} x) powr (1 / q)) powr q"
+    using powr_ge_pzero powr_mult by presburger
+  also have "... =
+     (expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / p)) powr q *
+     (expectation (\<lambda>x. indicat_real {z \<in> space M. \<theta> * eZ < Z z} x))" (* the exponents 1/q and q cancel on the indicator factor *)
+    by (smt (verit, ccfv_SIG) Bochner_Integration.integral_nonneg divide_le_eq_1_pos indicator_pos_le nonzero_eq_divide_eq p powr_one powr_powr q_def)
+  also have "... =
+     (expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / (p-1))) *
+     (expectation (\<lambda>x. indicat_real {z \<in> space M. \<theta> * eZ < Z z} x))" (* on the moment factor the exponents combine: (1/p) * q = 1/(p-1) *)
+   by (smt (verit, ccfv_threshold) divide_divide_eq_right divide_self_if p powr_powr q_def times_divide_eq_left)
+  also have "... =
+     (expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / (p-1))) *
+     prob {z \<in> space M. Z z > \<theta> * eZ}" (* the expectation of an indicator is the probability of the event *)
+    by (simp add: ev)
+
+  finally have 1: "(eZ - \<theta> * eZ) powr q \<le>
+     (expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) powr (1 / (p-1))) *
+     prob {z \<in> space M. Z z > \<theta> * eZ}" by linarith
+
+  have "(eZ - \<theta> * eZ) powr q = ((1 - \<theta>) * eZ) powr q" (* finally rewrite the left side into the product form used in the statement *)
+    by (simp add: mult.commute right_diff_distrib)
+  also have "... = (1 - \<theta>) powr q * eZ powr q"
+    by (simp add: \<open>0 \<le> eZ\<close> powr_mult t)
+  finally show ?thesis using 1 eZ_def q_def by force
+qed
+
+corollary paley_zygmund_inequality: (* the case p = 2 of paley_zygmund_inequality_holder, phrased with the variance of Z *)
+  assumes rv: "random_variable borel Z"
+  assumes intZsq: "integrable M (\<lambda>z. (Z z)^2)"
+  assumes t: "\<theta> \<le> 1"
+  assumes Zpos: "\<And>z. z \<in> space M \<Longrightarrow> Z z \<ge> 0"
+  shows "
+    (variance Z + (1-\<theta>)^2 * (expectation Z)^2) *
+    prob {z \<in> space M. Z z > \<theta> * expectation Z}
+      \<ge> (1-\<theta>)^2 * (expectation Z)^2"
+proof -
+  have ZAEpos: "AE z in M. Z z \<ge> 0" (* pointwise nonnegativity gives the almost-everywhere form needed by the general theorem *)
+    by (simp add: Zpos)
+
+  define p where "p = (2::real)"
+  have p1: "1 < p" using p_def by auto
+  have " integrable M (\<lambda>z. \<bar>Z z\<bar> powr p)" unfolding p_def
+    using intZsq by auto
+
+  from paley_zygmund_inequality_holder[OF p1 rv this t ZAEpos]
+  have "(1 - \<theta>) powr (p / (p - 1)) * (expectation Z powr (p / (p - 1)))
+    \<le> expectation (\<lambda>x. \<bar>Z x - \<theta> * expectation Z\<bar> powr p) powr (1 / (p - 1)) *
+       prob {z \<in> space M.  \<theta> * expectation Z < Z z}" .
+
+  then have hi: "(1 - \<theta>)^2 * (expectation Z)^2
+    \<le> expectation (\<lambda>x. (Z x - \<theta> * expectation Z)^2) *
+       prob {z \<in> space M.  \<theta> * expectation Z < Z z}" (* with p = 2 the exponents p/(p-1) and 1/(p-1) are 2 and 1, and powr 2 becomes a square *)
+    unfolding p_def by (auto simp add: Zpos t)
+
+  have intZ: "integrable M Z"
+    apply (subst square_integrable_imp_integrable[OF rv intZsq])
+    by auto
+
+  define eZ where "eZ = expectation Z"
+  have "eZ \<ge> 0"
+    unfolding eZ_def
+    using Bochner_Integration.integral_nonneg Zpos by blast
+
+  have ezp: "expectation (\<lambda>x. \<bar>Z x - \<theta> * eZ\<bar> powr p) \<ge> 0" (* NOTE(review): ezp is not referenced by name later in this proof *)
+    by (meson Bochner_Integration.integral_nonneg powr_ge_pzero)
+
+  have "expectation (\<lambda>z. Z z - \<theta> * eZ) = expectation (\<lambda>z. Z z + (- \<theta> * eZ))"
+    by auto
+  also have "... = expectation Z + expectation (\<lambda>z. - \<theta> * eZ)"
+    apply (subst Bochner_Integration.integral_add)
+    using intZ by auto
+  also have "... = eZ + (- \<theta> * eZ)"
+    apply (subst lebesgue_integral_const)
+    using eZ_def prob_space by auto
+  finally have *: "expectation (\<lambda>z. Z z - \<theta> * eZ) = eZ - \<theta> * eZ" (* expectation of the shifted variable *)
+    by linarith
+  have "variance Z =
+     variance (\<lambda>z. (Z z - \<theta> * eZ))" (* subtracting the constant theta * eZ does not change the variance *)
+    using "*" eZ_def by auto
+  also have "... =
+    expectation (\<lambda>z. (Z z - \<theta> * eZ)^2)
+    - (expectation (\<lambda>x. Z x - \<theta> * eZ))\<^sup>2" (* variance as second moment minus squared mean, via variance_eq *)
+    apply (subst variance_eq)
+    by (auto simp add: intZ power2_diff intZsq)
+  also have "... = expectation (\<lambda>z. (Z z - \<theta> * eZ)^2) - ((1-\<theta>)^2 * eZ^2)"
+    unfolding * by (auto simp:algebra_simps power2_eq_square)
+  finally have veq: "expectation (\<lambda>z. (Z z - \<theta> * eZ)^2) = (variance Z + (1-\<theta>)^2 * eZ^2)" (* veq: expresses the second moment appearing in hi through the variance *)
+    by linarith
+  thus ?thesis
+    using hi by (simp add: eZ_def)
+qed
+
+end
+
+end
\ No newline at end of file
diff --git a/thys/Concentration_Inequalities/ROOT b/thys/Concentration_Inequalities/ROOT
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/ROOT
@@ -0,0 +1,17 @@
+chapter AFP
+
+session Concentration_Inequalities = "HOL-Probability" + (* parent session: HOL-Probability *)
+  options [timeout = 1200]
+  sessions
+    Lp (* additional session; Paley_Zygmund_Inequality imports Lp.Lp *)
+  theories
+    Bennett_Inequality
+    Bienaymes_Identity
+    Cantelli_Inequality
+    Concentration_Inequalities_Preliminary
+    Efron_Stein_Inequality
+    McDiarmid_Inequality
+    Paley_Zygmund_Inequality
+  document_files (* sources of the generated document: LaTeX root and bibliography *)
+    "root.tex"
+    "root.bib"
diff --git a/thys/Concentration_Inequalities/document/root.bib b/thys/Concentration_Inequalities/document/root.bib
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/document/root.bib
@@ -0,0 +1,98 @@
+
+@inbook{mcdiarmid1989,
+  series={London Mathematical Society Lecture Note Series},
+  chapter={On the method of bounded differences},
+  DOI={10.1017/CBO9781107359949.008},
+  title={Surveys in Combinatorics, 1989: Invited Papers at the Twelfth British Combinatorial Conference},
+  publisher={Cambridge University Press},
+  author={McDiarmid, Colin},
+  year={1989},
+  pages={148 -- 188},
+}
+
+@article{efron1981,
+  author = {B. Efron and C. Stein},
+  title = {{The Jackknife Estimate of Variance}},
+  volume = {9},
+  journal = {The Annals of Statistics},
+  number = {3},
+  pages = {586 -- 596},
+  year = {1981},
+  doi = {10.1214/aos/1176345462},
+}
+
+@article{steele1986,
+  author = {J. Michael Steele},
+  title = {{An Efron-Stein Inequality for Nonsymmetric Statistics}},
+  volume = {14},
+  journal = {The Annals of Statistics},
+  number = {2},
+  pages = {753 -- 758},
+  year = {1986},
+  doi = {10.1214/aos/1176349952},
+}
+
+@inbook{loeve1977,
+  author="Lo{\`e}ve, M.",
+  chapter="Sums of Independent Random Variables",
+  title="Probability Theory I",
+  year="1977",
+  publisher="Springer New York",
+  address="New York, NY",
+  pages="235--279",
+  isbn="978-1-4684-9464-8",
+  doi="10.1007/978-1-4684-9464-8_6",
+}
+
+@article{bennett1962,
+  title={Probability inequalities for the sum of independent random variables},
+  author={Bennett, George},
+  journal={Journal of the American Statistical Association},
+  volume={57},
+  number={297},
+  pages={33--45},
+  year={1962},
+  publisher={Taylor \& Francis}
+}
+
+@inproceedings{DBLP:conf/ac/BoucheronLB03,
+  author       = {St{\'{e}}phane Boucheron and
+                  G{\'{a}}bor Lugosi and
+                  Olivier Bousquet},
+  editor       = {Olivier Bousquet and
+                  Ulrike von Luxburg and
+                  Gunnar R{\"{a}}tsch},
+  title        = {Concentration Inequalities},
+  booktitle    = {Advanced Lectures on Machine Learning, {ML} Summer Schools 2003, Canberra,
+                  Australia, February 2-14, 2003, T{\"{u}}bingen, Germany, August
+                  4-16, 2003, Revised Lectures},
+  series       = {Lecture Notes in Computer Science},
+  volume       = {3176},
+  pages        = {208--240},
+  publisher    = {Springer},
+  year         = {2003},
+  url          = {https://doi.org/10.1007/978-3-540-28650-9\_9},
+  doi          = {10.1007/978-3-540-28650-9\_9},
+  timestamp    = {Tue, 14 May 2019 10:00:49 +0200},
+  biburl       = {https://dblp.org/rec/conf/ac/BoucheronLB03.bib},
+  bibsource    = {dblp computer science bibliography, https://dblp.org}
+}
+
+@inproceedings{cantelli1929sui,
+  title={Sui confini della probabilit{\`a}},
+  author={Cantelli, Francesco Paolo},
+  booktitle={Atti del Congresso Internazionale dei Matematici: Bologna del 3 al 10 de settembre di 1928},
+  pages={47--60},
+  year={1929}
+}
+
+@inproceedings{paley1932note,
+  title={A note on analytic functions in the unit circle},
+  author={Paley, Raymond EAC and Zygmund, Antoni},
+  booktitle={Mathematical Proceedings of the Cambridge Philosophical Society},
+  volume={28},
+  number={3},
+  pages={266--272},
+  year={1932},
+  organization={Cambridge University Press}
+}
diff --git a/thys/Concentration_Inequalities/document/root.tex b/thys/Concentration_Inequalities/document/root.tex
new file mode 100644
--- /dev/null
+++ b/thys/Concentration_Inequalities/document/root.tex
@@ -0,0 +1,35 @@
+\documentclass[11pt,a4paper]{article}
+\usepackage[T1]{fontenc}
+\usepackage{isabelle,isabellesym}
+\usepackage{pdfsetup}
+\urlstyle{rm}
+\isabellestyle{it}
+\begin{document}
+
+\title{Concentration Inequalities}
+\author{Emin Karayel and Yong Kiam Tan$^*$}
+\maketitle
+\def\thefootnote{*}\footnotetext{The authors contributed equally to this work.}\def\thefootnote{\arabic{footnote}}
+
+\abstract{Concentration inequalities provide bounds on how much a random variable
+(or a sum/composition of random variables) deviates from its expectation,
+usually based on moments/independence of the variables.
+
+The most important concentration inequalities (the Markov, Chebyshev, and
+Hoelder inequalities and the Chernoff bounds) are already part of
+HOL-Probability. This entry collects more advanced results, such as
+Bennett's/Bernstein's Inequality, Bienaym\'e's Identity, Cantelli's Inequality,
+the Efron-Stein Inequality, McDiarmid's Inequality, and the Paley-Zygmund
+Inequality.}
+
+\tableofcontents
+
+% sane default for proof documents
+\parindent 0pt\parskip 0.5ex
+
+\input{session}
+
+\bibliographystyle{abbrv}
+\bibliography{root}
+
+\end{document}
diff --git a/thys/ROOTS b/thys/ROOTS
--- a/thys/ROOTS
+++ b/thys/ROOTS
@@ -1,788 +1,789 @@
 ABY3_Protocols
 ADS_Functor
 AI_Planning_Languages_Semantics
 AODV
 AOT
 AVL-Trees
 AWN
 Abortable_Linearizable_Modules
 Abs_Int_ITP2012
 Abstract-Hoare-Logics
 Abstract-Rewriting
 Abstract_Completeness
 Abstract_Soundness
 Ackermanns_not_PR
 Actuarial_Mathematics
 Adaptive_State_Counting
 Affine_Arithmetic
 Aggregation_Algebras
 Akra_Bazzi
 Algebraic_Numbers
 Algebraic_VCs
 Allen_Calculus
 Amicable_Numbers
 Amortized_Complexity
 AnselmGod
 Applicative_Lifting
 Approximation_Algorithms
 Architectural_Design_Patterns
 Aristotles_Assertoric_Syllogistic
 Arith_Prog_Rel_Primes
 ArrowImpossibilityGS
 Attack_Trees
 Auto2_HOL
 Auto2_Imperative_HOL
 AutoFocus-Stream
 Automated_Stateful_Protocol_Verification
 Automatic_Refinement
 AxiomaticCategoryTheory
 BDD
 BD_Security_Compositional
 BNF_CC
 BNF_Operations
 BTree
 Balog_Szemeredi_Gowers
 Banach_Steinhaus
 Belief_Revision
 Bell_Numbers_Spivey
 BenOr_Kozen_Reif
 Berlekamp_Zassenhaus
 Bernoulli
 Bertrands_Postulate
 Bicategory
 BinarySearchTree
 Binary_Code_Imprimitive
 Binding_Syntax_Theory
 Binomial-Heaps
 Binomial-Queues
 BirdKMP
 Birkhoff_Finite_Distributive_Lattices
 Blue_Eyes
 Bondy
 Boolean_Expression_Checkers
 Boolos_Curious_Inference
 Boolos_Curious_Inference_Automated
 Bounded_Deducibility_Security
 Buchi_Complementation
 Budan_Fourier
 Buffons_Needle
 Buildings
 BytecodeLogicJmlTypes
 C2KA_DistributedSystems
 CAVA_Automata
 CAVA_LTL_Modelchecker
 CCS
 CHERI-C_Memory_Model
 CISC-Kernel
+Concentration_Inequalities
 CRDT
 CRYSTALS-Kyber
 CSP_RefTK
 CVP_Hardness
 CYK
 CZH_Elementary_Categories
 CZH_Foundations
 CZH_Universal_Constructions
 CakeML
 CakeML_Codegen
 Call_Arity
 Card_Equiv_Relations
 Card_Multisets
 Card_Number_Partitions
 Card_Partitions
 Cardinality_Continuum
 Cartan_FP
 Case_Labeling
 Catalan_Numbers
 Category
 Category2
 Category3
 Catoids
 Cauchy
 Cayley_Hamilton
 Certification_Monads
 Ceva
 Chandy_Lamport
 Chebyshev_Polynomials
 Chord_Segments
 Circus
 Clean
 Clique_and_Monotone_Circuits
 ClockSynchInst
 Closest_Pair_Points
 CoCon
 CoSMeDis
 CoSMed
 CofGroups
 Coinductive
 Coinductive_Languages
 Collections
 Combinable_Wands
 Combinatorial_Enumeration_Algorithms
 Combinatorics_Words
 Combinatorics_Words_Graph_Lemma
 Combinatorics_Words_Lyndon
 CommCSL
 Commuting_Hermitian
 Comparison_Sort_Lower_Bound
 Compiling-Exceptions-Correctly
 Complete_Non_Orders
 Completeness
 Complex_Bounded_Operators
 Complex_Geometry
 Complx
 ComponentDependencies
 ConcurrentGC
 ConcurrentIMP
 Concurrent_Ref_Alg
 Concurrent_Revisions
 Conditional_Simplification
 Conditional_Transfer_Rule
 Consensus_Refined
 Constructive_Cryptography
 Constructive_Cryptography_CM
 Constructor_Funs
 Containers
 Cook_Levin
 CoreC++
 Core_DOM
 Core_SC_DOM
 Correctness_Algebras
 Cotangent_PFD_Formula
 Count_Complex_Roots
 Coupledsim_Contrasim
 CryptHOL
 CryptoBasedCompositionalProperties
 Crypto_Standards
 Cubic_Quartic_Equations
 DCR-ExecutionEquivalence
 DFS_Framework
 DOM_Components
 DPRM_Theorem
 DPT-SAT-Solver
 DataRefinementIBP
 Datatype_Order_Generator
 Decl_Sem_Fun_PL
 Decreasing-Diagrams
 Decreasing-Diagrams-II
 Dedekind_Real
 Deep_Learning
 Delta_System_Lemma
 Density_Compiler
 Dependent_SIFUM_Refinement
 Dependent_SIFUM_Type_Systems
 Depth-First-Search
 Derangements
 Deriving
 Descartes_Sign_Rule
 Design_Theory
 Dict_Construction
 Differential_Dynamic_Logic
 Differential_Game_Logic
 DigitsInBase
 Digit_Expansions
 Dijkstra_Shortest_Path
 Diophantine_Eqns_Lin_Hom
 Directed_Sets
 Dirichlet_L
 Dirichlet_Series
 DiscretePricing
 Discrete_Summation
 Disintegration
 DiskPaxos
 Distributed_Distinct_Elements
 Dominance_CHK
 DynamicArchitectures
 Dynamic_Tables
 E_Transcendental
 Earley_Parser
 Echelon_Form
 EdmondsKarp_Maxflow
 Edwards_Elliptic_Curves_Group
 Efficient-Mergesort
 Efficient_Weighted_Path_Order
 Elimination_Of_Repeated_Factors
 Elliptic_Curves_Group_Law
 Encodability_Process_Calculi
 Epistemic_Logic
 Equivalence_Relation_Enumeration
 Ergodic_Theory
 Error_Function
 Euler_MacLaurin
 Euler_Partition
 Euler_Polyhedron_Formula
 Eudoxus_Reals
 Eval_FO
 Example-Submission
 Executable_Randomized_Algorithms
 Expander_Graphs
 Extended_Finite_State_Machine_Inference
 Extended_Finite_State_Machines
 FFT
 FLP
 FOL-Fitting
 FOL_Axiomatic
 FOL_Harrison
 FOL_Seq_Calc1
 FOL_Seq_Calc2
 FOL_Seq_Calc3
 FO_Theory_Rewriting
 FSM_Tests
 Factor_Algebraic_Polynomial
 Factored_Transition_System_Bounding
 Falling_Factorial_Sum
 Farkas
 FeatherweightJava
 Featherweight_OCL
 Fermat3_4
 FileRefinement
 FinFun
 Finger-Trees
 Finite-Map-Extras
 Finite_Automata_HF
 Finite_Fields
 Finitely_Generated_Abelian_Groups
 First_Order_Terms
 First_Welfare_Theorem
 Fishburn_Impossibility
 Fisher_Yates
 Fishers_Inequality
 Fixed_Length_Vector
 Flow_Networks
 Floyd_Warshall
 Flyspeck-Tame
 FocusStreamsCaseStudies
 Forcing
 Formal_Puiseux_Series
 Formal_SSA
 Formula_Derivatives
 Foundation_of_geometry
 Fourier
 Free-Boolean-Algebra
 Free-Groups
 Frequency_Moments
 Fresh_Identifiers
 FunWithFunctions
 FunWithTilings
 Functional-Automata
 Functional_Ordered_Resolution_Prover
 Furstenberg_Topology
 GPU_Kernel_PL
 Gabow_SCC
 GaleStewart_Games
 Gale_Shapley
 Game_Based_Crypto
 Gauss-Jordan-Elim-Fun
 Gauss_Jordan
 Gauss_Sums
 Gaussian_Integers
 GenClock
 General-Triangle
 Generalized_Counting_Sort
 Generic_Deriving
 Generic_Join
 GewirthPGCProof
 Girth_Chromatic
 Given_Clause_Loops
 GoedelGod
 Goedel_HFSet_Semantic
 Goedel_HFSet_Semanticless
 Goedel_Incompleteness
 Goodstein_Lambda
 GraphMarkingIBP
 Graph_Saturation
 Graph_Theory
 Gray_Codes
 Green
 Groebner_Bases
 Groebner_Macaulay
 Gromov_Hyperbolicity
 Grothendieck_Schemes
 Group-Ring-Module
 HOL-CSP
 HOLCF-Prelude
 HRB-Slicing
 Hahn_Jordan_Decomposition
 Hales_Jewett
 Heard_Of
 Hello_World
 HereditarilyFinite
 Hermite
 Hermite_Lindemann
 Hidden_Markov_Models
 Higher_Order_Terms
 HoareForDivergence
 Hoare_Time
 Hood_Melville_Queue
 HotelKeyCards
 Huffman
 Hybrid_Logic
 Hybrid_Multi_Lane_Spatial_Logic
 Hybrid_Systems_VCs
 HyperCTL
 HyperHoareLogic
 Hyperdual
 Hypergraph_Basics
 Hypergraph_Colourings
 IEEE_Floating_Point
 IFC_Tracking
 IMAP-CRDT
 IMO2019
 IMP2
 IMP2_Binary_Heap
 IMP_Compiler
 IMP_Compiler_Reuse
 IO_Language_Conformance
 IP_Addresses
 Imperative_Insertion_Sort
 Implicational_Logic
 Impossible_Geometry
 Incompleteness
 Incredible_Proof_Machine
 Independence_CH
 Inductive_Confidentiality
 Inductive_Inference
 InfPathElimination
 InformationFlowSlicing
 InformationFlowSlicing_Inter
 Integration
 Interpolation_Polynomials_HOL_Algebra
 Interpreter_Optimizations
 Interval_Arithmetic_Word32
 Intro_Dest_Elim
 Involutions2Squares
 Iptables_Semantics
 Irrational_Series_Erdos_Straus
 Irrationality_J_Hancl
 Irrationals_From_THEBOOK
 IsaGeoCoq
 IsaNet
 Isabelle_C
 Isabelle_Marries_Dirac
 Isabelle_Meta_Model
 Jacobson_Basic_Algebra
 Jinja
 JinjaDCI
 JinjaThreads
 JiveDataStoreModel
 Jordan_Hoelder
 Jordan_Normal_Form
 KAD
 KAT_and_DRA
 KBPs
 KD_Tree
 Key_Agreement_Strong_Adversaries
 Khovanskii_Theorem
 Kleene_Algebra
 Kneser_Cauchy_Davenport
 Knights_Tour
 Knot_Theory
 Knuth_Bendix_Order
 Knuth_Morris_Pratt
 Koenigsberg_Friendship
 Kruskal
 Kuratowski_Closure_Complement
 LLL_Basis_Reduction
 LLL_Factorization
 LOFT
 LP_Duality
 LTL
 LTL_Master_Theorem
 LTL_Normal_Form
 LTL_to_DRA
 LTL_to_GBA
 Lam-ml-Normalization
 LambdaAuth
 LambdaMu
 Lambda_Free_EPO
 Lambda_Free_KBOs
 Lambda_Free_RPOs
 Lambert_Series
 Lambert_W
 Landau_Symbols
 Laplace_Transform
 Latin_Square
 LatticeProperties
 Launchbury
 Laws_of_Large_Numbers
 Lazy-Lists-II
 Lazy_Case
 Lehmer
 Lifting_Definition_Option
 Lifting_the_Exponent
 LightweightJava
 LinearQuantifierElim
 Linear_Inequalities
 Linear_Programming
 Linear_Recurrences
 Liouville_Numbers
 List-Index
 List-Infinite
 List_Interleaving
 List_Inversions
 List_Update
 LocalLexing
 Localization_Ring
 Locally-Nameless-Sigma
 Logging_Independent_Anonymity
 Lovasz_Local
 Lowe_Ontological_Argument
 Lower_Semicontinuous
 Lp
 Lucas_Theorem
 MDP-Algorithms
 MDP-Rewards
 MFMC_Countable
 MFODL_Monitor_Optimized
 MFOTL_Monitor
 MSO_Regex_Equivalence
 Markov_Models
 Marriage
 Mason_Stothers
 Matrices_for_ODEs
 Matrix
 Matrix_Tensor
 Matroids
 Max-Card-Matching
 Maximum_Segment_Sum
 Median_Method
 Median_Of_Medians_Selection
 Menger
 Mereology
 Mersenne_Primes
 Metalogic_ProofChecker
 MHComputation
 MiniML
 MiniSail
 Minimal_SSA
 Minkowskis_Theorem
 Minsky_Machines
 MLSS_Decision_Proc
 ML_Unification
 Modal_Logics_for_NTS
 Modular_Assembly_Kit_Security
 Modular_arithmetic_LLL_and_HNF_algorithms
 Monad_Memo_DP
 Monad_Normalisation
 MonoBoolTranAlgebra
 MonoidalCategory
 Monomorphic_Monad
 MuchAdoAboutTwo
 Multi_Party_Computation
 Multirelations
 Multirelations_Heterogeneous
 Multiset_Ordering_NPC
 Multitape_To_Singletape_TM
 Myhill-Nerode
 Name_Carrying_Type_Inference
 Nano_JSON
 Nash_Williams
 Nat-Interval-Logic
 Native_Word
 Nested_Multisets_Ordinals
 Network_Security_Policy_Verification
 Neumann_Morgenstern_Utility
 No_FTL_observers
 No_FTL_observers_Gen_Rel
 Nominal2
 Nominal_Myhill_Nerode
 Noninterference_CSP
 Noninterference_Concurrent_Composition
 Noninterference_Generic_Unwinding
 Noninterference_Inductive_Unwinding
 Noninterference_Ipurge_Unwinding
 Noninterference_Sequential_Composition
 NormByEval
 Nullstellensatz
 Number_Theoretic_Transform
 Octonions
 OpSets
 Open_Induction
 Optics
 Optimal_BST
 Orbit_Stabiliser
 Order_Lattice_Props
 Ordered_Resolution_Prover
 Ordinal
 Ordinal_Partitions
 Ordinals_and_Cardinals
 Ordinary_Differential_Equations
 PAC_Checker
 PAL
 PAPP_Impossibility
 PCF
 PLM
 POPLmark-deBruijn
 PSemigroupsConvolution
 Package_logic
 Padic_Field
 Padic_Ints
 Pairing_Heap
 Paraconsistency
 Parity_Game
 Partial_Function_MR
 Partial_Order_Reduction
 Password_Authentication_Protocol
 Pell
 Perfect_Fields
 Perfect-Number-Thm
 Perron_Frobenius
 Physical_Quantities
 Pi_Calculus
 Pi_Transcendental
 Planarity_Certificates
 Pluennecke_Ruzsa_Inequality
 Poincare_Bendixson
 Poincare_Disc
 Polygonal_Number_Theorem
 Polylog
 Polynomial_Crit_Geometry
 Polynomial_Factorization
 Polynomial_Interpolation
 Polynomials
 Pop_Refinement
 Posix-Lexing
 Possibilistic_Noninterference
 Power_Sum_Polynomials
 Pratt_Certificate
 Prefix_Free_Code_Combinators
 Presburger-Automata
 Prim_Dijkstra_Simple
 Prime_Distribution_Elementary
 Prime_Harmonic_Series
 Prime_Number_Theorem
 Priority_Queue_Braun
 Priority_Search_Trees
 Probabilistic_Noninterference
 Probabilistic_Prime_Tests
 Probabilistic_System_Zoo
 Probabilistic_Timed_Automata
 Probabilistic_While
 Probability_Inequality_Completeness
 Program-Conflict-Analysis
 Progress_Tracking
 Projective_Geometry
 Projective_Measurements
 Promela
 Proof_Strategy_Language
 PropResPI
 Propositional_Logic_Class
 Propositional_Proof_Systems
 Prpu_Maxflow
 PseudoHoops
 Psi_Calculi
 Ptolemys_Theorem
 Public_Announcement_Logic
 Q0_Metatheory
 Q0_Soundness
 QHLProver
 QR_Decomposition
 Quantales
 Quantales_Converse
 Quantifier_Elimination_Hybrid
 Quasi_Borel_Spaces
 Quaternions
 Query_Optimization
 Quick_Sort_Cost
 RIPEMD-160-SPARK
 ROBDD
 RSAPSS
 Ramsey-Infinite
 Random_BSTs
 Random_Graph_Subgraph_Threshold
 Randomised_BSTs
 Randomised_Social_Choice
 Rank_Nullity_Theorem
 Real_Impl
 Real_Power
 Real_Time_Deque
 Recursion-Addition
 Recursion-Theory-I
 Refine_Imperative_HOL
 Refine_Monadic
 RefinementReactive
 Regex_Equivalence
 Registers
 Regression_Test_Selection
 Regular-Sets
 Regular_Algebras
 Regular_Tree_Relations
 Relation_Algebra
 Relational-Incorrectness-Logic
 Relational_Cardinality
 Relational_Disjoint_Set_Forests
 Relational_Forests
 Relational_Method
 Relational_Minimum_Spanning_Trees
 Relational_Paths
 Rensets
 Rep_Fin_Groups
 ResiduatedTransitionSystem
 Residuated_Lattices
 Resolution_FOL
 Rewrite_Properties_Reduction
 Rewriting_Z
 Ribbon_Proofs
 Risk_Free_Lending
 Robbins-Conjecture
 Robinson_Arithmetic
 Root_Balanced_Tree
 Roth_Arithmetic_Progressions
 Routing
 Roy_Floyd_Warshall
 SATSolverVerification
 SCC_Bloemen_Sequential
 SC_DOM_Components
 SDS_Impossibility
 SIFPL
 SIFUM_Type_Systems
 SPARCv8
 S_Finite_Measure_Monad
 Safe_Distance
 Safe_OCL
 Safe_Range_RC
 Saturation_Framework
 Saturation_Framework_Extensions
 Sauer_Shelah_Lemma
 Schutz_Spacetime
 Schwartz_Zippel
 Secondary_Sylow
 Security_Protocol_Refinement
 Selection_Heap_Sort
 SenSocialChoice
 Separata
 Separation_Algebra
 Separation_Logic_Imperative_HOL
 Separation_Logic_Unbounded
 SequentInvertibility
 Shadow_DOM
 Shadow_SC_DOM
 Shivers-CFA
 ShortestPath
 Show
 Sigma_Commit_Crypto
 Signature_Groebner
 Simpl
 Simple_Clause_Learning
 Simple_Firewall
 Simplex
 Simplicial_complexes_and_boolean_functions
 SimplifiedOntologicalArgument
 Skew_Heap
 Skip_Lists
 Slicing
 Sliding_Window_Algorithm
 Smith_Normal_Form
 Smooth_Manifolds
 Solidity
 Sophomores_Dream
 Sort_Encodings
 Source_Coding_Theorem
 SpecCheck
 Special_Function_Bounds
 Splay_Tree
 Sqrt_Babylonian
 Stable_Matching
 Stalnaker_Logic
 Standard_Borel_Spaces
 Statecharts
 Stateful_Protocol_Composition_and_Typing
 Stellar_Quorums
 Stern_Brocot
 Stewart_Apollonius
 Stirling_Formula
 Stochastic_Matrices
 Stone_Algebras
 Stone_Kleene_Relation_Algebras
 Stone_Relation_Algebras
 Store_Buffer_Reduction
 Stream-Fusion
 Stream_Fusion_Code
 StrictOmegaCategories
 Strong_Security
 Sturm_Sequences
 Sturm_Tarski
 Stuttering_Equivalence
 Subresultants
 Subset_Boolean_Algebras
 SumSquares
 Sunflowers
 SuperCalc
 Suppes_Theorem
 Surprise_Paradox
 Symmetric_Polynomials
 Syntax_Independent_Logic
 Synthetic_Completeness
 Szemeredi_Regularity
 Szpilrajn
 TESL_Language
 TLA
 Tail_Recursive_Functions
 Tarskis_Geometry
 Taylor_Models
 Three_Circles
 Three_Squares
 Timed_Automata
 Topological_Semantics
 Topology
 TortoiseHare
 TsirelsonBound
 Transcendence_Series_Hancl_Rucki
 Transformer_Semantics
 Transition_Systems_and_Automata
 Transitive-Closure
 Transitive-Closure-II
 Transitive_Models
 Transport
 Treaps
 Tree-Automata
 Tree_Decomposition
 Tree_Enumeration
 Triangle
 Trie
 Turans_Graph_Theorem
 Twelvefold_Way
 Two_Generated_Word_Monoids_Intersection
 Tycon
 Types_Tableaus_and_Goedels_God
 Types_To_Sets_Extension
 UPF
 UPF_Firewall
 UTP
 Undirected_Graph_Theory
 Universal_Hash_Families
 Universal_Turing_Machine
 UpDown_Scheme
 VYDRA_MDL
 Valuation
 Van_Emde_Boas_Trees
 Van_der_Waerden
 VectorSpace
 VeriComp
 Verified-Prover
 Verified_SAT_Based_AI_Planning
 VerifyThis2018
 VerifyThis2019
 Vickrey_Clarke_Groves
 Virtual_Substitution
 VolpanoSmith
 WHATandWHERE_Security
 WOOT_Strong_Eventual_Consistency
 WebAssembly
 Weight_Balanced_Trees
 Weighted_Arithmetic_Geometric_Mean
 Weighted_Path_Order
 Well_Quasi_Orders
 Wetzels_Problem
 Winding_Number_Eval
 Word_Lib
 WorkerWrapper
 X86_Semantics
 XML
 Youngs_Inequality
 ZFC_in_HOL
 Zeckendorf
 Zeta_3_Irrational
 Zeta_Function
 pGCL
 Labeled_Transition_Systems
 Pushdown_Systems