Theory McDiarmid_Inequality

section ‹McDiarmid's inequality›

text ‹In this section we verify McDiarmid's inequality \cite[Lemma 1.2]{mcdiarmid1989}. In the
source and also further sources sometimes refer to the result as the ``independent bounded
differences'' inequality.›

theory McDiarmid_Inequality
  imports Concentration_Inequalities_Preliminary
begin

lemma Collect_restr_cong:
  assumes "A = B"
  assumes "⋀x. x ∈ A ⟹ P x = Q x"
  shows "{x ∈ A. P x} = {x ∈ B. Q x}"
  using assms by auto

lemma ineq_chain:
  fixes h :: "nat ⇒ real"
  assumes "⋀i. i < n ⟹ h (i+1) ≤ h i"
  shows "h n ≤ h 0"
  using assms by (induction n) force+

lemma restrict_subset_eq:
  assumes "A ⊆ B"
  assumes "restrict f B = restrict g B"
  shows "restrict f A = restrict g A"
  using assms unfolding restrict_def by (meson subsetD)

text ‹Bochner Integral version of Hoeffding's Lemma using
  @{thm [source] interval_bounded_random_variable.Hoeffdings_lemma_nn_integral_0}›

lemma (in prob_space) Hoeffdings_lemma_bochner:
  assumes "l > 0" and E0: "expectation f = 0"
  assumes "random_variable borel f"
  assumes "AE x in M. f x ∈ {a..b::real}"
  shows   "expectation (λx. exp (l * f x)) ≤ exp (l⇧² * (b - a)⇧² / 8)" (is "?L ≤ ?R")
proof -
  interpret interval_bounded_random_variable M f a b
    using assms by (unfold_locales) auto

  have "integrable M (λx. exp (l * f x))"
    using assms(1,3,4) by (intro integrable_const_bound[where B="exp (l * b)"]) simp_all

  hence "ennreal (?L) = (∫⇧⁺ x. exp (l * f x) ∂M)"
    by (intro nn_integral_eq_integral[symmetric]) auto
  also have "... ≤ ennreal (?R)"
    by (intro Hoeffdings_lemma_nn_integral_0 assms)
  finally have 0:"ennreal (?L) ≤ ennreal ?R"
    by simp
  show ?thesis
  proof (cases "?L ≥ 0")
    case True
    thus ?thesis using 0 by simp
  next
    case False
    hence "?L ≤ 0" by simp
    also have "... ≤ ?R" by simp
    finally show ?thesis by simp
  qed
qed

lemma (in prob_space) Hoeffdings_lemma_bochner_2:
  assumes "l > 0" and E0: "expectation f = 0"
  assumes "random_variable borel f"
  assumes "⋀x y. {x,y} ⊆ space M ⟹ ¦f x - f y¦ ≤ (c::real)"
  shows   "expectation (λx. exp (l * f x)) ≤ exp (l^2 * c^2 / 8)" (is "?L ≤ ?R")
proof -
  define a :: real where "a = (INF x ∈ space M. f x)"
  define b :: real where "b = a+c"

  obtain ω where ω:"ω ∈ space M" using not_empty by auto
  hence 0:"f ` space M ≠ {}" by auto
  have 1: "c = b - a" unfolding b_def by simp

  have "bdd_below (f ` space M)"
    using ω assms(4) unfolding abs_le_iff
    by (intro bdd_belowI[where m="f ω - c"]) (auto simp add:algebra_simps)
  hence "f x ≥ a" if "x ∈ space M" for x unfolding a_def by (intro cINF_lower that)
  moreover have "f x ≤ b" if x_space: "x ∈ space M" for x
  proof (rule ccontr)
    assume "¬(f x ≤ b)"
    hence a:"f x > a + c" unfolding b_def by simp
    have "f y ≥ f x - c" if "y ∈ space M" for y
      using that x_space assms(4) unfolding abs_le_iff by (simp add:algebra_simps)
    hence "f x - c ≤ a" unfolding a_def using cInf_greatest[OF 0] by auto
    thus "False" using a by simp
  qed
  ultimately have "f x ∈ {a..b}" if "x ∈ space M" for x using that by auto
  hence "AE x in M. f x ∈ {a..b}" by simp
  thus ?thesis unfolding 1 by (intro Hoeffdings_lemma_bochner assms(1,2,3))
qed

lemma (in prob_space) Hoeffdings_lemma_bochner_3:
  assumes "expectation f = 0"
  assumes "random_variable borel f"
  assumes "⋀x y. {x,y} ⊆ space M ⟹ ¦f x - f y¦ ≤ (c::real)"
  shows   "expectation (λx. exp (l * f x)) ≤ exp (l^2 * c^2 / 8)" (is "?L ≤ ?R")
proof -
  consider (a) "l > 0" | (b) "l = 0" | (c) "l < 0"
    by argo
  then show ?thesis
  proof (cases)
    case a thus ?thesis by (intro Hoeffdings_lemma_bochner_2 assms) auto
  next
    case b thus ?thesis by simp
  next
    case c
    have "?L = expectation (λx. exp ((-l) * (-f x)))" by simp
    also have "... ≤ exp ((-l)^2 * c⇧²/8)" using c assms by (intro Hoeffdings_lemma_bochner_2) auto
    also have "... = ?R" by simp
    finally show ?thesis by simp
  qed
qed

text ‹Version of @{thm [source] product_sigma_finite.product_integral_singleton} without the
condition that @{term "M i"} has to be sigma finite for all @{term "i"}:›

lemma product_integral_singleton:
  fixes f :: "_ ⇒ _::{banach, second_countable_topology}"
  assumes "sigma_finite_measure (M i)"
  assumes "f ∈ borel_measurable (M i)"
  shows "(∫x. f (x i) ∂(PiM {i} M)) = (∫x. f x ∂(M i))" (is "?L = ?R")
proof -
  define M' where "M' j = (if j=i then M i else count_space {undefined})" for j

  interpret product_sigma_finite "M'"
    using assms(1) unfolding product_sigma_finite_def M'_def
    by (auto intro!:sigma_finite_measure_count_space_finite)

  have "?L = ∫x. f (x i) ∂(PiM {i} M')"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  also have "... = (∫x. f x ∂(M' i))"
    using assms(2) by (intro product_integral_singleton) (simp add:M'_def)
  also have "... = ?R"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  finally show ?thesis by simp
qed

text ‹Version of @{thm [source] product_sigma_finite.product_integral_fold} without the
condition that @{term "M i"} has to be sigma finite for all @{term "i"}:›

lemma product_integral_fold:
  fixes f :: "_ ⇒ _::{banach, second_countable_topology}"
  assumes "⋀i. i ∈ I ∪ J ⟹ sigma_finite_measure (M i)"
  assumes "I ∩ J = {}"
  assumes "finite I"
  assumes "finite J"
  assumes "integrable (PiM (I ∪ J) M) f"
  shows "(∫x. f x ∂PiM (I ∪ J) M) = (∫x. (∫y. f (merge I J(x,y)) ∂PiM J M) ∂PiM I M)" (is "?L = ?R")
    and "integrable (PiM I M) (λx. (∫y. f (merge I J(x,y)) ∂PiM J M))" (is "?I")
    and "AE x in PiM I M. integrable (PiM J M) (λy. f (merge I J(x,y)))" (is "?T")
proof -
  define M' where "M' i = (if i ∈ I ∪ J then M i else count_space {undefined})" for i

  interpret product_sigma_finite "M'"
    using assms(1) unfolding product_sigma_finite_def M'_def
    by (auto intro!:sigma_finite_measure_count_space_finite)

  interpret pair_sigma_finite "Pi⇩_M I M'" "Pi⇩_M J M'"
    using assms(3,4) sigma_finite unfolding pair_sigma_finite_def by blast

  have 0: "integrable (Pi⇩_M (I ∪ J) M') f = integrable (Pi⇩_M (I ∪ J) M) f"
    by (intro Bochner_Integration.integrable_cong PiM_cong) (simp_all add:M'_def)

  have "?L = (∫x. f x ∂PiM (I ∪ J) M')"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  also have "... = (∫x. (∫y. f (merge I J (x,y)) ∂PiM J M') ∂PiM I M')"
    using assms(5) by (intro product_integral_fold assms(2,3,4)) (simp add:0)
  also have "... = ?R"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  finally show "?L = ?R" by simp

  have "integrable (Pi⇩_M (I ∪ J) M') f = integrable (PiM I M' ⨂⇩_M PiM J M') (λx. f (merge I J x))"
    using assms(5) apply (subst distr_merge[OF assms(2,3,4),symmetric])
    by (intro integrable_distr_eq) (simp_all add:0[symmetric])
  hence 1:"integrable (PiM I M' ⨂⇩_M PiM J M') (λx. f (merge I J x))"
    using assms(5) 0 by simp

  hence "integrable (PiM I M') (λx. (∫y. f (merge I J(x,y)) ∂PiM J M'))" (is "?I'")
    by (intro integrable_fst') auto
  moreover have "?I' = ?I"
    by (intro Bochner_Integration.integrable_cong PiM_cong ext Bochner_Integration.integral_cong)
     (simp_all add:M'_def)
  ultimately show "?I"
    by simp

  have "AE x in Pi⇩_M I M'. integrable (Pi⇩_M J M') (λy. f (merge I J (x, y)))" (is "?T'")
    by (intro AE_integrable_fst'[OF 1])
  moreover have "?T' = ?T"
    by (intro arg_cong2[where f="almost_everywhere"] PiM_cong ext Bochner_Integration.integrable_cong)
     (simp_all add:M'_def)
  ultimately show  "?T"
    by simp
qed

lemma product_integral_insert:
  fixes f :: "_ ⇒ _::{banach, second_countable_topology}"
  assumes "⋀k. k ∈ {i} ∪ J ⟹ sigma_finite_measure (M k)"
  assumes "i ∉ J"
  assumes "finite J"
  assumes "integrable (PiM (insert i J) M) f"
  shows "(∫x. f x ∂PiM (insert i J) M) = (∫x. (∫y. f (y(i := x)) ∂PiM J M) ∂M i)" (is "?L = ?R")
proof -
  note meas_cong = iffD1[OF measurable_cong]

  have "integrable (PiM {i} M) (λx. (∫y. f (merge {i} J (x,y)) ∂PiM J M))"
    using assms by (intro product_integral_fold) auto
  hence 0:"(λx. (∫y. f (merge {i} J (x,y)) ∂PiM J M)) ∈ borel_measurable (PiM {i} M)"
    using borel_measurable_integrable by simp
  have 1:"(λx. (∫y. f (y(i := (x i))) ∂PiM J M)) ∈ borel_measurable (PiM {i} M)"
    by (intro meas_cong[OF _ 0] Bochner_Integration.integral_cong arg_cong[where f="f"])
     (auto simp add:space_PiM merge_def fun_upd_def PiE_def extensional_def)
  have "(λx. (∫y. f (y(i := (λi∈{i}. x) i)) ∂PiM J M)) ∈ borel_measurable (M i)"
    by (intro measurable_compose[OF _ 1, where f="(λx. (λi∈{i}. x))"] measurable_restrict) auto
  hence 2:"(λx. (∫y. f (y(i := x )) ∂PiM J M)) ∈ borel_measurable (M i)" by simp

  have "?L = (∫x. f x ∂PiM ({i} ∪ J) M)" by simp
  also have "... = (∫x. (∫y. f (merge {i} J (x,y)) ∂PiM J M) ∂PiM {i} M)"
    using assms(2,4) by (intro product_integral_fold assms(1,3)) auto
  also have "... = (∫x. (∫y. f (y(i := (x i))) ∂PiM J M) ∂PiM {i} M)"
    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"])
     (auto simp add:space_PiM merge_def fun_upd_def PiE_def extensional_def)
  also have "... = ?R"
    using assms(1,4) by (intro product_integral_singleton assms(1) 2) auto
  finally show ?thesis by simp
qed

lemma product_integral_insert_rev:
  fixes f :: "_ ⇒ _::{banach, second_countable_topology}"
  assumes "⋀k. k ∈ {i} ∪ J ⟹ sigma_finite_measure (M k)"
  assumes "i ∉ J"
  assumes "finite J"
  assumes "integrable (PiM (insert i J) M) f"
  shows "(∫x. f x ∂PiM (insert i J) M) = (∫y. (∫x. f (y(i := x)) ∂M i) ∂PiM J M)" (is "?L = ?R")
proof -
  have "?L = (∫x. f x ∂PiM (J ∪ {i}) M)" by simp
  also have "... = (∫x. (∫y. f (merge J {i} (x,y)) ∂PiM {i} M) ∂PiM J M)"
    using assms(2,4) by (intro product_integral_fold assms(1,3)) auto
  also have "... = (∫x. (∫y. f (x(i := (y i))) ∂PiM {i} M) ∂PiM J M)"
    unfolding merge_singleton[OF assms(2)]
    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"])
     (metis PiE_restrict assms(2) restrict_upd space_PiM)
  also have "... = ?R"
    using assms(1,4) by (intro Bochner_Integration.integral_cong product_integral_singleton) auto
  finally show ?thesis by simp
qed

lemma merge_empty[simp]:
  "merge {} I (y,x) = restrict x I"
  "merge I {} (y,x) = restrict y I"
  unfolding merge_def restrict_def by auto

lemma merge_cong:
  assumes "restrict x1 I = restrict x2 I"
  assumes "restrict y1 J = restrict y2 J"
  shows "merge I J (x1,y1) = merge I J (x2,y2)"
  using assms unfolding merge_def restrict_def
  by (intro ext) (smt (verit, best) case_prod_conv)

lemma restrict_merge:
  "restrict (merge I J x) K = merge (I ∩ K) (J ∩ K) x"
  unfolding restrict_def merge_def by (intro ext) (auto simp:case_prod_beta)

lemma map_prod_measurable:
  assumes "f ∈ M →⇩_M M'"
  assumes "g ∈ N →⇩_M N'"
  shows "map_prod f g ∈ M ⨂⇩_M N →⇩_M M' ⨂⇩_M N'"
  using assms by (subst measurable_pair_iff) simp

lemma mc_diarmid_inequality_aux:
  fixes f :: "(nat ⇒ 'a) ⇒ real"
  fixes n :: nat
  assumes "⋀i. i < n ⟹ prob_space (M i)"
  assumes "⋀i x y. i<n ⟹ {x,y} ⊆ space (PiM {..<n} M) ⟹ (∀j∈{..<n}-{i}. x j=y j) ⟹ ¦f x-f y¦≤c i"
  assumes f_meas: "f ∈ borel_measurable (PiM {..<n} M)" and ε_gt_0: "ε >0"
  shows "𝒫(ω in PiM {..<n} M. f ω - (∫ξ. f ξ ∂PiM {..<n} M) ≥ ε) ≤ exp (-(2*ε^2)/(∑i<n. (c i)^2))"
    (is "?L ≤ ?R")
proof -
  define h where "h k = (λξ. (∫ω. f (merge {..<k} {k..<n} (ξ, ω)) ∂PiM {k..<n} M))" for k

  define t :: real where "t = 4 * ε / (∑i<n. (c i)^2)"

  define V where "V i ξ = h (Suc i) ξ - h i ξ" for i ξ

  obtain x0 where x0:"x0 ∈ space (PiM {..<n} M)"
    using prob_space.not_empty[OF prob_space_PiM] assms(1) by fastforce

  have delta: "¦f x - f y¦ ≤ c i" if "i < n"
    "x ∈ PiE {..<n} (λi. space (M i))" "y ∈ PiE {..<n} (λi. space (M i))"
    "restrict x ({..<n}-{i}) = restrict y ({..<n}-{i})"
  for x y i
  proof (rule assms(2)[OF that(1)], goal_cases)
    case 1
    then show ?case using that(2,3) unfolding space_PiM by auto
  next
    case 2
    then show ?case using that(4) by (intro ballI) (metis restrict_apply')
  qed

  have c_ge_0: "c j ≥ 0" if "j < n" for j
  proof -
    have "0 ≤ ¦f x0 - f x0¦" by simp
    also have "... ≤ c j" using x0 unfolding space_PiM by (intro delta that) auto
    finally show ?thesis by simp
  qed
  hence sum_c_ge_0: "(∑i<n. (c i)^2) ≥ 0" by (meson sum_nonneg zero_le_power2)

  hence t_ge_0: "t ≥ 0" using ε_gt_0 unfolding t_def by simp

  note borel_rules =
    borel_measurable_sum measurable_compose[OF _ borel_measurable_exp]
    borel_measurable_times

  note int_rules =
    prob_space_PiM assms(1) borel_rules
    prob_space.integrable_bounded bounded_intros
  have h_n: "h n ξ = f ξ" if "ξ ∈ space (PiM {..<n} M)" for ξ
  proof -
    have "h n ξ = (∫ω. f (λi∈{..<n}. ξ i) ∂PiM {} M)"
      unfolding h_def using leD
      by (intro Bochner_Integration.integral_cong PiM_cong arg_cong[where f="f"] restrict_cong)
       auto
    also have "... = f (restrict ξ {..<n})"
      unfolding PiM_empty by simp
    also have "... = f ξ"
      using that unfolding space_PiM PiE_def
      by (simp add: extensional_restrict)
    finally show ?thesis
      by simp
  qed

  have h_0: "h 0 ξ = (∫ω. f ω ∂PiM {..<n} M)" for ξ
    unfolding h_def by (intro Bochner_Integration.integral_cong PiM_cong refl)
     (simp_all add:space_PiM atLeast0LessThan)

  have h_cong: "h j ω = h j ξ" if "restrict ω {..<j} = restrict ξ {..<j}" for j ω ξ
    using that unfolding h_def
    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"] merge_cong) auto

  have h_meas: "h i ∈ borel_measurable (PiM I M)" if "i ≤ n" "{..<i} ⊆ I" for i I
  proof -
    have 0: "{..<n} = {..<i} ∪ {i..<n}"
      using that(1) by auto

    have 1: "merge {..<i} {i..<n} = merge {..<i} {i..<n} ∘ map_prod (λx. restrict x {..<i}) id"
      unfolding merge_def map_prod_def restrict_def comp_def
      by (intro ext) (auto simp:case_prod_beta')

    have "merge {..<i} {i..<n} ∈ Pi⇩_M I M ⨂⇩_M Pi⇩_M {i..<n} M →⇩_M Pi⇩_M {..<n} M"
      unfolding 0 by (subst 1) (intro measurable_comp[OF _ measurable_merge] map_prod_measurable
          measurable_ident measurable_restrict_subset that(2))
    hence "(λx. f (merge {..<i} {i..<n} x)) ∈ borel_measurable (Pi⇩_M I M ⨂⇩_M Pi⇩_M {i..<n} M)"
      by (intro measurable_compose[OF _ f_meas])
    thus ?thesis
      unfolding h_def by (intro sigma_finite_measure.borel_measurable_lebesgue_integral
            prob_space_imp_sigma_finite prob_space_PiM assms(1)) (auto simp:case_prod_beta')
  qed

  have merge_space_aux:"merge {..<j} {j..<n} u ∈ (Π⇩_E i∈{..<n}. space (M i))"
    if "j ≤ n" "fst u ∈ Pi {..<j} (λi. space (M i))" "snd u ∈ Pi {j..<n} (λi. space (M i))"
    for u  j
  proof -
    have "merge {..<j} {j..<n} (fst u, snd u) ∈ (PiE ({..<j} ∪ {j..<n}) (λi. space (M i)))"
      using that by (intro iffD2[OF PiE_cancel_merge]) auto
    also have "... =  (Π⇩_E i∈{..<n}. space (M i))"
      using that by (intro arg_cong2[where f="PiE"] refl) auto
    finally show ?thesis by simp
  qed

  have merge_space:"merge {..<j} {j..<n} (u, v) ∈ (Π⇩_E i∈{..<n}. space (M i))"
    if "j ≤ n" "u ∈ PiE {..<j} (λi. space (M i))" "v ∈ PiE {j..<n} (λi. space (M i))"
    for u v j
    using that by (intro merge_space_aux) (simp_all add:PiE_def)

  have delta': "¦f x - f y¦ ≤ (∑i<n. c i)"
    if "x ∈ PiE {..<n} (λi. space (M i))" "y ∈ PiE {..<n} (λi. space (M i))" for x y
  proof -
    define m where "m i = merge {..<i} {i..<n} (x,y)" for i

    have 0: "z ∈ Pi I (λi. space (M i))" if "z ∈ PiE {..<n} (λi. space (M i))"
       "I ⊆ {..<n}" for z I
      using that unfolding PiE_def by auto

    have 3: "{..<Suc i} ∩ ({..<n} - {i}) = {..<i}"
      "{Suc i..<n} ∩ ({..<n} - {i}) = {Suc i..<n}"
      "{..<i} ∩ ({..<n} - {i}) = {..<i}"
      "{i..<n} ∩ ({..<n} - {i}) = {Suc i..<n}"
      if "i < n" for i
      using that by auto

    have "¦f x - f y¦ = ¦f (m n) - f(m 0)¦"
      using that unfolding m_def by (simp add:atLeast0LessThan)
    also have "... = ¦∑i < n. f (m (Suc i)) - f (m i)¦"
      by (subst sum_lessThan_telescope) simp
    also have "... ≤ (∑i < n. ¦f (m (Suc i)) - f (m i)¦)"
      by simp
    also have "... ≤ (∑i < n. c i)"
      using that unfolding m_def by (intro delta sum_mono merge_space_aux 0 subsetI)
       (simp_all add:restrict_merge 3)
    finally show ?thesis
      by simp
  qed

  have "norm (f x) ≤ norm (f x0) + sum c {..<n}" if "x ∈ space (Pi⇩_M {..<n} M)" for x
  proof -
    have "¦f x - f x0¦ ≤ sum c {..<n}"
      using x0 that unfolding space_PiM by (intro delta') auto
    thus ?thesis
      by simp
  qed
  hence f_bounded: "bounded (f ` space (PiM {..<n} M))"
    by (intro boundedI[where B="norm (f x0) + (∑i<n. c i)"]) auto

  have f_merge_bounded:
    "bounded ((λω. (f (merge {..<j} {j..<n} (u, ω)))) ` space (Pi⇩_M {j..<n} M))"
    if "j ≤ n" "u ∈ PiE {..<j} (λi. space (M i))" for u j
  proof -
    have "(λω. merge {..<j} {j..<n} (u, ω)) ` space (Pi⇩_M {j..<n} M) ⊆ space (Pi⇩_M {..<n} M)"
      using that  unfolding space_PiM
      by (intro image_subsetI merge_space) auto
    thus ?thesis
      by (subst image_image[of "f",symmetric]) (intro bounded_subset[OF f_bounded] image_mono)
  qed

  have f_merge_meas_aux:
    "(λω. f (merge {..<j} {j..<n} (u, ω))) ∈ borel_measurable (Pi⇩_M {j..<n} M)"
    if "j ≤ n" "u ∈ Pi {..<j} (λi. space (M i))" for j u
  proof -

    have 0: "{..<n} = {..<j } ∪ {j ..<n}"
      using that(1) by auto

    have 1: "merge {..<j} {j..<n} (u,ω) = merge {..<j} {j..<n} (restrict u {..<j},ω)" for ω
      by (intro merge_cong) auto

    have "(λω. merge {..<j} {j..<n} (u, ω)) ∈ Pi⇩_M {j..<n} M →⇩_M Pi⇩_M {..<n} M"
      using that unfolding 0 1
      by (intro measurable_compose[OF _ measurable_merge] measurable_Pair1')
       (simp add:space_PiM)
    thus ?thesis
      by (intro measurable_compose[OF _ f_meas])
  qed

  have f_merge_meas: "(λω. f (merge {..<j} {j..<n} (u, ω))) ∈ borel_measurable (Pi⇩_M {j..<n} M)"
    if "j ≤ n" "u ∈ PiE {..<j} (λi. space (M i))" for j u
    using that unfolding PiE_def by (intro f_merge_meas_aux) auto

  have h_bounded: "bounded (h i ` space (PiM I M))"
    if h_bounded_assms: "i ≤ n" "{..<i} ⊆ I" for i I
  proof -
    have "merge {..<i} {i..<n} x ∈ space (Pi⇩_M {..<n} M)"
      if "x ∈ (Π⇩_E i∈I. space (M i)) × (Π⇩_E i∈{i..<n}. space (M i))" for x
      using that h_bounded_assms unfolding space_PiM by (intro merge_space_aux)
        (auto simp: PiE_def mem_Times_iff)
    hence "bounded ((λx. f (merge {..<i} {i..<n} x)) `
      ((Π⇩_E i∈I. space (M i)) × (Π⇩_E i∈{i..<n}. space (M i))))"
      by (subst image_image[of "f",symmetric])
       (intro bounded_subset[OF f_bounded] image_mono image_subsetI)
    thus ?thesis
      using that unfolding h_def
      by (intro prob_space.finite_measure finite_measure.bounded_int int_rules)
        (auto simp:space_PiM PiE_def)
  qed

  have V_bounded: "bounded (V i ` space (PiM I M))"
    if "i < n" "{..<i+1} ⊆ I" for i I
    using that unfolding V_def by (intro bounded_intros h_bounded) auto

  have V_upd_bounded: "bounded ((λx. V j (ξ(j := x))) ` space (M j))"
    if V_upd_bounded_assms: "ξ ∈ space (Pi⇩_M {..<j} M)" "j < n" for j ξ
  proof -
    have "ξ(j := v) ∈ space (Pi⇩_M {..<j + 1} M)" if "v ∈ space (M j)" for v
      using V_upd_bounded_assms that unfolding space_PiM PiE_def extensional_def Pi_def by auto
    thus ?thesis
        using that unfolding image_image[of "V j" "(λx. (ξ(j := x)))",symmetric]
        by (intro bounded_subset[OF V_bounded[of "j" "{..<j+1}"]] that image_mono) auto
  qed

  have h_step: "h j ω = ∫τ. h (j+1) (ω (j := τ)) ∂ M j" (is "?L1 = ?R1")
    if "ω ∈ space (PiM {..<j} M)" "j < n" for j ω
  proof -
    have 0: "(λx. f (merge {..<j} {j..<n} (ω, x))) ∈ borel_measurable (Pi⇩_M {j..<n} M)"
      using that unfolding space_PiM by (intro f_merge_meas) auto

    have 1: "insert j {Suc j..<n} = {j..<n}"
      using that by auto

    have 2: "bounded ((λx.(f (merge {..<j} {j..<n} (ω, x)))) ` space (Pi⇩_M {j..<n} M))"
      using that by (intro f_merge_bounded) (simp_all add: space_PiM)

    have "?L1 = (∫ξ. f (merge {..<j} {j..<n} (ω, ξ)) ∂PiM (insert j {j+1..<n}) M)"
      unfolding h_def using that by (intro Bochner_Integration.integral_cong refl PiM_cong) auto
    also have "...=(∫τ.(∫ξ. f (merge {..<j} {j..<n} (ω, (ξ(j := τ)))) ∂PiM {j+1..<n} M)∂M j)"
      using that(1,2) 0 1 2 by (intro product_integral_insert prob_space_imp_sigma_finite assms(1)
          int_rules f_merge_meas) (simp_all)
    also have "... = ?R1"
      using that(2) unfolding h_def
      by (intro Bochner_Integration.integral_cong arg_cong[where f="f"] ext) (auto simp:merge_def)
    finally show ?thesis
      by simp
  qed

  have V_meas: "V i ∈ borel_measurable (PiM I M)" if "i < n" "{..<i+1} ⊆ I" for i I
    unfolding V_def using that by (intro borel_measurable_diff h_meas) auto

  have V_upd_meas: "(λx. V j (ξ(j := x))) ∈ borel_measurable (M j)"
    if "j < n" "ξ ∈ space (Pi⇩_M {..<j} M)" for j ξ
    using that by (intro measurable_compose[OF _ V_meas[where I="insert j {..<j}"]]
          measurable_component_update) auto

  have V_cong:
    "V j ω = V j ξ" if "restrict ω {..<(j+1)} = restrict ξ {..<(j+1)}" for j ω ξ
    using that restrict_subset_eq[OF _ that] unfolding V_def
    by (intro arg_cong2[where f="(-)"] h_cong) simp_all

  have exp_V: "(∫ω. V j (ξ(j := ω)) ∂M j) = 0" (is "?L1 = 0")
    if "j < n" "ξ ∈ space (PiM {..<j} M)" for j ξ
  proof -

    have "fun_upd ξ j ` space (M j) ⊆ space (Pi⇩_M (insert j {..<j}) M)"
      using that unfolding space_PiM by (intro image_subsetI PiE_fun_upd) auto
    hence 0:"bounded ((λx. h (Suc j) (ξ(j := x))) ` space (M j))"
      unfolding image_image[of "h (Suc j)" "λx. ξ(j := x)",symmetric] using that
      by (intro bounded_subset[OF h_bounded[where i="j+1" and I="{..<j+1}"]] image_mono)
        (auto simp:lessThan_Suc)

    have 1:"(λx. h (Suc j) (ξ(j := x))) ∈ borel_measurable (M j)"
      using h_meas that by (intro measurable_compose[OF _ h_meas[where I="insert j {..<j}"]]
          measurable_component_update) auto

    have "?L1 =(∫ω. h (Suc j) (ξ(j := ω)) - h j ξ ∂M j)"
      unfolding V_def
      by (intro Bochner_Integration.integral_cong arg_cong2[where f="(-)"] refl h_cong) auto
    also have "... = (∫ω. h (Suc j) (ξ(j := ω)) ∂M j) - (∫ω. h j ξ ∂M j)"
      using that by (intro Bochner_Integration.integral_diff int_rules 0 1) auto
    also have "... = 0"
      using that(1) assms(1) prob_space.prob_space unfolding h_step[OF that(2,1)] by auto
    finally show ?thesis
      by simp
  qed

  have var_V: "¦V j x - V j y¦ ≤ c j" (is "?L1 ≤ ?R1")
    if var_V_assms: "j < n" "{x,y} ⊆ space (PiM {..<j+1} M)"
       "restrict x {..<j} = restrict y {..<j}"  for x y j
  proof -
    have x_ran: "x ∈ PiE {..<j+1} (λi. space (M i))" and y_ran: "y ∈ PiE {..<j+1} (λi. space (M i))"
      using that(2) by (simp_all add:space_PiM)

    have 0: "j+1 ≤ n"
      using that by simp

    have "?L1 = ¦h (Suc j) x - h j y - (h (Suc j) y - h j y)¦"
      unfolding V_def by (intro arg_cong[where f="abs"] arg_cong2[where f="(-)"] refl h_cong that)
    also have "... = ¦h (j+1) x - h (j+1) y¦"
      by simp
    also have "... =
      ¦(∫ω. f(merge {..<j+1} {j+1..<n} (x,ω))-f(merge {..<j+1} {j+1..<n} (y,ω)) ∂PiM {j+1..<n} M)¦"
      using that unfolding h_def by (intro arg_cong[where f="abs"] f_merge_meas[OF 0] x_ran
          Bochner_Integration.integral_diff[symmetric] int_rules f_merge_bounded[OF 0] y_ran) auto
    also have "... ≤
      (∫ω. ¦f(merge {..<j+1} {j+1..<n} (x,ω))-f(merge {..<j+1} {j+1..<n} (y,ω))¦ ∂PiM {j+1..<n} M)"
      by (intro integral_abs_bound)
    also have "... ≤ (∫ω. c j ∂PiM {j+1..<n} M)"
    proof (intro Bochner_Integration.integral_mono' delta int_rules c_ge_0 ballI merge_space 0)
      fix ω assume "ω ∈ space (Pi⇩_M {j + 1..<n} M)"
      have "{..<j + 1} ∩ ({..<n} - {j}) = {..<j}"
        using that by auto
      thus "restrict (merge {..<j+1} {j+1..<n} (x, ω)) ({..<n}-{j}) =
            restrict (merge {..<j+1} {j+1..<n} (y, ω)) ({..<n}-{j})"
        using that(1,3) less_antisym unfolding restrict_merge by (intro merge_cong refl) auto
    qed (simp_all add: space_PiM that(1) x_ran[simplified] y_ran[simplified])
    also have "... = c j"
      by (auto intro!:prob_space.prob_space prob_space_PiM assms(1))
    finally show ?thesis by simp
  qed

  have "f ξ - (∫ω. f ω ∂(PiM {..<n} M)) = (∑i < n. V i ξ)" if "ξ ∈ space (PiM {..<n} M)" for ξ
    using that unfolding V_def by (subst sum_lessThan_telescope) (simp add: h_0 h_n)
  hence "?L = 𝒫(ξ in PiM {..<n} M. (∑i < n. V i ξ) ≥ ε)"
    by (intro arg_cong2[where f="measure"] refl Collect_restr_cong arg_cong2[where f="(≤)"]) auto
  also have "... ≤ 𝒫(ξ in PiM {..<n} M. exp( t * (∑i < n. V i ξ) ) ≥ exp (t * ε))"
  proof (intro finite_measure.finite_measure_mono subsetI prob_space.finite_measure int_rules)
    show "{ξ ∈ space (Pi⇩_M {..<n} M). exp (t * ε) ≤ exp (t * (∑i<n. V i ξ))} ∈ sets (Pi⇩_M {..<n} M)"
      using V_meas by measurable
  qed  (auto intro!:mult_left_mono[OF _ t_ge_0])
  also have "... ≤ (∫ξ. exp(t*(∑i < n. V i ξ)) ∂PiM {..<n} M)/ exp (t*ε)"
    by (intro integral_Markov_inequality_measure[where A="{}"] int_rules V_bounded V_meas) auto
  also have "... = exp(t^2 * (∑i∈{n..<n}. c i^2)/8-t*ε)*(∫ξ. exp(t*(∑i < n. V i ξ)) ∂PiM {..<n} M)"
    by (simp add:exp_minus inverse_eq_divide)
  also have "... ≤ exp(t^2 * (∑i∈{0..<n}. c i^2)/8-t*ε)*(∫ξ. exp(t*(∑i < 0. V i ξ)) ∂PiM {..<0} M)"
  proof (rule ineq_chain)
    fix j assume a:"j < n"
    let ?L1 = "exp (t⇧²*(∑i=j+1..<n. (c i)⇧²)/8-t*ε)"
    let ?L2 = "?L1 * (∫ξ. exp (t * (∑i<j+1. V i ξ)) ∂PiM {..<j+1} M)"

    note V_upd_meas = V_upd_meas[OF a]

    have "?L2 = ?L1 * (∫ξ. exp (t * (∑i<j. V i ξ)) * exp(t * V j ξ) ∂PiM (insert j {..<j}) M)"
      by (simp add:algebra_simps exp_add lessThan_Suc)
    also have "... = ?L1 *
      (∫ξ. (∫ω. exp (t * (∑i<j. V i (ξ(j := ω)))) * exp(t * V j (ξ(j := ω))) ∂M j) ∂PiM {..<j} M)"
      using a by (intro product_integral_insert_rev arg_cong2[where f="(*)"] int_rules
          prob_space_imp_sigma_finite V_bounded V_meas) auto
    also have "... =?L1*(∫ξ.(∫ω. exp (t*(∑i<j. V i ξ))*exp(t*V j (ξ(j := ω))) ∂M j) ∂PiM {..<j} M)"
      by (intro arg_cong2[where f="(*)"] Bochner_Integration.integral_cong
          arg_cong[where f="exp"] sum.cong V_cong restrict_fupd) auto
    also have "... =?L1*(∫ξ. exp (t*(∑i<j. V i ξ))*(∫ω. exp(t*V j (ξ(j := ω))) ∂M j) ∂PiM {..<j} M)"
      using a by (intro arg_cong2[where f="(*)"] Bochner_Integration.integral_cong refl
          Bochner_Integration.integral_mult_right V_upd_meas V_upd_bounded int_rules) auto
    also have "... ≤ ?L1 * ∫ξ. exp (t*(∑i<j. V i ξ))* exp (t^2 * c j^2/8) ∂PiM {..<j} M"
    proof (intro mult_left_mono integral_mono')
      fix ξ assume c:"ξ ∈ space (Pi⇩_M {..<j} M)"
      hence b:"ξ ∈ PiE {..<j} (λi. space (M i))"
        unfolding space_PiM by simp
      moreover have "ξ(j := v) ∈ PiE {..<j+1} (λi. space (M i))" if "v ∈ space (M j)" for v
        using b that unfolding PiE_def extensional_def Pi_def by auto
      ultimately show "LINT ω|M j. exp (t * V j (ξ(j := ω))) ≤ exp (t⇧² * (c j)⇧² / 8)"
        using V_upd_meas[OF c]
        by (intro prob_space.Hoeffdings_lemma_bochner_3 exp_V var_V a int_rules)
          (auto simp: space_PiM)
    next
      show "integrable (Pi⇩_M {..<j} M) (λx. exp (t * (∑i<j. V i x)) * exp (t⇧² * (c j)⇧² / 8))"
        using a by (intro int_rules V_bounded V_meas) auto
    qed auto
    also have "... = ?L1 * ((∫ξ. exp (t*(∑i<j. V i ξ)) ∂PiM {..<j} M) * exp (t^2 * c j^2/8))"
    proof (subst Bochner_Integration.integral_mult_left)
      show "integrable (Pi⇩_M {..<j} M) (λξ. exp (t * (∑i<j. V i ξ)))"
        using a by (intro int_rules V_bounded V_meas) auto
    qed auto
    also have "... =
      exp (t⇧²*(∑i∈insert j {j+1..<n}. (c i)⇧²)/8-t*ε) * (∫ξ. exp (t * (∑i<j. V i ξ))∂PiM {..<j} M)"
      by (simp_all add:exp_add[symmetric] field_simps)
    also have "...=exp (t⇧²*(∑i=j..<n. (c i)⇧²)/8-t*ε) * (∫ξ. exp (t * (∑i<j. V i ξ))∂PiM {..<j} M)"
      using a by (intro arg_cong2[where f="(*)"] arg_cong[where f="exp"] refl arg_cong2
          [where f="(-)"] arg_cong2[where f="(/)"] sum.cong) auto
    finally show "?L2≤exp(t⇧²*(∑i=j..<n. (c i)⇧²)/8-t*ε)*(∫ξ. exp (t*(∑i<j. V i ξ))∂PiM {..<j} M)"
      by simp
  qed
  also have "... = exp(t^2 * (∑i<n. c i^2)/8-t*ε)" by (simp add:PiM_empty atLeast0LessThan)
  also have "... = exp(t * ((t * (∑i<n. c i^2)/8)-ε))" by (simp add:algebra_simps power2_eq_square)
  also have "... = exp(t * (-ε/2))" using sum_c_ge_0 by (auto simp add:divide_simps t_def)
  also have "... = ?R" unfolding t_def by (simp add:field_simps power2_eq_square)
  finally show ?thesis by simp
qed

theorem mc_diarmid_inequality_distr:
  fixes f :: "('i ⇒ 'a) ⇒ real"
  assumes "finite I"
  assumes "⋀i. i ∈ I ⟹ prob_space (M i)"
  assumes "⋀i x y. i ∈ I ⟹ {x,y} ⊆ space (PiM I M) ⟹ (∀j∈I-{i}. x j=y j) ⟹ ¦f x-f y¦≤c i"
  assumes f_meas: "f ∈ borel_measurable (PiM I M)" and ε_gt_0: "ε > 0"
  shows "𝒫(ω in PiM I M. f ω - (∫ξ. f ξ ∂PiM I M) ≥ ε) ≤ exp (-(2*ε^2)/(∑i∈I. (c i)^2))"
    (is "?L ≤ ?R")
proof -
  define n where "n = card I"
  let ?q = "from_nat_into I"
  let ?r = "to_nat_on I"
  let ?f = "(λξ. f (λi∈I. ξ (?r i)))"

  have q: "bij_betw ?q {..<n} I" unfolding n_def by (intro bij_betw_from_nat_into_finite assms(1))
  have r: "bij_betw ?r I {..<n}" unfolding n_def by (intro to_nat_on_finite assms(1))

  have [simp]: "?q (?r x) = x" if "x ∈ I" for x
    by (intro from_nat_into_to_nat_on that countable_finite assms(1))

  have [simp]: "?r (?q x) = x" if "x < n" for x
    using bij_betw_imp_surj_on[OF r] that by (intro to_nat_on_from_nat_into) auto

  have a: "⋀i. i ∈ {..<n} ⟹ prob_space ((M ∘ ?q) i)"
    unfolding comp_def by (intro assms(2) bij_betw_apply[OF q])

  have b:"PiM I M = PiM I (λi. (M ∘ ?q) (?r i))" by (intro PiM_cong) (simp_all add:comp_def)
  also have "... = distr (PiM {..<n} (M ∘ ?q)) (PiM I (λi. (M ∘ ?q) (?r i))) (λω. λn∈I. ω (?r n))"
    using r unfolding bij_betw_def by (intro distr_PiM_reindex[symmetric] a) auto
  finally have c: "PiM I M = distr (PiM{..<n}(M∘?q)) (PiM I (λi.(M∘?q)(?r i))) (λω. λn∈I. ω (?r n))"
    by simp

  have d: "(λn∈I. x (?r n)) ∈ space (Pi⇩_M I M)" if 4:"x ∈ space (Pi⇩_M {..<n} (M ∘ ?q))" for x
  proof -
    have "x (?r i) ∈ space (M i)" if "i ∈ I" for i
    proof -
      have "?r i ∈ {..<n}" using bij_betw_apply[OF r] that by simp
      hence "x (?r i) ∈ space ((M ∘ ?q) (?r i))" using that 4 PiE_mem unfolding space_PiM by blast
      thus ?thesis using that unfolding comp_def by simp
    qed
    thus ?thesis unfolding space_PiM PiE_def by auto
  qed

  have "?L = 𝒫(ω in PiM {..<n} (M ∘ ?q). ?f ω - (∫ξ. f ξ ∂PiM I M) ≥ ε)"
  proof (subst c, subst measure_distr, goal_cases)
    case 1 thus ?case
      by (intro measurable_restrict measurable_component_singleton bij_betw_apply[OF r])
  next
    case 2 thus ?case unfolding b[symmetric] by (intro measurable_sets_Collect[OF f_meas]) auto
  next
    case 3 thus ?case using d by (intro arg_cong2[where f="measure"] refl) (auto simp:vimage_def)
  qed
  also have "... = 𝒫(ω in PiM {..<n} (M ∘ ?q). ?f ω - (∫ξ. ?f ξ ∂PiM {..<n} (M ∘ ?q)) ≥ ε)"
  proof (subst c, subst integral_distr, goal_cases)
    case (1 ω) thus ?case
      by (intro measurable_restrict measurable_component_singleton bij_betw_apply[OF r])
  next
    case (2 ω) thus ?case unfolding b[symmetric] by (rule f_meas)
  next
    case 3 thus ?case by simp
  qed
  also have "... ≤ exp (-(2*ε^2)/(∑i<n. (c (?q i))^2))"
  proof (intro mc_diarmid_inequality_aux ε_gt_0, goal_cases)
    case (1 i) thus ?case by (intro a) auto
  next
    case (2 i x y)
    have "x (?r j) = y (?r j)" if "j ∈ I - {?q i}" for j
    proof -
      have "?r j ∈ {..<n} - {i}" using that bij_betw_apply[OF r] by auto
      thus ?thesis using 2 by simp
    qed
    hence "∀j∈I - {?q i}. (λi∈I. x (?r i)) j = (λi∈I. y (?r i)) j" by auto
    thus ?case using 2 d by (intro assms(3) bij_betw_apply[OF q]) auto
  next
    case 3
    have "(λx. x (?r i)) ∈ Pi⇩_M {..<n} (M ∘ ?q) →⇩_M M i" if "i ∈ I" for i
    proof -
      have 0:"M i = (M ∘ ?q) (?r i)" using that by (simp add: comp_def)
      show ?thesis unfolding 0 by (intro measurable_component_singleton bij_betw_apply[OF r] that)
    qed
    thus ?case by (intro measurable_compose[OF _ f_meas] measurable_restrict)
  qed
  also have "... = ?R" by (subst sum.reindex_bij_betw[OF q]) simp
  finally show ?thesis by simp
qed

lemma (in prob_space) mc_diarmid_inequality_classic:
  fixes f :: "('i ⇒ 'a) ⇒ real"
  assumes "finite I"
  assumes "indep_vars N X I"
  assumes "⋀i x y. i ∈ I ⟹ {x,y} ⊆ space (PiM I N) ⟹ (∀j∈I-{i}. x j=y j) ⟹ ¦f x-f y¦≤c i"
  assumes f_meas: "f ∈ borel_measurable (PiM I N)" and ε_gt_0: "ε > 0"
  shows "𝒫(ω in M. f (λi∈I. X i ω) - (∫ξ. f (λi∈I. X i ξ) ∂M) ≥ ε) ≤ exp (-(2*ε^2)/(∑i∈I. (c i)^2))"
    (is "?L ≤ ?R")
proof -
  note indep_imp = iffD1[OF indep_vars_iff_distr_eq_PiM'']
  let ?O = "λi. distr M (N i) (X i)"
  have a:"distr M (Pi⇩_M I N) (λx. λi∈I. X i x) = Pi⇩_M I ?O"
    using assms(2) unfolding indep_vars_def by (intro indep_imp[OF _ assms(2)]) auto

  have b: "space (PiM I ?O) = space (PiM I N)"
    by (metis (no_types, lifting) a space_distr)

  have "(λi∈I. X i ω) ∈ space (Pi⇩_M I N)" if "ω ∈ space M" for ω
    using assms(2) that unfolding indep_vars_def measurable_def space_PiM by auto

  hence "?L = 𝒫(ω in M. (λi∈I. X i ω)∈ space (Pi⇩_M I N)∧ f (λi∈I. X i ω)-(∫ξ. f (λi∈I. X i ξ) ∂M)≥ε)"
    by (intro arg_cong2[where f="measure"] Collect_restr_cong refl) auto
  also have "... = 𝒫(ω in distr M (Pi⇩_M I N) (λx. λi∈I. X i x). f ω - (∫ξ. f (λi∈I. X i ξ) ∂M) ≥ ε)"
  proof (subst measure_distr, goal_cases)
    case 1 thus ?case using assms(2) unfolding indep_vars_def by (intro measurable_restrict) auto
  next
    case 2 thus ?case unfolding space_distr by (intro measurable_sets_Collect[OF f_meas]) auto
  next
    case 3 thus ?case by (simp_all add:Int_def conj_commute)
  qed
  also have "... = 𝒫(ω in PiM I ?O. f ω - (∫ξ. f (λi∈I. X i ξ) ∂M) ≥ ε)"
    unfolding a by simp
  also have "... = 𝒫(ω in PiM I ?O. f ω - (∫ξ. f ξ ∂ distr M (Pi⇩_M I N) (λx. λi∈I. X i x)) ≥ ε)"
  proof (subst integral_distr[OF _ f_meas], goal_cases)
    case (1 ω) thus ?case using assms(2) unfolding indep_vars_def by (intro measurable_restrict)auto
  next
    case 2 thus ?case by simp
  qed
  also have "... = 𝒫(ω in PiM I ?O. f ω - (∫ξ. f ξ ∂ Pi⇩_M I ?O) ≥ ε)" unfolding a by simp
  also have "... ≤ ?R"
    using f_meas assms(2) b unfolding indep_vars_def
    by (intro mc_diarmid_inequality_distr prob_space_distr assms(1) ε_gt_0 assms(3)) auto
  finally show ?thesis by simp
qed

end