Theory Concentration_Inequalities.McDiarmid_Inequality

section ‹McDiarmid's inequality›

text ‹In this section we verify McDiarmid's inequality \cite[Lemma 1.2]{mcdiarmid1989}. In the
source and also further sources sometimes refer to the result as the ``independent bounded
differences'' inequality.›

theory McDiarmid_Inequality
  imports Concentration_Inequalities_Preliminary
begin

lemma Collect_restr_cong:
  assumes "A = B"
  assumes "x. x  A  P x = Q x"
  shows "{x  A. P x} = {x  B. Q x}"
  using assms by auto

lemma ineq_chain:
  fixes h :: "nat  real"
  assumes "i. i < n  h (i+1)  h i"
  shows "h n  h 0"
  using assms by (induction n) force+

lemma restrict_subset_eq:
  assumes "A  B"
  assumes "restrict f B = restrict g B"
  shows "restrict f A = restrict g A"
  using assms unfolding restrict_def by (meson subsetD)

text ‹Bochner Integral version of Hoeffding's Lemma using
  @{thm [source] interval_bounded_random_variable.Hoeffdings_lemma_nn_integral_0}

lemma (in prob_space) Hoeffdings_lemma_bochner:
  assumes "l > 0" and E0: "expectation f = 0"
  assumes "random_variable borel f"
  assumes "AE x in M. f x  {a..b::real}"
  shows   "expectation (λx. exp (l * f x))  exp (l2 * (b - a)2 / 8)" (is "?L  ?R")
proof -
  interpret interval_bounded_random_variable M f a b
    using assms by (unfold_locales) auto

  have "integrable M (λx. exp (l * f x))"
    using assms(1,3,4) by (intro integrable_const_bound[where B="exp (l * b)"]) simp_all

  hence "ennreal (?L) = (+ x. exp (l * f x) M)"
    by (intro nn_integral_eq_integral[symmetric]) auto
  also have "...  ennreal (?R)"
    by (intro Hoeffdings_lemma_nn_integral_0 assms)
  finally have 0:"ennreal (?L)  ennreal ?R"
    by simp
  show ?thesis
  proof (cases "?L  0")
    case True
    thus ?thesis using 0 by simp
  next
    case False
    hence "?L  0" by simp
    also have "...  ?R" by simp
    finally show ?thesis by simp
  qed
qed

lemma (in prob_space) Hoeffdings_lemma_bochner_2:
  assumes "l > 0" and E0: "expectation f = 0"
  assumes "random_variable borel f"
  assumes "x y. {x,y}  space M  ¦f x - f y¦  (c::real)"
  shows   "expectation (λx. exp (l * f x))  exp (l^2 * c^2 / 8)" (is "?L  ?R")
proof -
  define a :: real where "a = (INF x  space M. f x)"
  define b :: real where "b = a+c"

  obtain ω where ω:"ω  space M" using not_empty by auto
  hence 0:"f ` space M  {}" by auto
  have 1: "c = b - a" unfolding b_def by simp

  have "bdd_below (f ` space M)"
    using ω assms(4) unfolding abs_le_iff
    by (intro bdd_belowI[where m="f ω - c"]) (auto simp add:algebra_simps)
  hence "f x  a" if "x  space M" for x unfolding a_def by (intro cINF_lower that)
  moreover have "f x  b" if x_space: "x  space M" for x
  proof (rule ccontr)
    assume "¬(f x  b)"
    hence a:"f x > a + c" unfolding b_def by simp
    have "f y  f x - c" if "y  space M" for y
      using that x_space assms(4) unfolding abs_le_iff by (simp add:algebra_simps)
    hence "f x - c  a" unfolding a_def using cInf_greatest[OF 0] by auto
    thus "False" using a by simp
  qed
  ultimately have "f x  {a..b}" if "x  space M" for x using that by auto
  hence "AE x in M. f x  {a..b}" by simp
  thus ?thesis unfolding 1 by (intro Hoeffdings_lemma_bochner assms(1,2,3))
qed

lemma (in prob_space) Hoeffdings_lemma_bochner_3:
  assumes "expectation f = 0"
  assumes "random_variable borel f"
  assumes "x y. {x,y}  space M  ¦f x - f y¦  (c::real)"
  shows   "expectation (λx. exp (l * f x))  exp (l^2 * c^2 / 8)" (is "?L  ?R")
proof -
  consider (a) "l > 0" | (b) "l = 0" | (c) "l < 0"
    by argo
  then show ?thesis
  proof (cases)
    case a thus ?thesis by (intro Hoeffdings_lemma_bochner_2 assms) auto
  next
    case b thus ?thesis by simp
  next
    case c
    have "?L = expectation (λx. exp ((-l) * (-f x)))" by simp
    also have "...  exp ((-l)^2 * c2/8)" using c assms by (intro Hoeffdings_lemma_bochner_2) auto
    also have "... = ?R" by simp
    finally show ?thesis by simp
  qed
qed

text ‹Version of @{thm [source] product_sigma_finite.product_integral_singleton} without the
condition that @{term "M i"} has to be sigma finite for all @{term "i"}:›

lemma product_integral_singleton:
  fixes f :: "_  _::{banach, second_countable_topology}"
  assumes "sigma_finite_measure (M i)"
  assumes "f  borel_measurable (M i)"
  shows "(x. f (x i) (PiM {i} M)) = (x. f x (M i))" (is "?L = ?R")
proof -
  define M' where "M' j = (if j=i then M i else count_space {undefined})" for j

  interpret product_sigma_finite "M'"
    using assms(1) unfolding product_sigma_finite_def M'_def
    by (auto intro!:sigma_finite_measure_count_space_finite)

  have "?L = x. f (x i) (PiM {i} M')"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  also have "... = (x. f x (M' i))"
    using assms(2) by (intro product_integral_singleton) (simp add:M'_def)
  also have "... = ?R"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  finally show ?thesis by simp
qed

text ‹Version of @{thm [source] product_sigma_finite.product_integral_fold} without the
condition that @{term "M i"} has to be sigma finite for all @{term "i"}:›

lemma product_integral_fold:
  fixes f :: "_  _::{banach, second_countable_topology}"
  assumes "i. i  I  J  sigma_finite_measure (M i)"
  assumes "I  J = {}"
  assumes "finite I"
  assumes "finite J"
  assumes "integrable (PiM (I  J) M) f"
  shows "(x. f x PiM (I  J) M) = (x. (y. f (merge I J(x,y)) PiM J M) PiM I M)" (is "?L = ?R")
    and "integrable (PiM I M) (λx. (y. f (merge I J(x,y)) PiM J M))" (is "?I")
    and "AE x in PiM I M. integrable (PiM J M) (λy. f (merge I J(x,y)))" (is "?T")
proof -
  define M' where "M' i = (if i  I  J then M i else count_space {undefined})" for i

  interpret product_sigma_finite "M'"
    using assms(1) unfolding product_sigma_finite_def M'_def
    by (auto intro!:sigma_finite_measure_count_space_finite)

  interpret pair_sigma_finite "PiM I M'" "PiM J M'"
    using assms(3,4) sigma_finite unfolding pair_sigma_finite_def by blast

  have 0: "integrable (PiM (I  J) M') f = integrable (PiM (I  J) M) f"
    by (intro Bochner_Integration.integrable_cong PiM_cong) (simp_all add:M'_def)

  have "?L = (x. f x PiM (I  J) M')"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  also have "... = (x. (y. f (merge I J (x,y)) PiM J M') PiM I M')"
    using assms(5) by (intro product_integral_fold assms(2,3,4)) (simp add:0)
  also have "... = ?R"
    by (intro Bochner_Integration.integral_cong PiM_cong) (simp_all add:M'_def)
  finally show "?L = ?R" by simp

  have "integrable (PiM (I  J) M') f = integrable (PiM I M' M PiM J M') (λx. f (merge I J x))"
    using assms(5) apply (subst distr_merge[OF assms(2,3,4),symmetric])
    by (intro integrable_distr_eq) (simp_all add:0[symmetric])
  hence 1:"integrable (PiM I M' M PiM J M') (λx. f (merge I J x))"
    using assms(5) 0 by simp

  hence "integrable (PiM I M') (λx. (y. f (merge I J(x,y)) PiM J M'))" (is "?I'")
    by (intro integrable_fst') auto
  moreover have "?I' = ?I"
    by (intro Bochner_Integration.integrable_cong PiM_cong ext Bochner_Integration.integral_cong)
     (simp_all add:M'_def)
  ultimately show "?I"
    by simp

  have "AE x in PiM I M'. integrable (PiM J M') (λy. f (merge I J (x, y)))" (is "?T'")
    by (intro AE_integrable_fst'[OF 1])
  moreover have "?T' = ?T"
    by (intro arg_cong2[where f="almost_everywhere"] PiM_cong ext Bochner_Integration.integrable_cong)
     (simp_all add:M'_def)
  ultimately show  "?T"
    by simp
qed

lemma product_integral_insert:
  fixes f :: "_  _::{banach, second_countable_topology}"
  assumes "k. k  {i}  J  sigma_finite_measure (M k)"
  assumes "i  J"
  assumes "finite J"
  assumes "integrable (PiM (insert i J) M) f"
  shows "(x. f x PiM (insert i J) M) = (x. (y. f (y(i := x)) PiM J M) M i)" (is "?L = ?R")
proof -
  note meas_cong = iffD1[OF measurable_cong]

  have "integrable (PiM {i} M) (λx. (y. f (merge {i} J (x,y)) PiM J M))"
    using assms by (intro product_integral_fold) auto
  hence 0:"(λx. (y. f (merge {i} J (x,y)) PiM J M))  borel_measurable (PiM {i} M)"
    using borel_measurable_integrable by simp
  have 1:"(λx. (y. f (y(i := (x i))) PiM J M))  borel_measurable (PiM {i} M)"
    by (intro meas_cong[OF _ 0] Bochner_Integration.integral_cong arg_cong[where f="f"])
     (auto simp add:space_PiM merge_def fun_upd_def PiE_def extensional_def)
  have "(λx. (y. f (y(i := (λi{i}. x) i)) PiM J M))  borel_measurable (M i)"
    by (intro measurable_compose[OF _ 1, where f="(λx. (λi{i}. x))"] measurable_restrict) auto
  hence 2:"(λx. (y. f (y(i := x )) PiM J M))  borel_measurable (M i)" by simp

  have "?L = (x. f x PiM ({i}  J) M)" by simp
  also have "... = (x. (y. f (merge {i} J (x,y)) PiM J M) PiM {i} M)"
    using assms(2,4) by (intro product_integral_fold assms(1,3)) auto
  also have "... = (x. (y. f (y(i := (x i))) PiM J M) PiM {i} M)"
    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"])
     (auto simp add:space_PiM merge_def fun_upd_def PiE_def extensional_def)
  also have "... = ?R"
    using assms(1,4) by (intro product_integral_singleton assms(1) 2) auto
  finally show ?thesis by simp
qed

lemma product_integral_insert_rev:
  fixes f :: "_  _::{banach, second_countable_topology}"
  assumes "k. k  {i}  J  sigma_finite_measure (M k)"
  assumes "i  J"
  assumes "finite J"
  assumes "integrable (PiM (insert i J) M) f"
  shows "(x. f x PiM (insert i J) M) = (y. (x. f (y(i := x)) M i) PiM J M)" (is "?L = ?R")
proof -
  have "?L = (x. f x PiM (J  {i}) M)" by simp
  also have "... = (x. (y. f (merge J {i} (x,y)) PiM {i} M) PiM J M)"
    using assms(2,4) by (intro product_integral_fold assms(1,3)) auto
  also have "... = (x. (y. f (x(i := (y i))) PiM {i} M) PiM J M)"
    unfolding merge_singleton[OF assms(2)]
    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"])
     (metis PiE_restrict assms(2) restrict_upd space_PiM)
  also have "... = ?R"
    using assms(1,4) by (intro Bochner_Integration.integral_cong product_integral_singleton) auto
  finally show ?thesis by simp
qed

lemma merge_empty[simp]:
  "merge {} I (y,x) = restrict x I"
  "merge I {} (y,x) = restrict y I"
  unfolding merge_def restrict_def by auto

lemma merge_cong:
  assumes "restrict x1 I = restrict x2 I"
  assumes "restrict y1 J = restrict y2 J"
  shows "merge I J (x1,y1) = merge I J (x2,y2)"
  using assms unfolding merge_def restrict_def
  by (intro ext) (smt (verit, best) case_prod_conv)

lemma restrict_merge:
  "restrict (merge I J x) K = merge (I  K) (J  K) x"
  unfolding restrict_def merge_def by (intro ext) (auto simp:case_prod_beta)

lemma map_prod_measurable:
  assumes "f  M M M'"
  assumes "g  N M N'"
  shows "map_prod f g  M M N M M' M N'"
  using assms by (subst measurable_pair_iff) simp

lemma mc_diarmid_inequality_aux:
  fixes f :: "(nat  'a)  real"
  fixes n :: nat
  assumes "i. i < n  prob_space (M i)"
  assumes "i x y. i<n  {x,y}  space (PiM {..<n} M)  (j{..<n}-{i}. x j=y j)  ¦f x-f y¦c i"
  assumes f_meas: "f  borel_measurable (PiM {..<n} M)" and ε_gt_0: "ε >0"
  shows "𝒫(ω in PiM {..<n} M. f ω - (ξ. f ξ PiM {..<n} M)  ε)  exp (-(2*ε^2)/(i<n. (c i)^2))"
    (is "?L  ?R")
proof -
  define h where "h k = (λξ. (ω. f (merge {..<k} {k..<n} (ξ, ω)) PiM {k..<n} M))" for k

  define t :: real where "t = 4 * ε / (i<n. (c i)^2)"

  define V where "V i ξ = h (Suc i) ξ - h i ξ" for i ξ

  obtain x0 where x0:"x0  space (PiM {..<n} M)"
    using prob_space.not_empty[OF prob_space_PiM] assms(1) by fastforce

  have delta: "¦f x - f y¦  c i" if "i < n"
    "x  PiE {..<n} (λi. space (M i))" "y  PiE {..<n} (λi. space (M i))"
    "restrict x ({..<n}-{i}) = restrict y ({..<n}-{i})"
  for x y i
  proof (rule assms(2)[OF that(1)], goal_cases)
    case 1
    then show ?case using that(2,3) unfolding space_PiM by auto
  next
    case 2
    then show ?case using that(4) by (intro ballI) (metis restrict_apply')
  qed

  have c_ge_0: "c j  0" if "j < n" for j
  proof -
    have "0  ¦f x0 - f x0¦" by simp
    also have "...  c j" using x0 unfolding space_PiM by (intro delta that) auto
    finally show ?thesis by simp
  qed
  hence sum_c_ge_0: "(i<n. (c i)^2)  0" by (meson sum_nonneg zero_le_power2)

  hence t_ge_0: "t  0" using ε_gt_0 unfolding t_def by simp

  note borel_rules =
    borel_measurable_sum measurable_compose[OF _ borel_measurable_exp]
    borel_measurable_times

  note int_rules =
    prob_space_PiM assms(1) borel_rules
    prob_space.integrable_bounded bounded_intros
  have h_n: "h n ξ = f ξ" if "ξ  space (PiM {..<n} M)" for ξ
  proof -
    have "h n ξ = (ω. f (λi{..<n}. ξ i) PiM {} M)"
      unfolding h_def using leD
      by (intro Bochner_Integration.integral_cong PiM_cong arg_cong[where f="f"] restrict_cong)
       auto
    also have "... = f (restrict ξ {..<n})"
      unfolding PiM_empty by simp
    also have "... = f ξ"
      using that unfolding space_PiM PiE_def
      by (simp add: extensional_restrict)
    finally show ?thesis
      by simp
  qed

  have h_0: "h 0 ξ = (ω. f ω PiM {..<n} M)" for ξ
    unfolding h_def by (intro Bochner_Integration.integral_cong PiM_cong refl)
     (simp_all add:space_PiM atLeast0LessThan)

  have h_cong: "h j ω = h j ξ" if "restrict ω {..<j} = restrict ξ {..<j}" for j ω ξ
    using that unfolding h_def
    by (intro Bochner_Integration.integral_cong refl arg_cong[where f="f"] merge_cong) auto

  have h_meas: "h i  borel_measurable (PiM I M)" if "i  n" "{..<i}  I" for i I
  proof -
    have 0: "{..<n} = {..<i}  {i..<n}"
      using that(1) by auto

    have 1: "merge {..<i} {i..<n} = merge {..<i} {i..<n}  map_prod (λx. restrict x {..<i}) id"
      unfolding merge_def map_prod_def restrict_def comp_def
      by (intro ext) (auto simp:case_prod_beta')

    have "merge {..<i} {i..<n}  PiM I M M PiM {i..<n} M M PiM {..<n} M"
      unfolding 0 by (subst 1) (intro measurable_comp[OF _ measurable_merge] map_prod_measurable
          measurable_ident measurable_restrict_subset that(2))
    hence "(λx. f (merge {..<i} {i..<n} x))  borel_measurable (PiM I M M PiM {i..<n} M)"
      by (intro measurable_compose[OF _ f_meas])
    thus ?thesis
      unfolding h_def by (intro sigma_finite_measure.borel_measurable_lebesgue_integral
            prob_space_imp_sigma_finite prob_space_PiM assms(1)) (auto simp:case_prod_beta')
  qed

  have merge_space_aux:"merge {..<j} {j..<n} u  (ΠE i{..<n}. space (M i))"
    if "j  n" "fst u  Pi {..<j} (λi. space (M i))" "snd u  Pi {j..<n} (λi. space (M i))"
    for u  j
  proof -
    have "merge {..<j} {j..<n} (fst u, snd u)  (PiE ({..<j}  {j..<n}) (λi. space (M i)))"
      using that by (intro iffD2[OF PiE_cancel_merge]) auto
    also have "... =  (ΠE i{..<n}. space (M i))"
      using that by (intro arg_cong2[where f="PiE"] refl) auto
    finally show ?thesis by simp
  qed

  have merge_space:"merge {..<j} {j..<n} (u, v)  (ΠE i{..<n}. space (M i))"
    if "j  n" "u  PiE {..<j} (λi. space (M i))" "v  PiE {j..<n} (λi. space (M i))"
    for u v j
    using that by (intro merge_space_aux) (simp_all add:PiE_def)

  have delta': "¦f x - f y¦  (i<n. c i)"
    if "x  PiE {..<n} (λi. space (M i))" "y  PiE {..<n} (λi. space (M i))" for x y
  proof -
    define m where "m i = merge {..<i} {i..<n} (x,y)" for i

    have 0: "z  Pi I (λi. space (M i))" if "z  PiE {..<n} (λi. space (M i))"
       "I  {..<n}" for z I
      using that unfolding PiE_def by auto

    have 3: "{..<Suc i}  ({..<n} - {i}) = {..<i}"
      "{Suc i..<n}  ({..<n} - {i}) = {Suc i..<n}"
      "{..<i}  ({..<n} - {i}) = {..<i}"
      "{i..<n}  ({..<n} - {i}) = {Suc i..<n}"
      if "i < n" for i
      using that by auto

    have "¦f x - f y¦ = ¦f (m n) - f(m 0)¦"
      using that unfolding m_def by (simp add:atLeast0LessThan)
    also have "... = ¦i < n. f (m (Suc i)) - f (m i)¦"
      by (subst sum_lessThan_telescope) simp
    also have "...  (i < n. ¦f (m (Suc i)) - f (m i)¦)"
      by simp
    also have "...  (i < n. c i)"
      using that unfolding m_def by (intro delta sum_mono merge_space_aux 0 subsetI)
       (simp_all add:restrict_merge 3)
    finally show ?thesis
      by simp
  qed

  have "norm (f x)  norm (f x0) + sum c {..<n}" if "x  space (PiM {..<n} M)" for x
  proof -
    have "¦f x - f x0¦  sum c {..<n}"
      using x0 that unfolding space_PiM by (intro delta') auto
    thus ?thesis
      by simp
  qed
  hence f_bounded: "bounded (f ` space (PiM {..<n} M))"
    by (intro boundedI[where B="norm (f x0) + (i<n. c i)"]) auto

  have f_merge_bounded:
    "bounded ((λω. (f (merge {..<j} {j..<n} (u, ω)))) ` space (PiM {j..<n} M))"
    if "j  n" "u  PiE {..<j} (λi. space (M i))" for u j
  proof -
    have "(λω. merge {..<j} {j..<n} (u, ω)) ` space (PiM {j..<n} M)  space (PiM {..<n} M)"
      using that  unfolding space_PiM
      by (intro image_subsetI merge_space) auto
    thus ?thesis
      by (subst image_image[of "f",symmetric]) (intro bounded_subset[OF f_bounded] image_mono)
  qed

  have f_merge_meas_aux:
    "(λω. f (merge {..<j} {j..<n} (u, ω)))  borel_measurable (PiM {j..<n} M)"
    if "j  n" "u  Pi {..<j} (λi. space (M i))" for j u
  proof -

    have 0: "{..<n} = {..<j }  {j ..<n}"
      using that(1) by auto

    have 1: "merge {..<j} {j..<n} (u,ω) = merge {..<j} {j..<n} (restrict u {..<j},ω)" for ω
      by (intro merge_cong) auto

    have "(λω. merge {..<j} {j..<n} (u, ω))  PiM {j..<n} M M PiM {..<n} M"
      using that unfolding 0 1
      by (intro measurable_compose[OF _ measurable_merge] measurable_Pair1')
       (simp add:space_PiM)
    thus ?thesis
      by (intro measurable_compose[OF _ f_meas])
  qed

  have f_merge_meas: "(λω. f (merge {..<j} {j..<n} (u, ω)))  borel_measurable (PiM {j..<n} M)"
    if "j  n" "u  PiE {..<j} (λi. space (M i))" for j u
    using that unfolding PiE_def by (intro f_merge_meas_aux) auto

  have h_bounded: "bounded (h i ` space (PiM I M))"
    if h_bounded_assms: "i  n" "{..<i}  I" for i I
  proof -
    have "merge {..<i} {i..<n} x  space (PiM {..<n} M)"
      if "x  (ΠE iI. space (M i)) × (ΠE i{i..<n}. space (M i))" for x
      using that h_bounded_assms unfolding space_PiM by (intro merge_space_aux)
        (auto simp: PiE_def mem_Times_iff)
    hence "bounded ((λx. f (merge {..<i} {i..<n} x)) `
      ((ΠE iI. space (M i)) × (ΠE i{i..<n}. space (M i))))"
      by (subst image_image[of "f",symmetric])
       (intro bounded_subset[OF f_bounded] image_mono image_subsetI)
    thus ?thesis
      using that unfolding h_def
      by (intro prob_space.finite_measure finite_measure.bounded_int int_rules)
        (auto simp:space_PiM PiE_def)
  qed

  have V_bounded: "bounded (V i ` space (PiM I M))"
    if "i < n" "{..<i+1}  I" for i I
    using that unfolding V_def by (intro bounded_intros h_bounded) auto

  have V_upd_bounded: "bounded ((λx. V j (ξ(j := x))) ` space (M j))"
    if V_upd_bounded_assms: "ξ  space (PiM {..<j} M)" "j < n" for j ξ
  proof -
    have "ξ(j := v)  space (PiM {..<j + 1} M)" if "v  space (M j)" for v
      using V_upd_bounded_assms that unfolding space_PiM PiE_def extensional_def Pi_def by auto
    thus ?thesis
        using that unfolding image_image[of "V j" "(λx. (ξ(j := x)))",symmetric]
        by (intro bounded_subset[OF V_bounded[of "j" "{..<j+1}"]] that image_mono) auto
  qed

  have h_step: "h j ω = τ. h (j+1) (ω (j := τ))  M j" (is "?L1 = ?R1")
    if "ω  space (PiM {..<j} M)" "j < n" for j ω
  proof -
    have 0: "(λx. f (merge {..<j} {j..<n} (ω, x)))  borel_measurable (PiM {j..<n} M)"
      using that unfolding space_PiM by (intro f_merge_meas) auto

    have 1: "insert j {Suc j..<n} = {j..<n}"
      using that by auto

    have 2: "bounded ((λx.(f (merge {..<j} {j..<n} (ω, x)))) ` space (PiM {j..<n} M))"
      using that by (intro f_merge_bounded) (simp_all add: space_PiM)

    have "?L1 = (ξ. f (merge {..<j} {j..<n} (ω, ξ)) PiM (insert j {j+1..<n}) M)"
      unfolding h_def using that by (intro Bochner_Integration.integral_cong refl PiM_cong) auto
    also have "...=(τ.(ξ. f (merge {..<j} {j..<n} (ω, (ξ(j := τ)))) PiM {j+1..<n} M)M j)"
      using that(1,2) 0 1 2 by (intro product_integral_insert prob_space_imp_sigma_finite assms(1)
          int_rules f_merge_meas) (simp_all)
    also have "... = ?R1"
      using that(2) unfolding h_def
      by (intro Bochner_Integration.integral_cong arg_cong[where f="f"] ext) (auto simp:merge_def)
    finally show ?thesis
      by simp
  qed

  have V_meas: "V i  borel_measurable (PiM I M)" if "i < n" "{..<i+1}  I" for i I
    unfolding V_def using that by (intro borel_measurable_diff h_meas) auto

  have V_upd_meas: "(λx. V j (ξ(j := x)))  borel_measurable (M j)"
    if "j < n" "ξ  space (PiM {..<j} M)" for j ξ
    using that by (intro measurable_compose[OF _ V_meas[where I="insert j {..<j}"]]
          measurable_component_update) auto

  have V_cong:
    "V j ω = V j ξ" if "restrict ω {..<(j+1)} = restrict ξ {..<(j+1)}" for j ω ξ
    using that restrict_subset_eq[OF _ that] unfolding V_def
    by (intro arg_cong2[where f="(-)"] h_cong) simp_all

  have exp_V: "(ω. V j (ξ(j := ω)) M j) = 0" (is "?L1 = 0")
    if "j < n" "ξ  space (PiM {..<j} M)" for j ξ
  proof -

    have "fun_upd ξ j ` space (M j)  space (PiM (insert j {..<j}) M)"
      using that unfolding space_PiM by (intro image_subsetI PiE_fun_upd) auto
    hence 0:"bounded ((λx. h (Suc j) (ξ(j := x))) ` space (M j))"
      unfolding image_image[of "h (Suc j)" "λx. ξ(j := x)",symmetric] using that
      by (intro bounded_subset[OF h_bounded[where i="j+1" and I="{..<j+1}"]] image_mono)
        (auto simp:lessThan_Suc)

    have 1:"(λx. h (Suc j) (ξ(j := x)))  borel_measurable (M j)"
      using h_meas that by (intro measurable_compose[OF _ h_meas[where I="insert j {..<j}"]]
          measurable_component_update) auto

    have "?L1 =(ω. h (Suc j) (ξ(j := ω)) - h j ξ M j)"
      unfolding V_def
      by (intro Bochner_Integration.integral_cong arg_cong2[where f="(-)"] refl h_cong) auto
    also have "... = (ω. h (Suc j) (ξ(j := ω)) M j) - (ω. h j ξ M j)"
      using that by (intro Bochner_Integration.integral_diff int_rules 0 1) auto
    also have "... = 0"
      using that(1) assms(1) prob_space.prob_space unfolding h_step[OF that(2,1)] by auto
    finally show ?thesis
      by simp
  qed

  have var_V: "¦V j x - V j y¦  c j" (is "?L1  ?R1")
    if var_V_assms: "j < n" "{x,y}  space (PiM {..<j+1} M)"
       "restrict x {..<j} = restrict y {..<j}"  for x y j
  proof -
    have x_ran: "x  PiE {..<j+1} (λi. space (M i))" and y_ran: "y  PiE {..<j+1} (λi. space (M i))"
      using that(2) by (simp_all add:space_PiM)

    have 0: "j+1  n"
      using that by simp

    have "?L1 = ¦h (Suc j) x - h j y - (h (Suc j) y - h j y)¦"
      unfolding V_def by (intro arg_cong[where f="abs"] arg_cong2[where f="(-)"] refl h_cong that)
    also have "... = ¦h (j+1) x - h (j+1) y¦"
      by simp
    also have "... =
      ¦(ω. f(merge {..<j+1} {j+1..<n} (x,ω))-f(merge {..<j+1} {j+1..<n} (y,ω)) PiM {j+1..<n} M)¦"
      using that unfolding h_def by (intro arg_cong[where f="abs"] f_merge_meas[OF 0] x_ran
          Bochner_Integration.integral_diff[symmetric] int_rules f_merge_bounded[OF 0] y_ran) auto
    also have "... 
      (ω. ¦f(merge {..<j+1} {j+1..<n} (x,ω))-f(merge {..<j+1} {j+1..<n} (y,ω))¦ PiM {j+1..<n} M)"
      by (intro integral_abs_bound)
    also have "...  (ω. c j PiM {j+1..<n} M)"
    proof (intro Bochner_Integration.integral_mono' delta int_rules c_ge_0 ballI merge_space 0)
      fix ω assume "ω  space (PiM {j + 1..<n} M)"
      have "{..<j + 1}  ({..<n} - {j}) = {..<j}"
        using that by auto
      thus "restrict (merge {..<j+1} {j+1..<n} (x, ω)) ({..<n}-{j}) =
            restrict (merge {..<j+1} {j+1..<n} (y, ω)) ({..<n}-{j})"
        using that(1,3) less_antisym unfolding restrict_merge by (intro merge_cong refl) auto
    qed (simp_all add: space_PiM that(1) x_ran[simplified] y_ran[simplified])
    also have "... = c j"
      by (auto intro!:prob_space.prob_space prob_space_PiM assms(1))
    finally show ?thesis by simp
  qed

  have "f ξ - (ω. f ω (PiM {..<n} M)) = (i < n. V i ξ)" if "ξ  space (PiM {..<n} M)" for ξ
    using that unfolding V_def by (subst sum_lessThan_telescope) (simp add: h_0 h_n)
  hence "?L = 𝒫(ξ in PiM {..<n} M. (i < n. V i ξ)  ε)"
    by (intro arg_cong2[where f="measure"] refl Collect_restr_cong arg_cong2[where f="(≤)"]) auto
  also have "...  𝒫(ξ in PiM {..<n} M. exp( t * (i < n. V i ξ) )  exp (t * ε))"
  proof (intro finite_measure.finite_measure_mono subsetI prob_space.finite_measure int_rules)
    show "{ξ  space (PiM {..<n} M). exp (t * ε)  exp (t * (i<n. V i ξ))}  sets (PiM {..<n} M)"
      using V_meas by measurable
  qed  (auto intro!:mult_left_mono[OF _ t_ge_0])
  also have "...  (ξ. exp(t*(i < n. V i ξ)) PiM {..<n} M)/ exp (t*ε)"
    by (intro integral_Markov_inequality_measure[where A="{}"] int_rules V_bounded V_meas) auto
  also have "... = exp(t^2 * (i{n..<n}. c i^2)/8-t*ε)*(ξ. exp(t*(i < n. V i ξ)) PiM {..<n} M)"
    by (simp add:exp_minus inverse_eq_divide)
  also have "...  exp(t^2 * (i{0..<n}. c i^2)/8-t*ε)*(ξ. exp(t*(i < 0. V i ξ)) PiM {..<0} M)"
  proof (rule ineq_chain)
    fix j assume a:"j < n"
    let ?L1 = "exp (t2*(i=j+1..<n. (c i)2)/8-t*ε)"
    let ?L2 = "?L1 * (ξ. exp (t * (i<j+1. V i ξ)) PiM {..<j+1} M)"

    note V_upd_meas = V_upd_meas[OF a]

    have "?L2 = ?L1 * (ξ. exp (t * (i<j. V i ξ)) * exp(t * V j ξ) PiM (insert j {..<j}) M)"
      by (simp add:algebra_simps exp_add lessThan_Suc)
    also have "... = ?L1 *
      (ξ. (ω. exp (t * (i<j. V i (ξ(j := ω)))) * exp(t * V j (ξ(j := ω))) M j) PiM {..<j} M)"
      using a by (intro product_integral_insert_rev arg_cong2[where f="(*)"] int_rules
          prob_space_imp_sigma_finite V_bounded V_meas) auto
    also have "... =?L1*(ξ.(ω. exp (t*(i<j. V i ξ))*exp(t*V j (ξ(j := ω))) M j) PiM {..<j} M)"
      by (intro arg_cong2[where f="(*)"] Bochner_Integration.integral_cong
          arg_cong[where f="exp"] sum.cong V_cong restrict_fupd) auto
    also have "... =?L1*(ξ. exp (t*(i<j. V i ξ))*(ω. exp(t*V j (ξ(j := ω))) M j) PiM {..<j} M)"
      using a by (intro arg_cong2[where f="(*)"] Bochner_Integration.integral_cong refl
          Bochner_Integration.integral_mult_right V_upd_meas V_upd_bounded int_rules) auto
    also have "...  ?L1 * ξ. exp (t*(i<j. V i ξ))* exp (t^2 * c j^2/8) PiM {..<j} M"
    proof (intro mult_left_mono integral_mono')
      fix ξ assume c:"ξ  space (PiM {..<j} M)"
      hence b:"ξ  PiE {..<j} (λi. space (M i))"
        unfolding space_PiM by simp
      moreover have "ξ(j := v)  PiE {..<j+1} (λi. space (M i))" if "v  space (M j)" for v
        using b that unfolding PiE_def extensional_def Pi_def by auto
      ultimately show "LINT ω|M j. exp (t * V j (ξ(j := ω)))  exp (t2 * (c j)2 / 8)"
        using V_upd_meas[OF c]
        by (intro prob_space.Hoeffdings_lemma_bochner_3 exp_V var_V a int_rules)
          (auto simp: space_PiM)
    next
      show "integrable (PiM {..<j} M) (λx. exp (t * (i<j. V i x)) * exp (t2 * (c j)2 / 8))"
        using a by (intro int_rules V_bounded V_meas) auto
    qed auto
    also have "... = ?L1 * ((ξ. exp (t*(i<j. V i ξ)) PiM {..<j} M) * exp (t^2 * c j^2/8))"
    proof (subst Bochner_Integration.integral_mult_left)
      show "integrable (PiM {..<j} M) (λξ. exp (t * (i<j. V i ξ)))"
        using a by (intro int_rules V_bounded V_meas) auto
    qed auto
    also have "... =
      exp (t2*(iinsert j {j+1..<n}. (c i)2)/8-t*ε) * (ξ. exp (t * (i<j. V i ξ))PiM {..<j} M)"
      by (simp_all add:exp_add[symmetric] field_simps)
    also have "...=exp (t2*(i=j..<n. (c i)2)/8-t*ε) * (ξ. exp (t * (i<j. V i ξ))PiM {..<j} M)"
      using a by (intro arg_cong2[where f="(*)"] arg_cong[where f="exp"] refl arg_cong2
          [where f="(-)"] arg_cong2[where f="(/)"] sum.cong) auto
    finally show "?L2exp(t2*(i=j..<n. (c i)2)/8-t*ε)*(ξ. exp (t*(i<j. V i ξ))PiM {..<j} M)"
      by simp
  qed
  also have "... = exp(t^2 * (i<n. c i^2)/8-t*ε)" by (simp add:PiM_empty atLeast0LessThan)
  also have "... = exp(t * ((t * (i<n. c i^2)/8)-ε))" by (simp add:algebra_simps power2_eq_square)
  also have "... = exp(t * (-ε/2))" using sum_c_ge_0 by (auto simp add:divide_simps t_def)
  also have "... = ?R" unfolding t_def by (simp add:field_simps power2_eq_square)
  finally show ?thesis by simp
qed

theorem mc_diarmid_inequality_distr:
  fixes f :: "('i  'a)  real"
  assumes "finite I"
  assumes "i. i  I  prob_space (M i)"
  assumes "i x y. i  I  {x,y}  space (PiM I M)  (jI-{i}. x j=y j)  ¦f x-f y¦c i"
  assumes f_meas: "f  borel_measurable (PiM I M)" and ε_gt_0: "ε > 0"
  shows "𝒫(ω in PiM I M. f ω - (ξ. f ξ PiM I M)  ε)  exp (-(2*ε^2)/(iI. (c i)^2))"
    (is "?L  ?R")
proof -
  define n where "n = card I"
  let ?q = "from_nat_into I"
  let ?r = "to_nat_on I"
  let ?f = "(λξ. f (λiI. ξ (?r i)))"

  have q: "bij_betw ?q {..<n} I" unfolding n_def by (intro bij_betw_from_nat_into_finite assms(1))
  have r: "bij_betw ?r I {..<n}" unfolding n_def by (intro to_nat_on_finite assms(1))

  have [simp]: "?q (?r x) = x" if "x  I" for x
    by (intro from_nat_into_to_nat_on that countable_finite assms(1))

  have [simp]: "?r (?q x) = x" if "x < n" for x
    using bij_betw_imp_surj_on[OF r] that by (intro to_nat_on_from_nat_into) auto

  have a: "i. i  {..<n}  prob_space ((M  ?q) i)"
    unfolding comp_def by (intro assms(2) bij_betw_apply[OF q])

  have b:"PiM I M = PiM I (λi. (M  ?q) (?r i))" by (intro PiM_cong) (simp_all add:comp_def)
  also have "... = distr (PiM {..<n} (M  ?q)) (PiM I (λi. (M  ?q) (?r i))) (λω. λnI. ω (?r n))"
    using r unfolding bij_betw_def by (intro distr_PiM_reindex[symmetric] a) auto
  finally have c: "PiM I M = distr (PiM{..<n}(M?q)) (PiM I (λi.(M?q)(?r i))) (λω. λnI. ω (?r n))"
    by simp

  have d: "(λnI. x (?r n))  space (PiM I M)" if 4:"x  space (PiM {..<n} (M  ?q))" for x
  proof -
    have "x (?r i)  space (M i)" if "i  I" for i
    proof -
      have "?r i  {..<n}" using bij_betw_apply[OF r] that by simp
      hence "x (?r i)  space ((M  ?q) (?r i))" using that 4 PiE_mem unfolding space_PiM by blast
      thus ?thesis using that unfolding comp_def by simp
    qed
    thus ?thesis unfolding space_PiM PiE_def by auto
  qed

  have "?L = 𝒫(ω in PiM {..<n} (M  ?q). ?f ω - (ξ. f ξ PiM I M)  ε)"
  proof (subst c, subst measure_distr, goal_cases)
    case 1 thus ?case
      by (intro measurable_restrict measurable_component_singleton bij_betw_apply[OF r])
  next
    case 2 thus ?case unfolding b[symmetric] by (intro measurable_sets_Collect[OF f_meas]) auto
  next
    case 3 thus ?case using d by (intro arg_cong2[where f="measure"] refl) (auto simp:vimage_def)
  qed
  also have "... = 𝒫(ω in PiM {..<n} (M  ?q). ?f ω - (ξ. ?f ξ PiM {..<n} (M  ?q))  ε)"
  proof (subst c, subst integral_distr, goal_cases)
    case (1 ω) thus ?case
      by (intro measurable_restrict measurable_component_singleton bij_betw_apply[OF r])
  next
    case (2 ω) thus ?case unfolding b[symmetric] by (rule f_meas)
  next
    case 3 thus ?case by simp
  qed
  also have "...  exp (-(2*ε^2)/(i<n. (c (?q i))^2))"
  proof (intro mc_diarmid_inequality_aux ε_gt_0, goal_cases)
    case (1 i) thus ?case by (intro a) auto
  next
    case (2 i x y)
    have "x (?r j) = y (?r j)" if "j  I - {?q i}" for j
    proof -
      have "?r j  {..<n} - {i}" using that bij_betw_apply[OF r] by auto
      thus ?thesis using 2 by simp
    qed
    hence "jI - {?q i}. (λiI. x (?r i)) j = (λiI. y (?r i)) j" by auto
    thus ?case using 2 d by (intro assms(3) bij_betw_apply[OF q]) auto
  next
    case 3
    have "(λx. x (?r i))  PiM {..<n} (M  ?q) M M i" if "i  I" for i
    proof -
      have 0:"M i = (M  ?q) (?r i)" using that by (simp add: comp_def)
      show ?thesis unfolding 0 by (intro measurable_component_singleton bij_betw_apply[OF r] that)
    qed
    thus ?case by (intro measurable_compose[OF _ f_meas] measurable_restrict)
  qed
  also have "... = ?R" by (subst sum.reindex_bij_betw[OF q]) simp
  finally show ?thesis by simp
qed

lemma (in prob_space) mc_diarmid_inequality_classic:
  fixes f :: "('i  'a)  real"
  assumes "finite I"
  assumes "indep_vars N X I"
  assumes "i x y. i  I  {x,y}  space (PiM I N)  (jI-{i}. x j=y j)  ¦f x-f y¦c i"
  assumes f_meas: "f  borel_measurable (PiM I N)" and ε_gt_0: "ε > 0"
  shows "𝒫(ω in M. f (λiI. X i ω) - (ξ. f (λiI. X i ξ) M)  ε)  exp (-(2*ε^2)/(iI. (c i)^2))"
    (is "?L  ?R")
proof -
  note indep_imp = iffD1[OF indep_vars_iff_distr_eq_PiM'']
  let ?O = "λi. distr M (N i) (X i)"
  have a:"distr M (PiM I N) (λx. λiI. X i x) = PiM I ?O"
    using assms(2) unfolding indep_vars_def by (intro indep_imp[OF _ assms(2)]) auto

  have b: "space (PiM I ?O) = space (PiM I N)"
    by (metis (no_types, lifting) a space_distr)

  have "(λiI. X i ω)  space (PiM I N)" if "ω  space M" for ω
    using assms(2) that unfolding indep_vars_def measurable_def space_PiM by auto

  hence "?L = 𝒫(ω in M. (λiI. X i ω) space (PiM I N) f (λiI. X i ω)-(ξ. f (λiI. X i ξ) M)ε)"
    by (intro arg_cong2[where f="measure"] Collect_restr_cong refl) auto
  also have "... = 𝒫(ω in distr M (PiM I N) (λx. λiI. X i x). f ω - (ξ. f (λiI. X i ξ) M)  ε)"
  proof (subst measure_distr, goal_cases)
    case 1 thus ?case using assms(2) unfolding indep_vars_def by (intro measurable_restrict) auto
  next
    case 2 thus ?case unfolding space_distr by (intro measurable_sets_Collect[OF f_meas]) auto
  next
    case 3 thus ?case by (simp_all add:Int_def conj_commute)
  qed
  also have "... = 𝒫(ω in PiM I ?O. f ω - (ξ. f (λiI. X i ξ) M)  ε)"
    unfolding a by simp
  also have "... = 𝒫(ω in PiM I ?O. f ω - (ξ. f ξ  distr M (PiM I N) (λx. λiI. X i x))  ε)"
  proof (subst integral_distr[OF _ f_meas], goal_cases)
    case (1 ω) thus ?case using assms(2) unfolding indep_vars_def by (intro measurable_restrict)auto
  next
    case 2 thus ?case by simp
  qed
  also have "... = 𝒫(ω in PiM I ?O. f ω - (ξ. f ξ  PiM I ?O)  ε)" unfolding a by simp
  also have "...  ?R"
    using f_meas assms(2) b unfolding indep_vars_def
    by (intro mc_diarmid_inequality_distr prob_space_distr assms(1) ε_gt_0 assms(3)) auto
  finally show ?thesis by simp
qed

end