Theory Weighted_Arithmetic_Geometric_Mean

section ‹The Weighted Arithmetic--Geometric Mean Inequality›
theory Weighted_Arithmetic_Geometric_Mean
  imports Complex_Main
begin

subsection ‹Auxiliary Facts›

lemma root_powr_inverse': "0 < n ⟹ 0 ≤ x ⟹ root n x = x powr (1/n)"
  by (cases "x = 0") (auto simp: root_powr_inverse)

lemma powr_sum_distrib_real_right:
  assumes "a ≠ 0"
  shows   "(∏x∈X. a powr e x :: real) = a powr (∑x∈X. e x)"
  using assms
  by (induction X rule: infinite_finite_induct) (auto simp: powr_add)

lemma powr_sum_distrib_real_left:
  assumes "⋀x. x ∈ X ⟹ a x ≥ 0"
  shows   "(∏x∈X. a x powr e :: real) = (∏x∈X. a x) powr e"
  using assms
  by (induction X rule: infinite_finite_induct)
     (auto simp: powr_mult prod_nonneg)

lemma prod_ge_pointwise_le_imp_pointwise_eq:
  fixes f :: "'a ⇒ real"
  assumes "finite X"
  assumes ge: "prod f X ≥ prod g X"
  assumes nonneg: "⋀x. x ∈ X ⟹ f x ≥ 0"
  assumes pos: "⋀x. x ∈ X ⟹ g x > 0"
  assumes le: "⋀x. x ∈ X ⟹ f x ≤ g x" and x: "x ∈ X"
  shows   "f x = g x"
proof (rule ccontr)
  assume "f x ≠ g x"
  with le[of x] and x have "f x < g x"
    by auto
  hence "prod f X < prod g X"
    using x and le and nonneg and pos and ‹finite X› 
    by (intro prod_mono_strict) auto
  with ge show False
    by simp
qed

lemma powr_right_real_eq_iff:
  assumes "a ≥ (0 :: real)"
  shows   "a powr x = a powr y ⟷ a = 0 ∨ a = 1 ∨ x = y"
  using assms by (auto simp: powr_def)

lemma powr_left_real_eq_iff:
  assumes "a ≥ (0 :: real)" "b ≥ 0" "x ≠ 0"
  shows   "a powr x = b powr x ⟷ a = b"
  using assms by (auto simp: powr_def)

lemma exp_real_eq_one_plus_iff:
  fixes x :: real
  shows "exp x = 1 + x ⟷ x = 0"
proof (cases "x = 0")
  case False
  define f :: "real ⇒ real" where "f = (λx. exp x - 1 - x)"
  have deriv: "(f has_field_derivative (exp x - 1)) (at x)" for x
    by (auto simp: f_def intro!: derivative_eq_intros)

  have "∃z. z>min x 0 ∧ z < max x 0 ∧ f (max x 0) - f (min x 0) = 
            (max x 0 - min x 0) * (exp z - 1)"
    using MVT2[of "min x 0" "max x 0" f "λx. exp x - 1"] deriv False
    by (auto simp: min_def max_def)
  then obtain z where "z ∈ {min x 0<..<max x 0}"
     "f (max x 0) - f (min x 0) = (max x 0 - min x 0) * (exp z - 1)"
    by (auto simp: f_def)
  thus ?thesis using False
    by (cases x "0 :: real" rule: linorder_cases) (auto simp: f_def)
qed auto


subsection ‹The Inequality›

text ‹
  We first prove the equality under the assumption that all the $a_i$ and $w_i$ are positive.
›
lemma weighted_arithmetic_geometric_mean_pos:
  fixes a w :: "'a ⇒ real"
  assumes "finite X"
  assumes pos1: "⋀x. x ∈ X ⟹ a x > 0"
  assumes pos2: "⋀x. x ∈ X ⟹ w x > 0"
  assumes sum_weights: "(∑x∈X. w x) = 1"
  shows   "(∏x∈X. a x powr w x) ≤ (∑x∈X. w x * a x)"
proof -
  note nonneg1 = less_imp_le[OF pos1]
  note nonneg2 = less_imp_le[OF pos2]
  define A where "A = (∑x∈X. w x * a x)"
  define r where "r = (λx. a x / A - 1)"
  from sum_weights have "X ≠ {}" by auto
  hence "A ≠ 0"
    unfolding A_def using nonneg1 nonneg2 pos1 pos2 ‹finite X›
    by (subst sum_nonneg_eq_0_iff) force+
  moreover from nonneg1 nonneg2 have "A ≥ 0"
    by (auto simp: A_def intro!: sum_nonneg)
  ultimately have "A > 0" by simp

  have "(∏x∈X. (1 + r x) powr w x) = (∏x∈X. (a x / A) powr w x)"
    by (simp add: r_def)
  also have "… = (∏x∈X. a x powr w x) / (∏x∈X. A powr w x)"
    unfolding prod_dividef [symmetric]
    using assms pos2 ‹A > 0› by (intro prod.cong powr_divide) (auto intro: less_imp_le)
  also have "(∏x∈X. A powr w x) = exp ((∑x∈X. w x) * ln A)"
    using ‹A > 0› and ‹finite X› by (simp add: powr_def exp_sum sum_distrib_right)
  also have "(∑x∈X. w x) = 1" by fact
  also have "exp (1 * ln A) = A"
    using ‹A > 0› by simp
  finally have lhs: "(∏x∈X. (1 + r x) powr w x) = (∏x∈X. a x powr w x) / A" .

  have "(∏x∈X. exp (w x * r x)) = exp (∑x∈X. w x * r x)"
    using ‹finite X› by (simp add: exp_sum)
  also have "(∑x∈X. w x * r x) = (∑x∈X. a x * w x) / A - 1"
    using ‹A > 0› by (simp add: r_def algebra_simps sum_subtractf sum_divide_distrib sum_weights)
  also have "(∑x∈X. a x * w x) / A = 1"
    using ‹A > 0› by (simp add: A_def mult.commute)
  finally have rhs: "(∏x∈X. exp (w x * r x)) = 1" by simp

  have "(∏x∈X. a x powr w x) / A = (∏x∈X. (1 + r x) powr w x)"
    by (fact lhs [symmetric])
  also have "(∏x∈X. (1 + r x) powr w x) ≤ (∏x∈X. exp (w x * r x))"
  proof (intro prod_mono conjI)
    fix x assume x: "x ∈ X"
    have "1 + r x ≤ exp (r x)"
      by (rule exp_ge_add_one_self)
    hence "(1 + r x) powr w x ≤ exp (r x) powr w x"
      using nonneg1[of x] nonneg2[of x] x ‹A > 0›
      by (intro powr_mono2) (auto simp: r_def field_simps)
    also have "… = exp (w x * r x)"
      by (simp add: powr_def)
    finally show "(1 + r x) powr w x ≤ exp (w x * r x)" .
  qed auto
  also have "(∏x∈X. exp (w x * r x)) = 1" by (fact rhs)
  finally show "(∏x∈X. a x powr w x) ≤ A"
    using ‹A > 0› by (simp add: field_simps)
qed

text ‹
  We can now relax the positivity assumptions to non-negativity: if one of the $a_i$ is
  zero, the theorem becomes trivial (note that $0^0 = 0$ by convention for the real-valued
  power operator \<^term>‹(powr) :: real ⇒ real ⇒ real›).

  Otherwise, we can simply remove all the indices that have weight 0 and apply the
  above auxiliary version of the theorem.
›
theorem weighted_arithmetic_geometric_mean:
  fixes a w :: "'a ⇒ real"
  assumes "finite X"
  assumes nonneg1: "⋀x. x ∈ X ⟹ a x ≥ 0"
  assumes nonneg2: "⋀x. x ∈ X ⟹ w x ≥ 0"
  assumes sum_weights: "(∑x∈X. w x) = 1"
  shows   "(∏x∈X. a x powr w x) ≤ (∑x∈X. w x * a x)"
proof (cases "∃x∈X. a x = 0")
  case True
  hence "(∏x∈X. a x powr w x) = 0"
    using ‹finite X› by simp
  also have "… ≤ (∑x∈X. w x * a x)"
    by (intro sum_nonneg mult_nonneg_nonneg assms)
  finally show ?thesis .
next
  case False
  have "(∑x∈X-{x. w x = 0}. w x) = (∑x∈X. w x)"
    by (intro sum.mono_neutral_left assms) auto
  also have "… = 1" by fact
  finally have sum_weights': "(∑x∈X-{x. w x = 0}. w x) = 1" .

  have "(∏x∈X. a x powr w x) = (∏x∈X-{x. w x = 0}. a x powr w x)"
    using ‹finite X› False by (intro prod.mono_neutral_right) auto
  also have "… ≤ (∑x∈X-{x. w x = 0}. w x * a x)" using assms False
    by (intro weighted_arithmetic_geometric_mean_pos sum_weights')
       (auto simp: order.strict_iff_order)
  also have "… = (∑x∈X. w x * a x)"
    using ‹finite X› by (intro sum.mono_neutral_left) auto
  finally show ?thesis .
qed

text ‹
  We can derive the regular arithmetic/geometric mean inequality from this by simply
  setting all the weights to $\frac{1}{n}$:
›
corollary arithmetic_geometric_mean:
  fixes a :: "'a ⇒ real"
  assumes "finite X"
  defines "n ≡ card X"
  assumes nonneg: "⋀x. x ∈ X ⟹ a x ≥ 0"
  shows   "root n (∏x∈X. a x) ≤ (∑x∈X. a x) / n"
proof (cases "X = {}")
  case False
  with assms have n: "n > 0"
    by auto
  have "(∏x∈X. a x powr (1 / n)) ≤ (∑x∈X. (1 / n) * a x)"
    using n assms by (intro weighted_arithmetic_geometric_mean) auto
  also have "(∏x∈X. a x powr (1 / n)) = (∏x∈X. a x) powr (1 / n)"
    using nonneg by (subst powr_sum_distrib_real_left) auto
  also have "… = root n (∏x∈X. a x)"
    using ‹n > 0› nonneg by (subst root_powr_inverse') (auto simp: prod_nonneg)
  also have "(∑x∈X. (1 / n) * a x) = (∑x∈X. a x) / n"
    by (subst sum_distrib_left [symmetric]) auto
  finally show ?thesis .
qed (auto simp: n_def)


subsection ‹The Equality Case›

text ‹
  Next, we show that weighted arithmetic and geometric mean are equal if and only if all the 
  $a_i$ are equal.

  We first prove the more difficult direction as a lemmas and again first assume positivity
  of all $a_i$ and $w_i$ and will relax this somewhat later.
›
lemma weighted_arithmetic_geometric_mean_eq_iff_pos:
  fixes a w :: "'a ⇒ real"
  assumes "finite X"
  assumes pos1: "⋀x. x ∈ X ⟹ a x > 0"
  assumes pos2: "⋀x. x ∈ X ⟹ w x > 0"
  assumes sum_weights: "(∑x∈X. w x) = 1"
  assumes eq: "(∏x∈X. a x powr w x) = (∑x∈X. w x * a x)"
  shows   "∀x∈X. ∀y∈X. a x = a y"
proof -
  note nonneg1 = less_imp_le[OF pos1]
  note nonneg2 = less_imp_le[OF pos2]
  define A where "A = (∑x∈X. w x * a x)"
  define r where "r = (λx. a x / A - 1)"
  from sum_weights have "X ≠ {}" by auto
  hence "A ≠ 0"
    unfolding A_def using nonneg1 nonneg2 pos1 pos2 ‹finite X›
    by (subst sum_nonneg_eq_0_iff) force+
  moreover from nonneg1 nonneg2 have "A ≥ 0"
    by (auto simp: A_def intro!: sum_nonneg)
  ultimately have "A > 0" by simp

  have r_ge: "r x ≥ -1" if x: "x ∈ X" for x
    using ‹A > 0› pos1[OF x] by (auto simp: r_def field_simps)

  have "(∏x∈X. (1 + r x) powr w x) = (∏x∈X. (a x / A) powr w x)"
    by (simp add: r_def)
  also have "… = (∏x∈X. a x powr w x) / (∏x∈X. A powr w x)"
    unfolding prod_dividef [symmetric]
    using assms pos2 ‹A > 0› by (intro prod.cong powr_divide) (auto intro: less_imp_le)
  also have "(∏x∈X. A powr w x) = exp ((∑x∈X. w x) * ln A)"
    using ‹A > 0› and ‹finite X› by (simp add: powr_def exp_sum sum_distrib_right)
  also have "(∑x∈X. w x) = 1" by fact
  also have "exp (1 * ln A) = A"
    using ‹A > 0› by simp
  finally have lhs: "(∏x∈X. (1 + r x) powr w x) = (∏x∈X. a x powr w x) / A" .

  have "(∏x∈X. exp (w x * r x)) = exp (∑x∈X. w x * r x)"
    using ‹finite X› by (simp add: exp_sum)
  also have "(∑x∈X. w x * r x) = (∑x∈X. a x * w x) / A - 1"
    using ‹A > 0› by (simp add: r_def algebra_simps sum_subtractf sum_divide_distrib sum_weights)
  also have "(∑x∈X. a x * w x) / A = 1"
    using ‹A > 0› by (simp add: A_def mult.commute)
  finally have rhs: "(∏x∈X. exp (w x * r x)) = 1" by simp

  have "a x = A" if x: "x ∈ X" for x
  proof -
    have "(1 + r x) powr w x = exp (w x * r x)"
    proof (rule prod_ge_pointwise_le_imp_pointwise_eq
             [where f = "λx. (1 + r x) powr w x" and g = "λx. exp (w x * r x)"])
      show "(1 + r x) powr w x ≤ exp (w x * r x)" if x: "x ∈ X" for x
      proof -
        have "1 + r x ≤ exp (r x)"
          by (rule exp_ge_add_one_self)
        hence "(1 + r x) powr w x ≤ exp (r x) powr w x"
          using nonneg1[of x] nonneg2[of x] x ‹A > 0›
          by (intro powr_mono2) (auto simp: r_def field_simps)
        also have "… = exp (w x * r x)"
          by (simp add: powr_def)
        finally show "(1 + r x) powr w x ≤ exp (w x * r x)" .
      qed
    next
      show "(∏x∈X. (1 + r x) powr w x) ≥ (∏x∈X. exp (w x * r x))"
      proof -
        have "(∏x∈X. (1 + r x) powr w x) = (∏x∈X. a x powr w x) / A"
          by (fact lhs)
        also have "… = 1"
          using ‹A ≠ 0› by (simp add: eq A_def)
        also have "… = (∏x∈X. exp (w x * r x))"
          by (simp add: rhs)
        finally show ?thesis by simp
      qed
    qed (use x ‹finite X› in auto)

    also have "exp (w x * r x) = exp (r x) powr w x"
      by (simp add: powr_def)
    finally have "1 + r x = exp (r x)"
      using x pos2[of x] r_ge[of x] by (subst (asm) powr_left_real_eq_iff) auto
    hence "r x = 0"
      using exp_real_eq_one_plus_iff[of "r x"] by auto
    hence "a x = A"
      using ‹A > 0› by (simp add: r_def field_simps)
    thus ?thesis
      by (simp add: )
  qed
  thus "∀x∈X. ∀y∈X. a x = a y"
    by auto
qed

text ‹
  We can now show the full theorem and relax the positivity condition on the $a_i$ to
  non-negativity. This is possible because if some $a_i$ is zero and the two means
  coincide, then the product is obviously 0, but the sum can only be 0 if \<^term>‹all›
  the $a_i$ are 0.
›
theorem weighted_arithmetic_geometric_mean_eq_iff:
  fixes a w :: "'a ⇒ real"
  assumes "finite X"
  assumes nonneg1: "⋀x. x ∈ X ⟹ a x ≥ 0"
  assumes pos2:    "⋀x. x ∈ X ⟹ w x > 0"
  assumes sum_weights: "(∑x∈X. w x) = 1"
  shows   "(∏x∈X. a x powr w x) = (∑x∈X. w x * a x) ⟷ X ≠ {} ∧ (∀x∈X. ∀y∈X. a x = a y)"
proof
  assume *: "X ≠ {} ∧ (∀x∈X. ∀y∈X. a x = a y)"
  from * have "X ≠ {}"
    by blast

  from * obtain c where c: "⋀x. x ∈ X ⟹ a x = c" "c ≥ 0"
  proof (cases "X = {}")
    case False
    then obtain x where "x ∈ X" by blast
    thus ?thesis using * that[of "a x"] nonneg1[of x] by metis
  next
    case True
    thus ?thesis
      using that[of 1] by auto
  qed

  have "(∏x∈X. a x powr w x) = (∏x∈X. c powr w x)"
    by (simp add: c)
  also have "… = c"
    using assms c ‹X ≠ {}› by (cases "c = 0") (auto simp: powr_sum_distrib_real_right)
  also have "… = (∑x∈X. w x * a x)"
    using sum_weights by (simp add: c(1) flip: sum_distrib_left sum_distrib_right)
  finally show "(∏x∈X. a x powr w x) = (∑x∈X. w x * a x)" .
next
  assume *: "(∏x∈X. a x powr w x) = (∑x∈X. w x * a x)"
  have "X ≠ {}"
    using * by auto
  moreover have "(∀x∈X. ∀y∈X. a x = a y)"
  proof (cases "∃x∈X. a x = 0")
    case False
    with nonneg1 have pos1: "∀x∈X. a x > 0"
      by force
    thus ?thesis
      using weighted_arithmetic_geometric_mean_eq_iff_pos[of X a w] assms *
      by blast
  next
    case True
    hence "(∏x∈X. a x powr w x) = 0"
      using assms by auto
    with * have "(∑x∈X. w x * a x) = 0"
      by auto
    also have "?this ⟷ (∀x∈X. w x * a x = 0)"
      using assms by (intro sum_nonneg_eq_0_iff mult_nonneg_nonneg) (auto intro: less_imp_le)
    finally have "(∀x∈X. a x = 0)"
      using pos2 by force
    thus ?thesis
      by auto
  qed
  ultimately show "X ≠ {} ∧ (∀x∈X. ∀y∈X. a x = a y)"
    by blast
qed

text ‹
  Again, we derive a version for the unweighted arithmetic/geometric mean.
›
corollary arithmetic_geometric_mean_eq_iff:
  fixes a :: "'a ⇒ real"
  assumes "finite X"
  defines "n ≡ card X"
  assumes nonneg: "⋀x. x ∈ X ⟹ a x ≥ 0"
  shows   "root n (∏x∈X. a x) = (∑x∈X. a x) / n ⟷ (∀x∈X. ∀y∈X. a x = a y)"
proof (cases "X = {}")
  case False
  with assms have "n > 0"
    by auto
  have "(∏x∈X. a x powr (1 / n)) = (∑x∈X. (1 / n) * a x) ⟷
          X ≠ {} ∧ (∀x∈X. ∀y∈X. a x = a y)"
    using assms False by (intro weighted_arithmetic_geometric_mean_eq_iff) auto
  also have "(∏x∈X. a x powr (1 / n)) = (∏x∈X. a x) powr (1 / n)"
    using nonneg by (subst powr_sum_distrib_real_left) auto
  also have "… = root n (∏x∈X. a x)"
    using ‹n > 0› nonneg by (subst root_powr_inverse') (auto simp: prod_nonneg)
  also have "(∑x∈X. (1 / n) * a x) = (∑x∈X. a x) / n"
    by (subst sum_distrib_left [symmetric]) auto
  finally show ?thesis using False by auto
qed (auto simp: n_def)


subsection ‹The Binary Version›

text ‹
  For convenience, we also derive versions for only two numbers:
›
corollary weighted_arithmetic_geometric_mean_binary:
  fixes w1 w2 x1 x2 :: real
  assumes "x1 ≥ 0" "x2 ≥ 0" "w1 ≥ 0" "w2 ≥ 0" "w1 + w2 = 1"
  shows   "x1 powr w1 * x2 powr w2 ≤ w1 * x1 + w2 * x2"
proof -
  let ?a = "λb. if b then x1 else x2"
  let ?w = "λb. if b then w1 else w2"
  from assms have "(∏x∈UNIV. ?a x powr ?w x) ≤ (∑x∈UNIV. ?w x * ?a x)" 
    by (intro weighted_arithmetic_geometric_mean) (auto simp add: UNIV_bool)
  thus ?thesis by (simp add: UNIV_bool add_ac mult_ac)
qed

corollary weighted_arithmetic_geometric_mean_eq_iff_binary:
  fixes w1 w2 x1 x2 :: real
  assumes "x1 ≥ 0" "x2 ≥ 0" "w1 > 0" "w2 > 0" "w1 + w2 = 1"
  shows   "x1 powr w1 * x2 powr w2 = w1 * x1 + w2 * x2 ⟷ x1 = x2"
proof -
  let ?a = "λb. if b then x1 else x2"
  let ?w = "λb. if b then w1 else w2"
  from assms have "(∏x∈UNIV. ?a x powr ?w x) = (∑x∈UNIV. ?w x * ?a x)
                      ⟷ (UNIV :: bool set) ≠ {} ∧ (∀x∈UNIV. ∀y∈UNIV. ?a x = ?a y)" 
    by (intro weighted_arithmetic_geometric_mean_eq_iff) (auto simp add: UNIV_bool)
  thus ?thesis by (auto simp: UNIV_bool add_ac mult_ac)
qed

corollary arithmetic_geometric_mean_binary:
  fixes x1 x2 :: real
  assumes "x1 ≥ 0" "x2 ≥ 0"
  shows   "sqrt (x1 * x2) ≤ (x1 + x2) / 2"
  using weighted_arithmetic_geometric_mean_binary[of x1 x2 "1/2" "1/2"] assms
  by (simp add: powr_half_sqrt field_simps real_sqrt_mult)

corollary arithmetic_geometric_mean_eq_iff_binary:
  fixes x1 x2 :: real
  assumes "x1 ≥ 0" "x2 ≥ 0"
  shows   "sqrt (x1 * x2) = (x1 + x2) / 2 ⟷ x1 = x2"
  using weighted_arithmetic_geometric_mean_eq_iff_binary[of x1 x2 "1/2" "1/2"] assms
  by (simp add: powr_half_sqrt field_simps real_sqrt_mult)

end