feat(Analysis/SpecialFunctions): arithmetic-geometric mean (leanprover-community#32892)

Parcly-Taxel · Parcly-Taxel · commit 0dd53a2a08de · 2026-01-28T19:52:06.000Z
Co-authored-by: Parcly Taxel &lt;reddeloostw@gmail.com&gt;
diff --git a/Mathlib.lean b/Mathlib.lean
@@ -2126,6 +2126,7 @@ public import Mathlib.Analysis.Real.Pi.Wallis
 public import Mathlib.Analysis.Real.Spectrum
 public import Mathlib.Analysis.Seminorm
 public import Mathlib.Analysis.SpecialFunctions.Arcosh
+public import Mathlib.Analysis.SpecialFunctions.ArithmeticGeometricMean
 public import Mathlib.Analysis.SpecialFunctions.Arsinh
 public import Mathlib.Analysis.SpecialFunctions.Artanh
 public import Mathlib.Analysis.SpecialFunctions.Bernstein
diff --git a/Mathlib/Analysis/SpecialFunctions/ArithmeticGeometricMean.lean b/Mathlib/Analysis/SpecialFunctions/ArithmeticGeometricMean.lean
@@ -0,0 +1,302 @@
+/-
+Copyright (c) 2025 Jeremy Tan. All rights reserved.
+Released under Apache 2.0 license as described in the file LICENSE.
+Authors: Jeremy Tan
+-/
+module
+
+public import Mathlib.Analysis.SpecificLimits.Basic
+public import Mathlib.Data.Real.Sqrt
+
+/-!
+# The arithmetic-geometric mean
+
+Starting with two nonnegative real numbers, repeatedly replace them with their arithmetic and
+geometric means. By the AM-GM inequality, the smaller number (geometric mean) will monotonically
+increase and the larger number (arithmetic mean) will monotonically decrease.
+
+The two monotone sequences converge to the same limit – the arithmetic-geometric mean (AGM).
+This file defines the AGM in the `NNReal` namespace and proves some of its basic properties.
+
+## References
+
+* https://en.wikipedia.org/wiki/Arithmetic–geometric_mean
+-/
+
+@[expose] public section
+
+namespace NNReal
+
+/-- The AM–GM inequality for two `NNReal`s, with means in canonical form. -/
+lemma sqrt_mul_le_half_add (x y : ℝ≥0) : sqrt (x * y) ≤ (x + y) / 2 := by
+  rw [sqrt_le_iff_le_sq, div_pow, le_div_iff₀' (by positivity), ← mul_assoc]
+  norm_num
+  exact four_mul_le_sq_add ..
+
+/-- The strict AM–GM inequality for two `NNReal`s, with means in canonical form. -/
+lemma sqrt_mul_lt_half_add_of_ne {x y : ℝ≥0} (h : x ≠ y) : sqrt (x * y) < (x + y) / 2 := by
+  wlog hl : y < x generalizing x y
+  · specialize this h.symm (h.gt_or_lt.resolve_left hl)
+    rwa [mul_comm, add_comm]
+  have key : 0 < (x - y) ^ 2 := sq_pos_iff.mpr (by rwa [← zero_lt_iff, tsub_pos_iff_lt])
+  rw [sq, tsub_mul, mul_tsub, mul_tsub, tsub_tsub_eq_add_tsub_of_le (by gcongr),
+    tsub_add_eq_add_tsub (by gcongr), tsub_tsub, show x * y + y * x = 2 * x * y by ring,
+    tsub_pos_iff_lt, ← sq, ← sq] at key
+  rw [← sqrt_sq (_ / 2), sqrt_lt_sqrt, div_pow, lt_div_iff₀' (by positivity),
+    show (2 : ℝ≥0) ^ 2 * (x * y) = 2 * x * y + 2 * x * y by ring, add_sq, add_right_comm]
+  gcongr
+
+open Function Filter Topology
+
+/-- `agmSequences x y` is the sequence of (geometric, arithmetic) means
+converging to the arithmetic-geometric mean starting from `x` and `y`. -/
+noncomputable def agmSequences (x y : ℝ≥0) : ℕ → ℝ≥0 × ℝ≥0 :=
+  fun n ↦ (fun p ↦ (sqrt (p.1 * p.2), (p.1 + p.2) / 2))^[n + 1] (x, y)
+
+variable {x y : ℝ≥0} {n : ℕ}
+
+@[simp]
+lemma agmSequences_zero : agmSequences x y 0 = (sqrt (x * y), (x + y) / 2) := rfl
+
+lemma agmSequences_succ : agmSequences x y (n + 1) = agmSequences (sqrt (x * y)) ((x + y) / 2) n :=
+  rfl
+
+lemma agmSequences_succ' :
+    agmSequences x y (n + 1) =
+    (sqrt ((agmSequences x y n).1 * (agmSequences x y n).2),
+      ((agmSequences x y n).1 + (agmSequences x y n).2) / 2) := by
+  nth_rw 1 [agmSequences]
+  rw [iterate_succ', comp_apply]
+  rfl
+
+lemma agmSequences_comm : agmSequences x y = agmSequences y x := by
+  funext n
+  cases n with
+  | zero => simp [mul_comm, add_comm]
+  | succ n => simp [agmSequences_succ, mul_comm, add_comm]
+
+lemma le_gm_and_am_le (h : x ≤ y) : x ≤ sqrt (x * y) ∧ (x + y) / 2 ≤ y := by
+  constructor
+  · rw [le_sqrt_iff_sq_le, sq]
+    gcongr
+  · apply div_le_of_le_mul'
+    rw [two_mul]
+    gcongr
+
+lemma dist_gm_am_le : dist (sqrt (x * y)) ((x + y) / 2) ≤ dist x y / 2 := by
+  wlog h : x ≤ y generalizing x y
+  · simpa [add_comm, mul_comm, dist_comm] using this (not_le.mp h).le
+  rw [dist_comm, dist_eq, ← NNReal.coe_sub (sqrt_mul_le_half_add ..), abs_eq]
+  calc
+    _ ≤ ((x + y) / 2 - x).toReal := by
+      gcongr
+      rw [le_sqrt_iff_sq_le, sq]
+      gcongr
+    _ = _ := by
+      nth_rw 2 [← add_halves x]
+      rw [add_div, add_tsub_add_eq_tsub_left, ← tsub_div, NNReal.coe_div, NNReal.coe_two, dist_comm,
+        dist_eq, ← NNReal.coe_sub h, abs_eq]
+
+lemma agmSequences_monotone_and_antitone :
+    (Monotone fun n ↦ (agmSequences x y n).1) ∧ Antitone fun n ↦ (agmSequences x y n).2 := by
+  suffices ∀ n, (agmSequences x y n).1 ≤ (agmSequences x y (n + 1)).1 ∧
+      (agmSequences x y (n + 1)).2 ≤ (agmSequences x y n).2 from
+    ⟨monotone_nat_of_le_succ (this · |>.1), antitone_nat_of_succ_le (this · |>.2)⟩
+  intro n
+  induction n generalizing x y with
+  | zero => exact le_gm_and_am_le (sqrt_mul_le_half_add ..)
+  | succ n ih => exact Prod.mk_le_mk.mp ih
+
+lemma agmSequences_fst_monotone : Monotone fun n ↦ (agmSequences x y n).1 :=
+  agmSequences_monotone_and_antitone.1
+
+lemma agmSequences_snd_antitone : Antitone fun n ↦ (agmSequences x y n).2 :=
+  agmSequences_monotone_and_antitone.2
+
+lemma agmSequences_fst_le_snd (n m : ℕ) : (agmSequences x y n).1 ≤ (agmSequences x y m).2 := by
+  suffices ∀ {k}, (agmSequences x y k).1 ≤ (agmSequences x y k).2 by
+    obtain h | h := le_total n m
+    · exact (agmSequences_fst_monotone h).trans this
+    · exact this.trans (agmSequences_snd_antitone h)
+  intro k
+  induction k generalizing x y with
+  | zero => exact sqrt_mul_le_half_add ..
+  | succ n ih => exact ih
+
+lemma agmSequences_fst_lt_snd_of_ne (h : x ≠ y) (n m : ℕ) :
+    (agmSequences x y n).1 < (agmSequences x y m).2 := by
+  suffices ∀ {k}, (agmSequences x y k).1 < (agmSequences x y k).2 by
+    obtain h | h := le_total n m
+    · exact (agmSequences_fst_monotone h).trans_lt this
+    · exact this.trans_le (agmSequences_snd_antitone h)
+  intro k
+  induction k generalizing x y with
+  | zero => exact sqrt_mul_lt_half_add_of_ne h
+  | succ n ih =>
+    rw [agmSequences_succ']
+    exact sqrt_mul_lt_half_add_of_ne (ih h).ne
+
+lemma agmSequences_min_max : agmSequences (min x y) (max x y) = agmSequences x y := by
+  obtain h | h := le_total x y
+  · rw [min_eq_left h, max_eq_right h]
+  · rw [min_eq_right h, max_eq_left h, agmSequences_comm]
+
+lemma dist_agmSequences_fst_snd (n : ℕ) :
+    dist (agmSequences x y n).1 (agmSequences x y n).2 ≤ dist x y / 2 ^ (n + 1) := by
+  induction n with
+  | zero => simp [dist_gm_am_le]
+  | succ n ih =>
+    rw [agmSequences_succ']
+    apply dist_gm_am_le.trans
+    rw [pow_succ, ← div_div]
+    gcongr
+
+lemma tendsto_dist_agmSequences_atTop_zero :
+    Tendsto (fun n ↦ dist (agmSequences x y n).1 (agmSequences x y n).2) atTop (𝓝 0) := by
+  apply squeeze_zero (fun _ ↦ dist_nonneg) dist_agmSequences_fst_snd
+  conv =>
+    rw [← zero_mul (dist x y / 2)]
+    enter [1, n]
+    rw [pow_succ', ← div_div, div_eq_inv_mul, ← inv_pow]
+  exact (_root_.tendsto_pow_atTop_nhds_zero_of_lt_one (by norm_num) (by norm_num)).mul_const _
+
+/-- The arithmetic-geometric mean of two `NNReal`s, defined as the infimum of arithmetic means. -/
+noncomputable def agm (x y : ℝ≥0) : ℝ≥0 :=
+  ⨅ n, (agmSequences x y n).2
+
+lemma agm_comm : agm x y = agm y x := by
+  unfold agm
+  conv_rhs =>
+    enter [1, n]
+    rw [agmSequences_comm]
+
+lemma agm_eq_ciInf : agm x y = ⨅ n, (agmSequences x y n).2 := rfl
+
+lemma tendsto_agmSequences_snd_agm : Tendsto (fun n ↦ (agmSequences x y n).2) atTop (𝓝 (agm x y)) :=
+  tendsto_atTop_ciInf agmSequences_snd_antitone (OrderBot.bddBelow _)
+
+lemma agm_le_agmSequences_snd (n : ℕ) : agm x y ≤ (agmSequences x y n).2 := ciInf_le' _ n
+
+lemma agm_le_max : agm x y ≤ max x y := by
+  wlog h : x ≤ y generalizing x y
+  · simpa [agm_comm, max_comm] using this (not_le.mp h).le
+  rw [max_eq_right h]
+  apply (agm_le_agmSequences_snd 0).trans
+  rw [agmSequences_zero]
+  exact (le_gm_and_am_le h).2
+
+lemma bddAbove_range_agmSequences_fst : BddAbove (Set.range fun n ↦ (agmSequences x y n).1) := by
+  rw [bddAbove_def]
+  use (agmSequences x y 0).2
+  simp_rw [Set.mem_range, forall_exists_index, forall_apply_eq_imp_iff]
+  exact fun _ ↦ agmSequences_fst_le_snd ..
+
+/-- The AGM is also the supremum of the geometric means. -/
+lemma agm_eq_ciSup : agm x y = ⨆ n, (agmSequences x y n).1 := by
+  refine tendsto_nhds_unique (tendsto_agmSequences_snd_agm.congr_dist ?_)
+    (tendsto_atTop_ciSup agmSequences_fst_monotone bddAbove_range_agmSequences_fst)
+  conv =>
+    enter [1, n]
+    rw [dist_comm]
+  exact tendsto_dist_agmSequences_atTop_zero
+
+lemma tendsto_agmSequences_fst_agm :
+    Tendsto (fun n ↦ (agmSequences x y n).1) atTop (𝓝 (agm x y)) := by
+  rw [agm_eq_ciSup]
+  exact tendsto_atTop_ciSup agmSequences_fst_monotone bddAbove_range_agmSequences_fst
+
+lemma agmSequences_fst_le_agm (n : ℕ) : (agmSequences x y n).1 ≤ agm x y := by
+  rw [agm_eq_ciSup]
+  exact le_ciSup bddAbove_range_agmSequences_fst _
+
+lemma min_le_agm : min x y ≤ agm x y := by
+  wlog h : x ≤ y generalizing x y
+  · simpa [agm_comm, min_comm] using this (not_le.mp h).le
+  rw [min_eq_left h]
+  refine le_trans ?_ (agmSequences_fst_le_agm 0)
+  rw [agmSequences_zero]
+  exact (le_gm_and_am_le h).1
+
+@[simp]
+lemma agm_self : agm x x = x := by
+  apply le_antisymm
+  · nth_rw 3 [← max_self x]
+    exact agm_le_max
+  · nth_rw 1 [← min_self x]
+    exact min_le_agm
+
+@[simp]
+lemma agm_zero_left : agm 0 y = 0 := by
+  suffices ∀ n, (agmSequences 0 y n).1 = 0 by simp [agm_eq_ciSup, this]
+  intro n
+  induction n with
+  | zero => simp [agmSequences]
+  | succ n ih =>
+    rw [agmSequences_succ', ih, zero_mul, sqrt_zero]
+
+@[simp]
+lemma agm_zero_right : agm x 0 = 0 := by
+  rw [agm_comm, agm_zero_left]
+
+lemma agm_pos (hx : 0 < x) (hy : 0 < y) : 0 < agm x y := (lt_min hx hy).trans_le min_le_agm
+
+lemma agm_eq_agm_agmSequences_fst_agmSequences_snd (n : ℕ) :
+    agm x y = agm (agmSequences x y n).1 (agmSequences x y n).2 := by
+  refine tendsto_nhds_unique ?_ tendsto_agmSequences_snd_agm
+  have key := @tendsto_agmSequences_snd_agm x y
+  rw [← tendsto_add_atTop_iff_nat (n + 1)] at key
+  convert key using 2 with m
+  simp_rw [agmSequences, Prod.mk.eta, ← iterate_add_apply, add_right_comm]
+
+lemma agm_eq_agm_gm_am : agm x y = agm (sqrt (x * y)) ((x + y) / 2) := by
+  simpa using agm_eq_agm_agmSequences_fst_agmSequences_snd 0
+
+lemma agmSequences_fst_lt_agm_of_pos_of_ne (hx : 0 < x) (hy : 0 < y) (hn : x ≠ y) (n : ℕ) :
+    (agmSequences x y n).1 < agm x y := by
+  rw [agm_eq_agm_agmSequences_fst_agmSequences_snd n]
+  set p := (agmSequences x y n).1
+  set q := (agmSequences x y n).2
+  apply (?_ : p < sqrt (p * q)).trans_le (agmSequences_fst_le_agm 0)
+  have ppos : 0 < p :=
+    (show 0 < sqrt (x * y) by positivity).trans_le (agmSequences_fst_monotone (zero_le n))
+  have plq : p < q := agmSequences_fst_lt_snd_of_ne hn ..
+  nth_rw 1 [← mul_self_sqrt p, sqrt_mul]
+  gcongr
+
+lemma agm_lt_agmSequences_snd_of_ne (hn : x ≠ y) (n : ℕ) : agm x y < (agmSequences x y n).2 := by
+  rw [agm_eq_agm_agmSequences_fst_agmSequences_snd n]
+  set p := (agmSequences x y n).1
+  set q := (agmSequences x y n).2
+  apply (agm_le_agmSequences_snd 0).trans_lt (?_ : (p + q) / 2 < q)
+  have plq : p < q := agmSequences_fst_lt_snd_of_ne hn ..
+  nth_rw 2 [← add_halves q]
+  rw [add_div]
+  gcongr
+
+lemma min_lt_agm_of_pos_of_ne (hx : 0 < x) (hy : 0 < y) (hn : x ≠ y) : min x y < agm x y := by
+  wlog h : x < y generalizing x y
+  · simpa [agm_comm, min_comm] using this hy hx hn.symm (hn.gt_or_lt.resolve_right h)
+  rw [min_eq_left h.le]
+  refine lt_of_le_of_lt ?_ (agmSequences_fst_lt_agm_of_pos_of_ne hx hy hn 0)
+  rw [agmSequences_zero]
+  exact (le_gm_and_am_le h.le).1
+
+lemma agm_lt_max_of_ne (hn : x ≠ y) : agm x y < max x y := by
+  wlog h : x < y generalizing x y
+  · simpa [agm_comm, max_comm] using this hn.symm (hn.gt_or_lt.resolve_right h)
+  rw [max_eq_right h.le]
+  apply (agm_lt_agmSequences_snd_of_ne hn 0).trans_le
+  rw [agmSequences_zero]
+  exact (le_gm_and_am_le h.le).2
+
+/-- The AGM distributes over multiplication. -/
+lemma agm_mul_distrib {k : ℝ≥0} : agm (k * x) (k * y) = k * agm x y := by
+  simp_rw [agm, mul_iInf]
+  congr! with n
+  induction n generalizing x y with
+  | zero => simp [← mul_div_assoc, mul_add]
+  | succ n ih =>
+    rw [agmSequences_succ, ← mul_add, mul_div_assoc, mul_mul_mul_comm,
+      ← sq, sqrt_mul, sqrt_sq, ih, agmSequences_succ]
+
+end NNReal