Catalog/VC/EpsilonApproximationBound/Full.lean

1	import Catalog.VC.VCDimension.Full
2	import Catalog.VC.EpsilonApproximation.Full
3	import Catalog.VC.ShatterFunctionLemma.Full
4	import Catalog.Sparsity.ChernoffBound.Full
5	import Mathlib.Analysis.SpecialFunctions.Log.Basic
6	import Mathlib.Analysis.SpecialFunctions.Log.Monotone
7	import Mathlib.Analysis.SpecialFunctions.Pow.Real
8	import Mathlib.Analysis.Complex.ExponentialBounds
9	import Mathlib.Algebra.Order.Field.GeomSum
10	import Mathlib.Probability.ProbabilityMassFunction.Constructions
11	import Mathlib.Probability.ProbabilityMassFunction.Integrals
12	import Mathlib.Probability.Independence.Basic
13	import Mathlib.MeasureTheory.Integral.Pi
14
15	namespace Catalog.VC.EpsilonApproximationBound
16
17	def IsRelativeApprox {α : Type*} [DecidableEq α]
18	(𝒜 : Finset (Finset α)) (Y Z : Finset α) (ε : ℝ) : Prop :=
19	∀ S ∈ 𝒜, \|((S ∩ Z).card : ℝ) / Z.card - ((S ∩ Y).card : ℝ) / Y.card\| ≤ ε
20
21	lemma approx_transitive {α : Type*} [DecidableEq α] [Fintype α]
22	(𝒜 : Finset (Finset α)) {Y Z : Finset α} {ε₁ ε₂ : ℝ}
23	(hY : Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 ε₁ Y)
24	(hZ : IsRelativeApprox 𝒜 Y Z ε₂) :
25	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 (ε₁ + ε₂) Z := by
26	intro S hS
27	refine le_trans (abs_sub_le _ (((S ∩ Y).card : ℝ) / Y.card) _) ?_
28	simpa [add_comm, add_left_comm, add_assoc] using add_le_add (hZ S hS) (hY S hS)
29
30	lemma relativeApprox_self {α : Type*} [DecidableEq α]
31	(𝒜 : Finset (Finset α)) (Y : Finset α) :
32	IsRelativeApprox 𝒜 Y Y 0 := by
33	intro S hS
34	simp
35
36	lemma relativeApprox_mono {α : Type*} [DecidableEq α]
37	(𝒜 : Finset (Finset α)) {Y Z : Finset α} {ε ε' : ℝ}
38	(h : IsRelativeApprox 𝒜 Y Z ε) (hε : ε ≤ ε') :
39	IsRelativeApprox 𝒜 Y Z ε' := by
40	intro S hS
41	exact (h S hS).trans hε
42
43	lemma relativeApprox_trans {α : Type*} [DecidableEq α]
44	(𝒜 : Finset (Finset α)) {W Y Z : Finset α} {ε₁ ε₂ : ℝ}
45	(h₁ : IsRelativeApprox 𝒜 W Y ε₁) (h₂ : IsRelativeApprox 𝒜 Y Z ε₂) :
46	IsRelativeApprox 𝒜 W Z (ε₁ + ε₂) := by
47	intro S hS
48	refine le_trans (abs_sub_le _ (((S ∩ Y).card : ℝ) / Y.card) _) ?_
49	linarith [h₂ S hS, h₁ S hS]
50
51	private lemma trace_card_le {α : Type*} [DecidableEq α] [Fintype α]
52	(𝒜 : Finset (Finset α)) {d : ℕ} (hd : 𝒜.vcDim ≤ d) (Y : Finset α) :
53	(Catalog.VC.ShatterFunction.trace 𝒜 Y).card ≤
54	Catalog.VC.ShatterFunctionLemma.binomialSum d Y.card := by
55	calc (Catalog.VC.ShatterFunction.trace 𝒜 Y).card
56	≤ Catalog.VC.ShatterFunction.shatterFun 𝒜 Y.card :=
57	Finset.le_sup_of_le (Finset.mem_filter.mpr ⟨Finset.mem_univ Y, rfl⟩) le_rfl
58	_ ≤ Catalog.VC.ShatterFunctionLemma.binomialSum d Y.card :=
59	Catalog.VC.ShatterFunctionLemma.shatterFunctionLemma 𝒜 hd Y.card
60
61	lemma exists_half_subset {α : Type*} [DecidableEq α]
62	(Y : Finset α) (hY : 2 ≤ Y.card) :
63	∃ Z : Finset α, Z ⊆ Y ∧ 0 < Z.card ∧ Z.card ≤ Y.card / 2 := by
64	let m := Y.card / 2
65	have hm_pos : 0 < m := by
66	dsimp [m]
67	omega
68	have hm_le : m ≤ Y.card := by
69	dsimp [m]
70	exact Nat.div_le_self _ _
71	rcases Finset.exists_subset_card_eq (s := Y) hm_le with ⟨Z, hZY, hZcard⟩
72	refine ⟨Z, hZY, ?_, ?_⟩
73	· simpa [hZcard] using hm_pos
74	· simpa [m] using hZcard.le
75
76	lemma dyadic_error_decay_two_steps {m : ℕ} (hm : 2 ≤ m) :
77	Real.sqrt (Real.log ((2 : ℝ) ^ (m + 2)) / ((2 : ℝ) ^ (m + 2)))
78	≤ (3 / 4 : ℝ) * Real.sqrt (Real.log ((2 : ℝ) ^ m) / ((2 : ℝ) ^ m)) := by
79	have hbase :
80	Real.log ((2 : ℝ) ^ (m + 2)) / ((2 : ℝ) ^ (m + 2))
81	≤ ((3 / 4 : ℝ)^2) * (Real.log ((2 : ℝ) ^ m) / ((2 : ℝ) ^ m)) := by
82	rw [Real.log_pow, Real.log_pow, pow_add]
83	have hpow_ne : ((2 : ℝ) ^ m) ≠ 0 := by
84	positivity
85	field_simp [hpow_ne]
86	ring_nf
87	have hm36 : 16 * ((2 + m : ℕ) : ℝ) ≤ 36 * m := by
88	exact_mod_cast (show 16 * (2 + m) ≤ 36 * m by omega)
89	nlinarith [hm36, Real.log_pos (by norm_num : (1 : ℝ) < 2)]
90	have hsqrt34 : Real.sqrt ((3 / 4 : ℝ)^2) = (3 / 4 : ℝ) := by
91	rw [Real.sqrt_sq_eq_abs]
92	norm_num
93	calc
94	Real.sqrt (Real.log ((2 : ℝ) ^ (m + 2)) / ((2 : ℝ) ^ (m + 2)))
95	≤ Real.sqrt (((3 / 4 : ℝ)^2) * (Real.log ((2 : ℝ) ^ m) / ((2 : ℝ) ^ m))) :=
96	Real.sqrt_le_sqrt hbase
97	_ = Real.sqrt ((3 / 4 : ℝ)^2) * Real.sqrt (Real.log ((2 : ℝ) ^ m) / ((2 : ℝ) ^ m)) := by
98	rw [Real.sqrt_mul (by positivity)]
99	_ = (3 / 4 : ℝ) * Real.sqrt (Real.log ((2 : ℝ) ^ m) / ((2 : ℝ) ^ m)) := by
100	rw [hsqrt34]
101
102	private lemma relativeApprox_of_trace {α : Type*} [DecidableEq α]
103	(𝒜 : Finset (Finset α)) (Y Z : Finset α) (hZY : Z ⊆ Y) {ε : ℝ}
104	(htrace : ∀ T ∈ Catalog.VC.ShatterFunction.trace 𝒜 Y,
105	\|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / Y.card\| ≤ ε) :
106	IsRelativeApprox 𝒜 Y Z ε := by
107	intro S hS
108	have hmem : S ∩ Y ∈ Catalog.VC.ShatterFunction.trace 𝒜 Y := by
109	exact Finset.mem_image.mpr ⟨S, hS, by simp⟩
110	have hsub :
111	Y ∩ (Z ∩ S) = Z ∩ S := by
112	ext x
113	constructor
114	· intro hx
115	simp only [Finset.mem_inter] at hx ⊢
116	exact ⟨hx.2.1, hx.2.2⟩
117	· intro hx
118	simp only [Finset.mem_inter] at hx ⊢
119	exact ⟨hZY hx.1, hx.1, hx.2⟩
120	simpa [Catalog.VC.ShatterFunction.trace, hsub, Finset.inter_assoc, Finset.inter_left_comm,
121	Finset.inter_comm] using htrace (S ∩ Y) hmem
122
123	/-- Density deviation for any two nested subsets is at most 1. -/
124	private lemma density_deviation_le_one {α : Type*} [DecidableEq α]
125	{T Y Z : Finset α} (hTY : T ⊆ Y) (hZY : Z ⊆ Y) (hZ : 0 < Z.card) :
126	\|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / Y.card\| ≤ 1 := by
127	have hZcard : (0 : ℝ) < Z.card := Nat.cast_pos.mpr hZ
128	have hYcard : (0 : ℝ) < Y.card := by
129	exact_mod_cast lt_of_lt_of_le hZ (Finset.card_le_card hZY)
130	have h1 : ((T ∩ Z).card : ℝ) / Z.card ≤ 1 := by
131	rw [div_le_one hZcard]
132	exact_mod_cast Finset.card_le_card Finset.inter_subset_right
133	have h2 : (T.card : ℝ) / Y.card ≤ 1 := by
134	rw [div_le_one hYcard]
135	exact_mod_cast Finset.card_le_card hTY
136	have h3 : 0 ≤ ((T ∩ Z).card : ℝ) / Z.card := div_nonneg (Nat.cast_nonneg _) hZcard.le
137	have h4 : 0 ≤ (T.card : ℝ) / Y.card := div_nonneg (Nat.cast_nonneg _) hYcard.le
138	rw [abs_le]
139	exact ⟨by linarith, by linarith⟩
140
141	/-- Additive-to-ratio conversion for density deviations.
142	If \|tz - k/2\| ≤ t and \|z - n/2\| ≤ s and z ≥ n/4,
143	then \|tz/z - k/n\| ≤ 4(t+s)/n. -/
144	private lemma ratio_of_additive {n k z tz : ℝ}
145	(hn : 0 < n) (hz : 0 < z) (hk : k ≤ n) (hk0 : 0 ≤ k)
146	(hz_lb : n / 4 ≤ z)
147	{t s : ℝ}
148	(h_trace : \|tz - k / 2\| ≤ t)
149	(h_size : \|z - n / 2\| ≤ s) :
150	\|tz / z - k / n\| ≤ 4 * (t + s) / n := by
151	have hs : 0 ≤ s := le_trans (abs_nonneg _) h_size
152	have ht : 0 ≤ t := le_trans (abs_nonneg _) h_trace
153	rw [div_sub_div _ _ (ne_of_gt hz) (ne_of_gt hn)]
154	have h_denom_pos : 0 < z * n := mul_pos hz hn
155	rw [abs_div, abs_of_pos h_denom_pos, div_le_div_iff₀ h_denom_pos hn]
156	have key : \|tz * n - z * k\| ≤ n * (t + s) := by
157	have eq : tz * n - z * k = n * (tz - k / 2) - k * (z - n / 2) := by ring
158	rw [eq]
159	calc \|n * (tz - k / 2) - k * (z - n / 2)\|
160	≤ \|n * (tz - k / 2)\| + \|-(k * (z - n / 2))\| := abs_add_le _ _
161	_ = n * \|tz - k / 2\| + k * \|z - n / 2\| := by
162	rw [abs_neg, abs_mul, abs_mul, abs_of_pos hn, abs_of_nonneg hk0]
163	_ ≤ n * t + k * s := by nlinarith
164	_ ≤ n * t + n * s := by nlinarith
165	_ = n * (t + s) := by ring
166	nlinarith [key, abs_nonneg (tz * n - z * k)]
167
168	-- Product Bernoulli(1/2) probability space for the probabilistic method
169	section ProbSetup
170	open MeasureTheory ProbabilityTheory
171
172	private noncomputable def bernHalf : PMF Bool :=
173	PMF.bernoulli (⟨1/2, by norm_num⟩ : NNReal)
174	(by show (⟨1/2, _⟩ : NNReal).val ≤ (1 : NNReal).val; simp; norm_num)
175
176	private noncomputable def bernHalfMeas : Measure Bool := bernHalf.toMeasure
177	private instance : IsProbabilityMeasure bernHalfMeas := by
178	unfold bernHalfMeas; infer_instance
179
180	private noncomputable def prodBern (n : ℕ) : Measure (Fin n → Bool) :=
181	Measure.pi (fun (_ : Fin n) => bernHalfMeas)
182
183	private instance (n : ℕ) : IsProbabilityMeasure (prodBern n) :=
184	Measure.pi.instIsProbabilityMeasure _
185
186	private def ind (b : Bool) : ℝ := if b then 1 else 0
187
188	private lemma exp_neg_mul_log_nat (n c : ℕ) (hn : 1 < n) :
189	Real.exp (-(↑c * Real.log (↑n : ℝ))) = ((↑n : ℝ) ^ c)⁻¹ := by
190	rw [show -(↑c * Real.log (↑n : ℝ)) = Real.log (((↑n : ℝ) ^ c)⁻¹) from by
191	rw [Real.log_inv, Real.log_pow]]
192	exact Real.exp_log (by positivity : (0:ℝ) < ((↑n : ℝ) ^ c)⁻¹)
193
194	end ProbSetup
195
196
197	section GoodOmega
198	open MeasureTheory ProbabilityTheory Real Finset
199
200	set_option maxHeartbeats 1600000 in
201	private lemma good_omega_exists (d : ℕ) :
202	∃ N : ℕ, 2 ≤ N ∧
203	∀ (n : ℕ), N ≤ n →
204	∀ (family : Finset (Finset (Fin n))),
205	family.card ≤ Catalog.VC.ShatterFunctionLemma.binomialSum d n →
206	∃ ω : Fin n → Bool,
207	\|(((Finset.univ.filter (fun i => ω i)).card : ℝ) - ↑n / 2)\| ≤
208	Real.sqrt (3 * ↑n * Real.log ↑n) ∧
209	∀ T ∈ family,
210	\|(((T.filter (fun i => ω i)).card : ℝ) - ↑T.card / 2)\| ≤
211	Real.sqrt (2 * (↑d + 1) * ↑n * Real.log ↑n) := by
212	refine ⟨max 512 (4 * (d + 2)), by omega, ?_⟩
213	intro n hn family hfamily
214	have hn512 : 512 ≤ n := by omega
215	have hn_pos : (0 : ℝ) < ↑n := by exact_mod_cast (show 0 < n by omega)
216	have hn_ne : (↑n : ℝ) ≠ 0 := ne_of_gt hn_pos
217	have hnd : 4 * (d + 2) ≤ n := by omega
218	have hn1 : (1 : ℝ) < ↑n := by exact_mod_cast (show 1 < n by omega)
219	have hn1' : 1 < n := by omega
220	-- ═══════════════════════════════════════════════════════
221	-- Probability space
222	-- ═══════════════════════════════════════════════════════
223	set μ := prodBern n
224	set X : Fin n → (Fin n → Bool) → ℝ := fun i ω => ind (ω i)
225	have hp : (1:ℝ)/2 ∈ Set.Icc 0 1 := ⟨by norm_num, by norm_num⟩
226	have hX_meas : ∀ i, Measurable (X i) := fun _ => measurable_of_finite _
227	have hX_indep : iIndepFun X μ :=
228	@iIndepFun_pi (Fin n) _ (fun _ => Bool) (fun _ => inferInstance)
229	(fun _ => bernHalfMeas) _ (fun _ => ℝ) (fun _ => inferInstance) (fun _ => ind)
230	(fun _ => (measurable_of_finite _).aemeasurable)
231	have hX_bern : ∀ i, ∀ᵐ ω ∂μ, X i ω = 0 ∨ X i ω = 1 :=
232	fun _ => Filter.Eventually.of_forall (fun ω => by simp [X, ind])
233	have hX_mean : ∀ i, ∫ ω, X i ω ∂μ = 1/2 := fun i => by
234	have h := @integral_comp_eval (Fin n) _ (fun _ => Bool) (fun _ => inferInstance)
235	(fun _ => bernHalfMeas) ℝ _ _ _ i ind
236	(Measurable.aestronglyMeasurable (measurable_of_finite _))
237	show ∫ ω, ind (ω i) ∂prodBern n = 1/2
238	unfold prodBern; rw [h, bernHalfMeas, PMF.integral_eq_sum]
239	simp [ind, bernHalf, PMF.bernoulli_apply]
240	rfl
241	-- ═══════════════════════════════════════════════════════
242	-- √(3n log n) ≤ n/4 for n ≥ 512
243	-- ═══════════════════════════════════════════════════════
244	have hlog_pos : 0 < log ↑n := log_pos hn1
245	have h_sz : sqrt (3 * ↑n * log ↑n) ≤ ↑n / 4 := by
246	rw [sqrt_le_left (by positivity)]
247	have h512R : (512 : ℝ) ≤ ↑n := by exact_mod_cast hn512
248	have hlog_bound : log ↑n ≤ 8 + ↑n / 512 := by
249	have hndiv_pos : (0 : ℝ) < ↑n / 512 := by linarith
250	linarith [log_div (ne_of_gt hn_pos) (by norm_num : (512:ℝ) ≠ 0),
251	show log (512 : ℝ) ≤ 9 from by
252	rw [show (512:ℝ) = 2^(9:ℕ) from by norm_num, log_pow]; push_cast
253	nlinarith [log_le_sub_one_of_pos (by norm_num : (0:ℝ) < 2)],
254	log_le_sub_one_of_pos hndiv_pos]
255	nlinarith [mul_le_mul_of_nonneg_left hlog_bound (show (0:ℝ) ≤ 3 * ↑n by positivity),
256	log_nonneg (le_of_lt hn1)]
257	-- ═══════════════════════════════════════════════════════
258	-- Size Chernoff: P(\|Z - n/2\| ≥ √(3n log n)) ≤ 2/n²
259	-- ═══════════════════════════════════════════════════════
260	-- δ = 2√(3n log n)/n ∈ (0,1)
261	have hδ_s_pos : 0 < 2 * sqrt (3 * ↑n * log ↑n) / ↑n :=
262	div_pos (mul_pos (by norm_num) (sqrt_pos.mpr (by nlinarith))) hn_pos
263	have hδ_s_lt : 2 * sqrt (3 * ↑n * log ↑n) / ↑n < 1 := by
264	rw [div_lt_one hn_pos]; linarith [h_sz]
265	-- Apply chernoffBound
266	have h_chern_s :=
267	Catalog.Sparsity.ChernoffBound.chernoffBound hp hX_meas hX_indep hX_bern hX_mean
268	(Set.mem_Ioo.mpr ⟨hδ_s_pos, hδ_s_lt⟩)
269	-- Threshold simplification: δ * (n * 1/2) = √(3n log n)
270	have h_thr_s : 2 * sqrt (3 * ↑n * log ↑n) / ↑n * (↑n * (1/2)) =
271	sqrt (3 * ↑n * log ↑n) := by field_simp
272	-- Exponent simplification: δ² * (n/2) / 3 = 2 log n
273	have h_exp_s : (2 * sqrt (3 * ↑n * log ↑n) / ↑n) ^ 2 * (↑n * (1/2)) / 3 =
274	2 * log ↑n := by
275	have hsq : sqrt (3 * ↑n * log ↑n) ^ 2 = 3 * ↑n * log ↑n := sq_sqrt (by positivity)
276	field_simp
277	nlinarith [hsq]
278	rw [h_thr_s] at h_chern_s
279	-- Combine: μ.real(bad_size) ≤ 2/n²
280	have h_size_bound : μ.real {ω \| sqrt (3 * ↑n * log ↑n) ≤
281	\|∑ i : Fin n, X i ω - ↑n * (1/2)\|} ≤ 2 * ((↑n : ℝ) ^ 2)⁻¹ := by
282	have h2 : (2 : ℝ) = ↑(2 : ℕ) := by norm_num
283	calc μ.real _ ≤ 2 * rexp (-((2 * sqrt (3 * ↑n * log ↑n) / ↑n) ^ 2 *
284	(↑n * (1/2)) / 3)) := h_chern_s
285	_ = 2 * rexp (-(2 * log ↑n)) := by rw [h_exp_s]
286	_ = 2 * ((↑n : ℝ) ^ 2)⁻¹ := by rw [h2, exp_neg_mul_log_nat n 2 hn1']
287	-- ═══════════════════════════════════════════════════════
288	-- Trace Chernoff
289	-- ═══════════════════════════════════════════════════════
290	set t := sqrt (2 * (↑d + 1) * ↑n * log ↑n)
291	have ht_nonneg : 0 ≤ t := sqrt_nonneg _
292	have h_trace_bound : ∀ T ∈ family,
293	μ.real {ω \| t < \|(∑ j : Fin T.card,
294	X ((T.orderIsoOfFin rfl) j) ω) - ↑T.card * (1/2)\|} ≤
295	2 * ((↑n : ℝ) ^ (d+1))⁻¹ := by
296	intro T hT
297	have hTn : T.card ≤ n := by
298	calc T.card ≤ univ.card := card_le_card (subset_univ T)
299	_ = n := by simp [Fintype.card_fin]
300	by_cases hT_big : (2 * t : ℝ) < ↑T.card
301	· -- Big trace: Chernoff via precomp
302	have hTcard_pos : (0 : ℝ) < ↑T.card := by linarith [ht_nonneg]
303	have hf_inj : Function.Injective
304	(fun j : Fin T.card => ((T.orderIsoOfFin rfl) j : Fin n)) := by
305	intro a b hab
306	exact_mod_cast (T.orderIsoOfFin rfl).injective (Subtype.val_injective hab)
307	have hXT_indep : iIndepFun (fun j (ω : Fin n → Bool) =>
308	X ((T.orderIsoOfFin rfl) j) ω) μ :=
309	hX_indep.precomp hf_inj
310	have hchern_T := Catalog.Sparsity.ChernoffBound.chernoffBound hp
311	(fun j => hX_meas _) hXT_indep (fun j => hX_bern _) (fun j => hX_mean _)
312	(Set.mem_Ioo.mpr ⟨show 0 < 2 * t / ↑T.card from div_pos (by positivity) hTcard_pos,
313	show 2 * t / ↑T.card < 1 from by rw [div_lt_one hTcard_pos]; linarith⟩)
314	-- Threshold: δ_T * (T.card/2) = t
315	have h_thr_T : 2 * t / ↑T.card * (↑T.card * (1/2)) = t := by
316	field_simp
317	-- Exponent bound: δ_T² * T.card/2/3 ≥ (d+1) * log n
318	have h_exp_T : (↑(d+1) : ℝ) * log ↑n ≤
319	(2 * t / ↑T.card) ^ 2 * (↑T.card * (1/2)) / 3 := by
320	have hsq : t ^ 2 = 2 * (↑d + 1) * ↑n * log ↑n := sq_sqrt (by positivity)
321	have hTR : (↑T.card : ℝ) ≤ ↑n := by exact_mod_cast hTn
322	have key : (2 * t / ↑T.card) ^ 2 * (↑T.card * (1/2)) / 3 =
323	2 * t ^ 2 / (3 * ↑T.card) := by field_simp
324	rw [key, hsq]
325	rw [le_div_iff₀ (by positivity : (0:ℝ) < 3 * ↑T.card)]
326	push_cast; nlinarith [hTcard_pos, hTR, hlog_pos]
327	rw [h_thr_T] at hchern_T
328	-- {t < \|...\|} ⊆ {t ≤ \|...\|}, and chernoff bounds the ≤ version
329	have h_subset : {ω : Fin n → Bool \| t < \|(∑ j : Fin T.card,
330	X ((T.orderIsoOfFin rfl) j) ω) - ↑T.card * (1/2)\|} ⊆
331	{ω \| t ≤ \|(∑ j : Fin T.card,
332	X ((T.orderIsoOfFin rfl) j) ω) - ↑T.card * (1/2)\|} :=
333	fun _ hω => Set.mem_setOf.mpr (le_of_lt (Set.mem_setOf.mp hω))
334	calc μ.real {ω \| t < \|(∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω) -
335	↑T.card * (1/2)\|}
336	≤ μ.real {ω \| t ≤ \|(∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω) -
337	↑T.card * (1/2)\|} :=
338	measureReal_mono h_subset (measure_ne_top μ _)
339	_ ≤ 2 * rexp (-((2 * t / ↑T.card) ^ 2 * (↑T.card * (1/2)) / 3)) := hchern_T
340	_ ≤ 2 * rexp (-(↑(d+1) * log ↑n)) := by
341	apply mul_le_mul_of_nonneg_left _ (by norm_num : (0:ℝ) ≤ 2)
342	apply exp_le_exp.mpr; linarith [h_exp_T]
343	_ = 2 * ((↑n : ℝ) ^ (d+1))⁻¹ := by
344	congr 1; exact exp_neg_mul_log_nat n (d+1) hn1'
345	· -- Small trace: deterministic bound
346	push_neg at hT_big
347	have h_det : ∀ ω : Fin n → Bool, \|(∑ j : Fin T.card,
348	X ((T.orderIsoOfFin rfl) j) ω) - ↑T.card * (1/2)\| ≤ t := by
349	intro ω
350	have h_lo : 0 ≤ ∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω :=
351	sum_nonneg (fun j _ => by simp [X, ind]; split <;> norm_num)
352	have h_hi : ∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω ≤ ↑T.card :=
353	calc _ ≤ ∑ _j : Fin T.card, (1 : ℝ) :=
354	sum_le_sum (fun j _ => by simp [X, ind]; split <;> norm_num)
355	_ = ↑T.card := by simp
356	rw [abs_le]; constructor <;> nlinarith [hT_big]
357	have h_empty : {ω : Fin n → Bool \| t < \|(∑ j : Fin T.card,
358	X ((T.orderIsoOfFin rfl) j) ω) - ↑T.card * (1/2)\|} = ∅ := by
359	ext ω; simp only [Set.mem_setOf_eq, Set.mem_empty_iff_false, iff_false]
360	exact not_lt.mpr (h_det ω)
361	rw [h_empty]; simp [Measure.real]
362	-- ═══════════════════════════════════════════════════════
363	-- Union bound: total bad prob < 1
364	-- ═══════════════════════════════════════════════════════
365	set bad_size := {ω : Fin n → Bool \| sqrt (3 * ↑n * log ↑n) ≤
366	\|∑ i : Fin n, X i ω - ↑n * (1/2)\|}
367	set bad_trace : Finset (Fin n) → Set (Fin n → Bool) := fun T =>
368	{ω \| t < \|(∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω) -
369	↑T.card * (1/2)\|}
370	set bad := bad_size ∪ ⋃ T ∈ family, bad_trace T
371	have hbad_meas : MeasurableSet bad := Set.Finite.measurableSet (Set.toFinite _)
372	-- Convert μ.real bounds to ENNReal
373	have h_mu_size : μ bad_size ≤ ENNReal.ofReal (2 * ((↑n : ℝ) ^ 2)⁻¹) :=
374	(ENNReal.ofReal_toReal (measure_ne_top μ _)).symm ▸
375	ENNReal.ofReal_le_ofReal h_size_bound
376	have h_mu_trace : ∀ T ∈ family,
377	μ (bad_trace T) ≤ ENNReal.ofReal (2 * ((↑n : ℝ) ^ (d+1))⁻¹) := by
378	intro T hT
379	exact (ENNReal.ofReal_toReal (measure_ne_top μ _)).symm ▸
380	ENNReal.ofReal_le_ofReal (h_trace_bound T hT)
381	-- μ(bad) < 1
382	have h_mu_bad : μ bad < 1 := by
383	calc μ bad ≤ μ bad_size + μ (⋃ T ∈ family, bad_trace T) := measure_union_le _ _
384	_ ≤ μ bad_size + ∑ T ∈ family, μ (bad_trace T) := by
385	gcongr; exact measure_biUnion_finset_le _ _
386	_ ≤ ENNReal.ofReal (2 * ((↑n : ℝ) ^ 2)⁻¹) +
387	∑ T ∈ family, ENNReal.ofReal (2 * ((↑n : ℝ) ^ (d+1))⁻¹) :=
388	add_le_add h_mu_size (sum_le_sum (fun T hT => h_mu_trace T hT))
389	_ = ENNReal.ofReal (2 * ((↑n : ℝ) ^ 2)⁻¹) +
390	↑family.card * ENNReal.ofReal (2 * ((↑n : ℝ) ^ (d+1))⁻¹) := by
391	simp [sum_const, nsmul_eq_mul]
392	_ < 1 := by
393	-- Convert ↑family.card to ENNReal.ofReal
394	have hcast : (↑family.card : ENNReal) = ENNReal.ofReal ↑family.card := by
395	simp [ENNReal.ofReal_natCast]
396	rw [hcast]
397	rw [← ENNReal.ofReal_mul (by positivity)]
398	rw [← ENNReal.ofReal_add (by positivity) (by positivity)]
399	rw [show (1 : ENNReal) = ENNReal.ofReal 1 from ENNReal.ofReal_one.symm]
400	exact (ENNReal.ofReal_lt_ofReal_iff (by norm_num)).mpr (by
401	-- ℝ bound: 2/n² + family.card * 2/n^{d+1} < 1
402	have hn1R : (1 : ℝ) ≤ ↑n := by exact_mod_cast (show 1 ≤ n by omega)
403	have hbinom : family.card ≤ (d + 1) * n ^ d := by
404	calc family.card ≤ Catalog.VC.ShatterFunctionLemma.binomialSum d n := hfamily
405	_ ≤ (d + 1) * n ^ d := by
406	unfold Catalog.VC.ShatterFunctionLemma.binomialSum
407	exact le_trans
408	(Finset.sum_le_sum (fun k _ => Nat.choose_le_pow n k))
409	(le_trans
410	(Finset.sum_le_sum (fun k hk =>
411	Nat.pow_le_pow_right (by omega)
412	(Nat.le_of_lt_succ (Finset.mem_range.mp hk))))
413	(by simp [Finset.card_range]))
414	have hfc : (↑family.card : ℝ) ≤ (↑d + 1) * (↑n : ℝ) ^ d := by
415	exact_mod_cast hbinom
416	have h_t1 : ↑family.card * (2 * ((↑n : ℝ) ^ (d+1))⁻¹) ≤
417	2 * (↑d + 1) / ↑n := by
418	rw [show (↑n : ℝ) ^ (d+1) = (↑n : ℝ) ^ d * ↑n from by ring]
419	calc ↑family.card * (2 * ((↑n : ℝ) ^ d * ↑n)⁻¹)
420	≤ ((↑d + 1) * (↑n : ℝ) ^ d) * (2 * ((↑n : ℝ) ^ d * ↑n)⁻¹) := by
421	gcongr
422	_ = (↑d + 1) * (2 / ↑n) := by rw [mul_inv]; field_simp
423	_ = 2 * (↑d + 1) / ↑n := by ring
424	have h_t2 : 2 * ((↑n : ℝ) ^ 2)⁻¹ ≤ 2 / ↑n := by
425	rw [show (↑n : ℝ) ^ 2 = ↑n * ↑n from by ring, mul_inv]
426	calc 2 * ((↑n : ℝ)⁻¹ * (↑n : ℝ)⁻¹)
427	≤ 2 * ((↑n : ℝ)⁻¹ * 1) := by
428	gcongr; exact inv_le_one_of_one_le₀ hn1R
429	_ = 2 / ↑n := by ring
430	calc 2 * ((↑n : ℝ) ^ 2)⁻¹ + ↑family.card * (2 * ((↑n : ℝ) ^ (d+1))⁻¹)
431	≤ 2 / ↑n + 2 * (↑d + 1) / ↑n := add_le_add h_t2 h_t1
432	_ = 2 * (↑d + 2) / ↑n := by ring
433	_ ≤ 2 * (↑d + 2) / (4 * (↑d + 2)) := by
434	gcongr; exact_mod_cast hnd
435	_ = 1 / 2 := by field_simp; norm_num
436	_ < 1 := by norm_num)
437	-- ═══════════════════════════════════════════════════════
438	-- Witness extraction
439	-- ═══════════════════════════════════════════════════════
440	have h_good : badᶜ.Nonempty := by
441	apply nonempty_of_measure_ne_zero
442	rw [measure_compl hbad_meas (measure_ne_top μ bad)]
443	simp [measure_univ]
444	exact ne_of_gt (tsub_pos_of_lt h_mu_bad)
445	obtain ⟨ω, hω⟩ := h_good
446	refine ⟨ω, ?_, ?_⟩
447	· -- Size bound
448	have hω_size : ω ∉ bad_size := fun h => hω (Set.mem_union_left _ h)
449	simp only [bad_size, Set.mem_setOf_eq, not_le] at hω_size
450	have hsum : ∑ i : Fin n, X i ω = ((univ.filter (fun i => ω i)).card : ℝ) := by
451	simp [X, ind, ← sum_boole]
452	rw [show (↑n : ℝ) / 2 = ↑n * (1/2) from by ring]
453	linarith [hsum ▸ hω_size]
454	· -- Trace bounds
455	intro T hT
456	have hω_trace : ω ∉ bad_trace T := by
457	intro h; exact hω (Set.mem_union_right _ (Set.mem_biUnion hT h))
458	simp only [bad_trace, Set.mem_setOf_eq, not_lt] at hω_trace
459	have hsum_T : ∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω =
460	((T.filter (fun i => ω i)).card : ℝ) := by
461	have h1 : ∑ j : Fin T.card, X ((T.orderIsoOfFin rfl) j) ω =
462	∑ i ∈ T, X i ω := by
463	rw [← T.sum_coe_sort (fun i => X i ω)]
464	exact Fintype.sum_equiv (T.orderIsoOfFin rfl).toEquiv _ _ (fun j => rfl)
465	rw [h1]; simp [X, ind, ← sum_boole]
466	rw [show (↑T.card : ℝ) / 2 = ↑T.card * (1/2) from by ring]
467	linarith [hsum_T ▸ hω_trace]
468
469
470	end GoodOmega
471
472	/-- The probabilistic core for large sets: there exist a uniform constant `c > 0`
473	and threshold `N` (depending only on `d`) such that for any `n ≥ N`, given a
474	family of subsets of `Fin n` with polynomially bounded size, a half-sized subset
475	with good simultaneous density control exists.
476
477	The proof uses `good_omega_exists` for the probabilistic argument,
478	then converts additive bounds to ratio bounds via `ratio_of_additive`,
479	and handles the complement trick when \|Z\| > n/2. -/
480	private lemma exists_good_half_subset_large (d : ℕ) :
481	∃ (c : ℝ) (N : ℕ), 0 < c ∧ 2 ≤ N ∧
482	∀ (n : ℕ), N ≤ n →
483	∀ (family : Finset (Finset (Fin n))),
484	family.card ≤ Catalog.VC.ShatterFunctionLemma.binomialSum d n →
485	∃ Z : Finset (Fin n), 0 < Z.card ∧ Z.card ≤ n / 2 ∧
486	∀ T ∈ family,
487	\|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / n\| ≤
488	c * Real.sqrt (Real.log (↑n) / ↑n) := by
489	obtain ⟨N₀, hN₀, hgood⟩ := good_omega_exists d
490	-- The density constant: 4(√(2(d+1)) + √3) accounts for the ratio conversion
491	refine ⟨4 * (Real.sqrt (2 * (↑d + 1)) + Real.sqrt 3), max N₀ 512, by positivity,
492	by omega, ?_⟩
493	intro n hn family hfamily
494	have hn0 : N₀ ≤ n := by omega
495	have hn512 : 512 ≤ n := by omega
496	have hn_pos : (0 : ℝ) < n := by positivity
497	obtain ⟨ω, h_size, h_trace⟩ := hgood n hn0 family hfamily
498	-- Z₀ = {i \| ω i = true}
499	set Z₀ := Finset.univ.filter (fun i : Fin n => ω i) with hZ₀_def
500	have hZ₀_card_le : Z₀.card ≤ n := by
501	calc Z₀.card ≤ Finset.univ.card := Finset.card_filter_le _ _
502	_ = n := by simp [Fintype.card_fin]
503	-- T ∩ Z₀ = T.filter (ω ·) for any T
504	have hTZ₀ : ∀ T : Finset (Fin n), T ∩ Z₀ = T.filter (fun i => ω i) := by
505	intro T; ext x; simp [Z₀, Finset.mem_inter, Finset.mem_filter]
506	-- Size lower bound: \|\|Z₀\| - n/2\| ≤ √(3n log n) and n ≥ 512 imply n/4 ≤ \|Z₀\| ≤ 3n/4
507	have h_sz : Real.sqrt (3 * ↑n * Real.log ↑n) ≤ ↑n / 4 := by
508	rw [Real.sqrt_le_left (by positivity : (0:ℝ) ≤ (↑n : ℝ) / 4)]
509	have h512R : (512 : ℝ) ≤ (↑n : ℝ) := by exact_mod_cast hn512
510	have hlog_bound : Real.log (↑n : ℝ) ≤ 8 + (↑n : ℝ) / 512 := by
511	have hndiv_pos : (0 : ℝ) < (↑n : ℝ) / 512 := by linarith
512	have hlog_split : Real.log (↑n : ℝ) = Real.log 512 + Real.log ((↑n : ℝ) / 512) := by
513	linarith [Real.log_div (ne_of_gt hn_pos) (by norm_num : (512:ℝ) ≠ 0)]
514	rw [hlog_split]
515	have h1 : Real.log (512 : ℝ) ≤ 9 := by
516	rw [show (512:ℝ) = 2^(9:ℕ) from by norm_num, Real.log_pow]
517	have hlog2 : Real.log 2 ≤ 2 - 1 := Real.log_le_sub_one_of_pos (by norm_num)
518	push_cast; nlinarith
519	linarith [Real.log_le_sub_one_of_pos hndiv_pos]
520	nlinarith [mul_le_mul_of_nonneg_left hlog_bound (show (0:ℝ) ≤ 3 * ↑n by positivity),
521	Real.log_nonneg (show (1:ℝ) ≤ ↑n by linarith)]
522	have hZ₀_lb : n / 4 ≤ Z₀.card := by
523	have h := (abs_le.mp (le_trans h_size h_sz)).1
524	have hR : (↑(n / 4) : ℝ) ≤ ↑Z₀.card := by
525	have : (↑(n / 4) : ℝ) * 4 ≤ ↑n := by exact_mod_cast Nat.div_mul_le_self n 4
526	linarith
527	exact_mod_cast hR
528	have hZ₀_ub : Z₀.card ≤ 3 * n / 4 := by
529	have h := (abs_le.mp (le_trans h_size h_sz)).2
530	have h4 : 4 * (↑Z₀.card : ℝ) ≤ 3 * ↑n := by linarith
531	have h4N : 4 * Z₀.card ≤ 3 * n := by exact_mod_cast h4
532	omega
533	-- Complement Z₁ has the same properties (sign flip in deviations)
534	set Z₁ := Finset.univ.filter (fun i : Fin n => ¬ω i) with hZ₁_def
535	have hZ₀Z₁ : Z₀.card + Z₁.card = n := by
536	have hZ₀Z₁_eq : Z₀ ∪ Z₁ = Finset.univ := by
537	ext x; simp [Z₀, Z₁, Finset.mem_union, Finset.mem_filter, em]
538	have hZ₀Z₁_disj : Disjoint Z₀ Z₁ := by
539	simp [Finset.disjoint_filter, Z₀, Z₁]
540	rw [← Finset.card_union_of_disjoint hZ₀Z₁_disj, hZ₀Z₁_eq]
541	simp [Fintype.card_fin]
542	have hZ₁_lb : n / 4 ≤ Z₁.card := by omega
543	have hTZ₁ : ∀ T : Finset (Fin n), T ∩ Z₁ = T.filter (fun i => ¬ω i) := by
544	intro T; ext x; simp [Z₁, Finset.mem_inter, Finset.mem_filter]
545	-- Partition lemma: T.filter(ω) + T.filter(¬ω) = T.card
546	have hTpart : ∀ T : Finset (Fin n),
547	(T.filter (fun i => ω i)).card + (T.filter (fun i => ¬ω i)).card = T.card := by
548	intro T
549	have h := @Finset.card_filter_add_card_filter_not (Fin n) T (fun i => ω i = true) _ _
550	convert h using 1
551	-- Helper: ratio_of_additive application for either choice of Z
552	-- Both Z₀ and Z₁ have the same additive deviations (sign flip for complement)
553	have hsn : Real.sqrt ↑n ≠ 0 := Real.sqrt_ne_zero'.mpr hn_pos
554	-- Algebraic simplification lemma
555	have halg : 4 * (Real.sqrt (2 * (↑d + 1) * ↑n * Real.log ↑n) +
556	Real.sqrt (3 * ↑n * Real.log ↑n)) / ↑n =
557	4 * (Real.sqrt (2 * (↑d + 1)) + Real.sqrt 3) * Real.sqrt (Real.log ↑n / ↑n) := by
558	have hn' : (↑n : ℝ) ≠ 0 := ne_of_gt hn_pos
559	have h1 : Real.sqrt (2 * (↑d + 1) * ↑n * Real.log ↑n) =
560	Real.sqrt (2 * (↑d + 1)) * (Real.sqrt ↑n * Real.sqrt (Real.log ↑n)) := by
561	rw [show 2 * (↑d + 1) * ↑n * Real.log ↑n =
562	(2 * (↑d + 1)) * (↑n * Real.log ↑n) from by ring,
563	Real.sqrt_mul (by positivity), Real.sqrt_mul (by positivity : (0:ℝ) ≤ ↑n)]
564	have h3 : Real.sqrt (3 * ↑n * Real.log ↑n) =
565	Real.sqrt 3 * (Real.sqrt ↑n * Real.sqrt (Real.log ↑n)) := by
566	rw [show 3 * ↑n * Real.log ↑n = 3 * (↑n * Real.log ↑n) from by ring,
567	Real.sqrt_mul (by norm_num : (0:ℝ) ≤ 3), Real.sqrt_mul (by positivity : (0:ℝ) ≤ ↑n)]
568	have hlog : Real.sqrt (Real.log ↑n / ↑n) = Real.sqrt (Real.log ↑n) / Real.sqrt ↑n :=
569	Real.sqrt_div' _ (by positivity : (0:ℝ) ≤ ↑n)
570	rw [h1, h3, hlog]; field_simp; rw [Real.sq_sqrt (by positivity : (0:ℝ) ≤ ↑n)]; ring
571	-- ℝ lower bounds (from additive control, not from ℕ division)
572	have hZ₀_lb_R : (↑n : ℝ) / 4 ≤ ↑Z₀.card :=
573	le_of_neg_le_neg (by linarith [(abs_le.mp (le_trans h_size h_sz)).1])
574	have hZ₁_lb_R : (↑n : ℝ) / 4 ≤ ↑Z₁.card := by
575	have : (↑Z₁.card : ℝ) = ↑n - ↑Z₀.card := by push_cast [← hZ₀Z₁]; ring
576	linarith [(abs_le.mp (le_trans h_size h_sz)).2]
577	have hTcard : ∀ T : Finset (Fin n), T.card ≤ n := by
578	intro T
579	calc T.card ≤ Finset.univ.card := Finset.card_le_card (Finset.subset_univ T)
580	_ = n := by simp [Fintype.card_fin]
581	-- Choose Z₀ if Z₀.card ≤ n/2, else Z₁
582	by_cases hZ₀_half : Z₀.card ≤ n / 2
583	· -- Use Z₀
584	refine ⟨Z₀, by omega, hZ₀_half, ?_⟩
585	intro T hT
586	have h_trace_T := h_trace T hT
587	rw [← hTZ₀] at h_trace_T
588	have := ratio_of_additive hn_pos (by linarith [hZ₀_lb_R] : (0:ℝ) < ↑Z₀.card)
589	(by exact_mod_cast hTcard T) (by positivity : (0:ℝ) ≤ ↑T.card)
590	hZ₀_lb_R h_trace_T h_size
591	linarith [halg]
592	· -- Use Z₁ (complement)
593	push_neg at hZ₀_half
594	have hZ₁_le : Z₁.card ≤ n / 2 := by omega
595	refine ⟨Z₁, by omega, hZ₁_le, ?_⟩
596	intro T hT
597	-- Complement size deviation: \|Z₁ - n/2\| = \|Z₀ - n/2\| (sign flip)
598	have h_size_Z₁ : \|(↑Z₁.card : ℝ) - ↑n / 2\| ≤ Real.sqrt (3 * ↑n * Real.log ↑n) := by
599	have hZ₁R : (↑Z₁.card : ℝ) = ↑n - ↑Z₀.card := by push_cast [← hZ₀Z₁]; ring
600	rw [hZ₁R]; rw [show (↑n : ℝ) - ↑Z₀.card - ↑n / 2 = -(↑Z₀.card - ↑n / 2) from by ring]
601	rw [abs_neg]; exact h_size
602	-- Complement trace deviation: \|T∩Z₁ - T/2\| = \|T∩Z₀ - T/2\| (sign flip)
603	have h_trace_T : \|((T ∩ Z₁).card : ℝ) - ↑T.card / 2\| ≤
604	Real.sqrt (2 * (↑d + 1) * ↑n * Real.log ↑n) := by
605	have hpart := hTpart T
606	rw [← hTZ₀, ← hTZ₁] at hpart
607	have hpart_R : ((T ∩ Z₁).card : ℝ) = ↑T.card - ↑(T ∩ Z₀).card := by
608	push_cast [← hpart]; ring
609	rw [hpart_R]
610	rw [show (↑T.card : ℝ) - ↑(T ∩ Z₀).card - ↑T.card / 2 =
611	-(↑(T ∩ Z₀).card - ↑T.card / 2) from by ring]
612	rw [abs_neg]
613	have := h_trace T hT; rwa [← hTZ₀] at this
614	have := ratio_of_additive hn_pos (by linarith [hZ₁_lb_R] : (0:ℝ) < ↑Z₁.card)
615	(by exact_mod_cast hTcard T) (by positivity : (0:ℝ) ≤ ↑T.card)
616	hZ₁_lb_R h_trace_T h_size_Z₁
617	linarith [halg]
618
619	/-- For traces of a family on Y, the density deviation is at most 1 when Z ⊆ Y. -/
620	private lemma trace_deviation_le_one {α : Type*} [DecidableEq α]
621	{𝒜 : Finset (Finset α)} {Y Z : Finset α} (hZY : Z ⊆ Y) (hZ : 0 < Z.card)
622	{T : Finset α} (hT : T ∈ Catalog.VC.ShatterFunction.trace 𝒜 Y) :
623	\|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / Y.card\| ≤ 1 := by
624	have hTY : T ⊆ Y := by
625	simp only [Catalog.VC.ShatterFunction.trace, Finset.mem_image] at hT
626	obtain ⟨S, _, rfl⟩ := hT
627	exact Finset.inter_subset_right
628	exact density_deviation_le_one hTY hZY hZ
629
630	/-- Trace-level version of the random halving step.
631	The constant `c` is chosen uniformly for all set sizes by combining:
632	- For large Y (\|Y\| ≥ N(d)): the probabilistic argument from
633	`exists_good_half_subset_large`.
634	- For small Y (2 ≤ \|Y\| < N): the trivial bound \|deviation\| ≤ 1, absorbed into
635	the constant since √(log\|Y\|/\|Y\|) is bounded below for \|Y\| in this range.
636
637	The wrapper `random_halving_step` then lifts this to the original family
638	by `relativeApprox_of_trace`. -/
639	private lemma random_halving_trace_step (d : ℕ) :
640	∃ c : ℝ, 0 < c ∧
641	∀ {α : Type*} [DecidableEq α] [Fintype α]
642	(𝒜 : Finset (Finset α)) (hd : 𝒜.vcDim ≤ d) (Y : Finset α),
643	2 ≤ Y.card →
644	∃ Z : Finset α, Z ⊆ Y ∧ 0 < Z.card ∧ Z.card ≤ Y.card / 2 ∧
645	∀ T ∈ Catalog.VC.ShatterFunction.trace 𝒜 Y,
646	\|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / Y.card\| ≤
647	c * Real.sqrt (Real.log (Y.card : ℝ) / Y.card) := by
648	-- Get probabilistic constant and threshold for large sets
649	obtain ⟨c_prob, N, hc_prob, hN, h_large⟩ := exists_good_half_subset_large d
650	-- For small Y (2 ≤ \|Y\| < N): \|deviation\| ≤ 1 ≤ c_small · √(log\|Y\|/\|Y\|)
651	-- when c_small = √(N / log 2), since N·log\|Y\| ≥ \|Y\|·log 2 for \|Y\| < N.
652	have hlog2_pos : (0 : ℝ) < Real.log 2 := Real.log_pos (by norm_num)
653	set c_small : ℝ := Real.sqrt (↑N / Real.log 2) with hc_small_def
654	have hc_small_pos : 0 < c_small := by
655	rw [hc_small_def]
656	exact Real.sqrt_pos.mpr (div_pos (Nat.cast_pos.mpr (by omega)) hlog2_pos)
657	-- Choose c = max(c_prob, c_small)
658	refine ⟨max c_prob c_small, lt_max_of_lt_left hc_prob, ?_⟩
659	intro α _ _ 𝒜 hd Y hY
660	by_cases hYN : N ≤ Y.card
661	· -- Large Y: transfer to Fin Y.card via embedding f : Fin Y.card ↪ α with image Y.
662	set n := Y.card with hn_def
663	have hn_pos : 0 < n := by omega
664	-- Embedding Fin n ↪ α with range = Y, via Y.equivFin.symm composed with subtype.
665	let e : Fin n ≃ ↥Y := Y.equivFin.symm
666	let f : Fin n ↪ α :=
667	e.toEmbedding.trans (Function.Embedding.subtype (· ∈ Y))
668	have hf_range : ∀ i, f i ∈ Y := fun i => (e i).2
669	have hf_inj : Function.Injective f := f.injective
670	-- For any T ⊆ Y, T = (preimage f) mapped back, so cardinality is preserved.
671	have h_round : ∀ T : Finset α, T ⊆ Y →
672	(T.preimage f hf_inj.injOn).map f = T := by
673	intro T hTY
674	ext x
675	simp only [Finset.mem_map, Finset.mem_preimage]
676	refine ⟨?_, fun hx => ?_⟩
677	· rintro ⟨i, hi, rfl⟩; exact hi
678	· refine ⟨e.symm ⟨x, hTY hx⟩, ?_, ?_⟩
679	· show f (e.symm ⟨x, hTY hx⟩) ∈ T
680	have : f (e.symm ⟨x, hTY hx⟩) = x := by
681	simp [f, e, Function.Embedding.trans_apply, Equiv.toEmbedding_apply]
682	rw [this]; exact hx
683	· simp [f, e, Function.Embedding.trans_apply, Equiv.toEmbedding_apply]
684	have h_card_pre : ∀ T : Finset α, T ⊆ Y →
685	(T.preimage f (hf_inj.injOn)).card = T.card := by
686	intro T hTY
687	have h := congrArg Finset.card (h_round T hTY)
688	rwa [Finset.card_map] at h
689	-- Transfer the trace family.
690	let toFin : Finset α → Finset (Fin n) :=
691	fun T => T.preimage f (hf_inj.injOn)
692	let family' : Finset (Finset (Fin n)) :=
693	(Catalog.VC.ShatterFunction.trace 𝒜 Y).image toFin
694	have hfam_card : family'.card ≤ Catalog.VC.ShatterFunctionLemma.binomialSum d n := by
695	calc family'.card
696	≤ (Catalog.VC.ShatterFunction.trace 𝒜 Y).card := Finset.card_image_le
697	_ ≤ _ := trace_card_le 𝒜 hd Y
698	obtain ⟨Z'_fin, hZ'_pos, hZ'_half, hZ'_prop⟩ :=
699	h_large n hYN family' hfam_card
700	-- Pull back Z'_fin to Z ⊆ Y.
701	let Z : Finset α := Z'_fin.map f
702	have hZ_sub_Y : Z ⊆ Y := by
703	intro x hx
704	simp only [Z, Finset.mem_map] at hx
705	obtain ⟨i, _, rfl⟩ := hx
706	exact hf_range i
707	have hZ_card : Z.card = Z'_fin.card := by simp [Z]
708	refine ⟨Z, hZ_sub_Y, hZ_card.symm ▸ hZ'_pos, hZ_card.symm ▸ hZ'_half, ?_⟩
709	intro T hT
710	have hTY : T ⊆ Y := by
711	simp only [Catalog.VC.ShatterFunction.trace, Finset.mem_image] at hT
712	obtain ⟨S, _, rfl⟩ := hT
713	exact Finset.inter_subset_right
714	have hTfam : toFin T ∈ family' := Finset.mem_image.mpr ⟨T, hT, rfl⟩
715	have hT_card : (toFin T).card = T.card := h_card_pre T hTY
716	-- T ∩ Z = (toFin T ∩ Z'_fin).map f
717	have h_int : T ∩ Z = (toFin T ∩ Z'_fin).map f := by
718	ext x
719	simp only [Finset.mem_inter, Finset.mem_map, toFin, Finset.mem_preimage, Z]
720	constructor
721	· rintro ⟨hxT, ⟨i, hi, rfl⟩⟩
722	exact ⟨i, ⟨hxT, hi⟩, rfl⟩
723	· rintro ⟨i, ⟨hi1, hi2⟩, rfl⟩
724	exact ⟨hi1, ⟨i, hi2, rfl⟩⟩
725	have h_int_card : (T ∩ Z).card = ((toFin T) ∩ Z'_fin).card := by
726	rw [h_int, Finset.card_map]
727	have hprop := hZ'_prop _ hTfam
728	rw [hT_card, ← hZ_card, ← h_int_card] at hprop
729	calc \|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / ↑n\|
730	≤ c_prob * Real.sqrt (Real.log ↑n / ↑n) := hprop
731	_ ≤ max c_prob c_small * Real.sqrt (Real.log ↑n / ↑n) := by
732	gcongr; exact le_max_left _ _
733	· -- Small Y (2 ≤ Y.card < N): use trivial bound
734	push_neg at hYN
735	obtain ⟨Z, hZY, hZpos, hZhalf⟩ := exists_half_subset Y hY
736	refine ⟨Z, hZY, hZpos, hZhalf, ?_⟩
737	intro T hT
738	have hdev := trace_deviation_le_one hZY hZpos hT
739	-- Show: 1 ≤ max(c_prob, c_small) · √(log\|Y\|/\|Y\|)
740	-- Since max ≥ c_small and c_small · √(log\|Y\|/\|Y\|) ≥ 1
741	have hYcard_pos : (0 : ℝ) < Y.card := Nat.cast_pos.mpr (by omega)
742	have hlogY : Real.log 2 ≤ Real.log (↑Y.card) :=
743	Real.log_le_log (by positivity) (by exact_mod_cast hY)
744	have hN_ge_Y : (Y.card : ℝ) < ↑N := by exact_mod_cast hYN
745	-- Key: c_small² · (log\|Y\|/\|Y\|) = (N/log 2) · (log\|Y\|/\|Y\|) ≥ N/\|Y\| > 1
746	have h_prod_ge : c_small * Real.sqrt (Real.log (↑Y.card) / ↑Y.card) ≥ 1 := by
747	rw [hc_small_def, ← Real.sqrt_mul (by positivity : (0 : ℝ) ≤ ↑N / Real.log 2)]
748	rw [show (1 : ℝ) = Real.sqrt 1 from (Real.sqrt_one).symm]
749	apply Real.sqrt_le_sqrt
750	have : ↑N / Real.log 2 * (Real.log (↑Y.card) / ↑Y.card) =
751	↑N * Real.log (↑Y.card) / (Real.log 2 * ↑Y.card) := by ring
752	rw [this]
753	rw [le_div_iff₀ (mul_pos hlog2_pos hYcard_pos)]
754	nlinarith [hlogY, hN_ge_Y.le, hYcard_pos, hlog2_pos]
755	calc \|((T ∩ Z).card : ℝ) / Z.card - (T.card : ℝ) / Y.card\|
756	≤ 1 := hdev
757	_ ≤ c_small * Real.sqrt (Real.log (↑Y.card) / ↑Y.card) := h_prod_ge
758	_ ≤ max c_prob c_small * Real.sqrt (Real.log (↑Y.card) / ↑Y.card) := by
759	gcongr
760	exact le_max_right _ _
761
762	/-- Planned one-step helper for the repeated-halving proof.
763	It expresses the source's passage from a current ground set `Y` to a smaller
764	subset `Z` that approximates densities on `Y`. -/
765	lemma random_halving_step (d : ℕ) :
766	∃ c : ℝ, 0 < c ∧
767	∀ {α : Type*} [DecidableEq α] [Fintype α]
768	(𝒜 : Finset (Finset α)) (hd : 𝒜.vcDim ≤ d) (Y : Finset α),
769	2 ≤ Y.card →
770	∃ Z : Finset α, Z ⊆ Y ∧ 0 < Z.card ∧ Z.card ≤ Y.card / 2 ∧
771	IsRelativeApprox 𝒜 Y Z
772	(c * Real.sqrt (Real.log (Y.card : ℝ) / Y.card)) := by
773	rcases random_halving_trace_step d with ⟨c, hc, hstep⟩
774	refine ⟨c, hc, ?_⟩
775	intro α _ _ 𝒜 hd Y hY
776	rcases hstep 𝒜 hd Y hY with ⟨Z, hZY, hZpos, hZhalf, htrace⟩
777	refine ⟨Z, hZY, hZpos, hZhalf, relativeApprox_of_trace 𝒜 Y Z hZY htrace⟩
778
779	/-- Planned summation helper for the repeated-halving iteration.
780	It packages the geometric tail estimate used at the end of Matousek Lemma 5.13. -/
781	lemma geometric_error_sum :
782	∃ Cgeom : ℝ, 0 < Cgeom ∧
783	∀ n : ℕ, 2 ≤ n →
784	Finset.sum (Finset.range n) (fun i =>
785	Real.sqrt (Real.log ((2 : ℝ) ^ (n - i)) / ((2 : ℝ) ^ (n - i)))) ≤
786	Cgeom * Real.sqrt (Real.log (2 : ℝ) / 2) := by
787	refine ⟨10, by positivity, ?_⟩
788	intro n hn
789	let b : ℕ → ℝ := fun m =>
790	Real.sqrt (Real.log ((2 : ℝ) ^ m) / ((2 : ℝ) ^ m))
791	let a : ℕ → ℝ := fun k => b (k + 1)
792	have hb0 : b 0 = 0 := by
793	dsimp [b]
794	simp
795	have ha0 : a 0 = Real.sqrt (Real.log (2 : ℝ) / 2) := by
796	dsimp [a, b]
797	simp
798	have ha1 : a 1 = Real.sqrt (Real.log (2 : ℝ) / 2) := by
799	dsimp [a, b]
800	rw [Real.log_pow]
801	congr 1
802	ring
803	have ha2 : a 2 ≤ Real.sqrt (Real.log (2 : ℝ) / 2) := by
804	dsimp [a, b]
805	apply Real.sqrt_le_sqrt
806	rw [Real.log_pow]
807	have hlog : 3 * Real.log (2 : ℝ) / ((2 : ℝ) ^ 3) ≤ Real.log (2 : ℝ) / 2 := by
808	have hpos : 0 < Real.log (2 : ℝ) := Real.log_pos (by norm_num)
809	nlinarith
810	simpa using hlog
811	have hforward :
812	Finset.sum (Finset.range n) (fun i => b (n - i)) =
813	Finset.sum (Finset.range n) (fun k => a k) := by
814	have hflip := Finset.sum_flip (f := b) (n := n)
815	rw [Finset.sum_range_succ, Finset.sum_range_succ'] at hflip
816	simpa [a, hb0] using hflip
817	have h_nonneg : ∀ k : ℕ, 0 ≤ a k := by
818	intro k
819	exact Real.sqrt_nonneg _
820	have h_extend :
821	Finset.sum (Finset.range n) (fun k => a k) ≤
822	Finset.sum (Finset.range (2 * (n / 2 + 1))) (fun k => a k) := by
823	apply Finset.sum_le_sum_of_subset_of_nonneg
824	· intro x hx
825	simp at hx ⊢
826	omega
827	· intro x hx hxN
828	exact h_nonneg x
829	have h_pairs : ∀ m : ℕ,
830	Finset.sum (Finset.range (2 * (m + 1))) a =
831	a 0 + a 1 + Finset.sum (Finset.range m) (fun t => a (2 * t + 2) + a (2 * t + 3)) := by
832	intro m
833	induction m with
834	\| zero =>
835	norm_num [Finset.sum_range_succ]
836	\| succ m ihm =>
837	rw [show 2 * (m.succ + 1) = 2 * (m + 1) + 2 by omega, Finset.sum_range_add, ihm]
838	have htwo : ∑ x ∈ Finset.range 2, a (2 * (m + 1) + x) = a (2 * m + 2) + a (2 * m + 3) := by
839	rw [Finset.sum_range_succ, Finset.sum_range_succ]
840	simp
841	ring_nf
842	rw [htwo]
843	have htail :
844	a (2 * m + 2) + a (2 * m + 3) +
845	Finset.sum (Finset.range m) (fun t => a (2 * t + 2) + a (2 * t + 3)) =
846	Finset.sum (Finset.range (m + 1)) (fun t => a (2 * t + 2) + a (2 * t + 3)) := by
847	simpa [add_assoc, add_left_comm, add_comm, Nat.mul_comm, Nat.mul_left_comm, Nat.mul_assoc] using
848	(Finset.sum_range_succ_comm (f := fun t => a (2 * t + 2) + a (2 * t + 3)) m).symm
849	linarith
850	have hb_even : ∀ t : ℕ,
851	b (2 * t + 2) ≤ (3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2) := by
852	intro t
853	induction t with
854	\| zero =>
855	exact le_of_eq (by simpa [a] using ha1)
856	\| succ t iht =>
857	have hdec := dyadic_error_decay_two_steps (m := 2 * t + 2) (by omega)
858	have hEq : 2 * t.succ + 2 = 2 * t + 4 := by omega
859	rw [hEq]
860	calc
861	b (2 * t + 4) ≤ (3 / 4 : ℝ) * b (2 * t + 2) := hdec
862	_ ≤ (3 / 4 : ℝ) * ((3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2)) := by
863	gcongr
864	_ = (3 / 4 : ℝ) ^ t.succ * Real.sqrt (Real.log (2 : ℝ) / 2) := by
865	rw [pow_succ]
866	ring
867	have hb_odd : ∀ t : ℕ,
868	b (2 * t + 3) ≤ (3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2) := by
869	intro t
870	induction t with
871	\| zero =>
872	simpa [a] using ha2
873	\| succ t iht =>
874	have hdec := dyadic_error_decay_two_steps (m := 2 * t + 3) (by omega)
875	have hEq : 2 * t.succ + 3 = 2 * t + 5 := by omega
876	rw [hEq]
877	calc
878	b (2 * t + 5) ≤ (3 / 4 : ℝ) * b (2 * t + 3) := hdec
879	_ ≤ (3 / 4 : ℝ) * ((3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2)) := by
880	gcongr
881	_ = (3 / 4 : ℝ) ^ t.succ * Real.sqrt (Real.log (2 : ℝ) / 2) := by
882	rw [pow_succ]
883	ring
884	have hpair_bound : ∀ t : ℕ,
885	a (2 * t + 2) + a (2 * t + 3) ≤
886	2 * ((3 / 4 : ℝ) ^ t) * Real.sqrt (Real.log (2 : ℝ) / 2) := by
887	intro t
888	have h1 : a (2 * t + 2) ≤ (3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2) := by
889	simpa [a, Nat.add_assoc, Nat.mul_comm, Nat.mul_left_comm, Nat.mul_assoc] using hb_odd t
890	have h2 : a (2 * t + 3) ≤ (3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2) := by
891	have h2raw : b (2 * (t + 1) + 2) ≤ (3 / 4 : ℝ) ^ (t + 1) * Real.sqrt (Real.log (2 : ℝ) / 2) :=
892	hb_even (t + 1)
893	have hEq : 2 * (t + 1) + 2 = 2 * t + 4 := by omega
894	rw [hEq] at h2raw
895	have hpow : (3 / 4 : ℝ) ^ (t + 1) * Real.sqrt (Real.log (2 : ℝ) / 2) ≤
896	(3 / 4 : ℝ) ^ t * Real.sqrt (Real.log (2 : ℝ) / 2) := by
897	have hpow' : (3 / 4 : ℝ) ^ (t + 1) ≤ (3 / 4 : ℝ) ^ t := by
898	rw [pow_succ]
899	have hnonneg : 0 ≤ (3 / 4 : ℝ) ^ t := pow_nonneg (by norm_num) t
900	nlinarith
901	gcongr
902	exact le_trans h2raw hpow
903	linarith
904	have hgeom : ∀ m : ℕ,
905	Finset.sum (Finset.range m) (fun t =>
906	2 * ((3 / 4 : ℝ) ^ t) * Real.sqrt (Real.log (2 : ℝ) / 2)) ≤
907	8 * Real.sqrt (Real.log (2 : ℝ) / 2) := by
908	intro m
909	have hs : ∑ t ∈ Finset.range m, ((3 / 4 : ℝ) ^ t) ≤ 4 := by
910	have hs' :=
911	geom_sum_Ico_le_of_lt_one (x := (3 / 4 : ℝ)) (m := 0) (n := m) (by positivity) (by norm_num)
912	norm_num at hs' ⊢
913	simpa using hs'
914	calc
915	Finset.sum (Finset.range m) (fun t =>
916	2 * ((3 / 4 : ℝ) ^ t) * Real.sqrt (Real.log (2 : ℝ) / 2)) =
917	Finset.sum (Finset.range m) (fun t =>
918	(2 * Real.sqrt (Real.log (2 : ℝ) / 2)) * ((3 / 4 : ℝ) ^ t)) := by
919	congr with t
920	ring
921	_ =
922	(2 * Real.sqrt (Real.log (2 : ℝ) / 2)) *
923	(∑ t ∈ Finset.range m, ((3 / 4 : ℝ) ^ t)) := by
924	rw [Finset.mul_sum]
925	_ ≤ (2 * Real.sqrt (Real.log (2 : ℝ) / 2)) * 4 := by
926	have hfac : 0 ≤ 2 * Real.sqrt (Real.log (2 : ℝ) / 2) := by positivity
927	exact mul_le_mul_of_nonneg_left hs hfac
928	_ = 8 * Real.sqrt (Real.log (2 : ℝ) / 2) := by
929	ring
930	calc
931	Finset.sum (Finset.range n) (fun i =>
932	Real.sqrt (Real.log ((2 : ℝ) ^ (n - i)) / ((2 : ℝ) ^ (n - i)))) =
933	Finset.sum (Finset.range n) (fun k => a k) := hforward
934	_ ≤ Finset.sum (Finset.range (2 * (n / 2 + 1))) (fun k => a k) := h_extend
935	_ = a 0 + a 1 + Finset.sum (Finset.range (n / 2)) (fun t => a (2 * t + 2) + a (2 * t + 3)) := by
936	simpa [h_pairs, Nat.add_assoc, Nat.mul_comm, Nat.mul_left_comm, Nat.mul_assoc]
937	_ ≤ Real.sqrt (Real.log (2 : ℝ) / 2) + Real.sqrt (Real.log (2 : ℝ) / 2) +
938	Finset.sum (Finset.range (n / 2)) (fun t =>
939	2 * ((3 / 4 : ℝ) ^ t) * Real.sqrt (Real.log (2 : ℝ) / 2)) := by
940	have hsum :
941	Finset.sum (Finset.range (n / 2)) (fun t => a (2 * t + 2) + a (2 * t + 3)) ≤
942	Finset.sum (Finset.range (n / 2)) (fun t =>
943	2 * ((3 / 4 : ℝ) ^ t) * Real.sqrt (Real.log (2 : ℝ) / 2)) := by
944	exact Finset.sum_le_sum (fun t ht => hpair_bound t)
945	linarith [le_of_eq ha0, le_of_eq ha1, hsum]
946	_ ≤ Real.sqrt (Real.log (2 : ℝ) / 2) + Real.sqrt (Real.log (2 : ℝ) / 2) +
947	8 * Real.sqrt (Real.log (2 : ℝ) / 2) := by
948	gcongr
949	exact hgeom (n / 2)
950	_ = 10 * Real.sqrt (Real.log (2 : ℝ) / 2) := by
951	ring
952
953	/-- `Finset.univ` is a `0`-approximation for any family. -/
954	private lemma univ_isEpsilonApprox {α : Type*} [DecidableEq α] [Fintype α]
955	(𝒜 : Finset (Finset α)) :
956	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 0 Finset.univ := by
957	intro S _
958	simp [Finset.inter_univ, Finset.card_univ]
959
960	/-- Monotonicity of `IsEpsilonApprox` in the tolerance parameter. -/
961	private lemma isEpsilonApprox_mono {α : Type*} [DecidableEq α] [Fintype α]
962	{𝒜 : Finset (Finset α)} {Y : Finset α} {ε₁ ε₂ : ℝ}
963	(h : Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 ε₁ Y) (hε : ε₁ ≤ ε₂) :
964	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 ε₂ Y := fun S hS =>
965	le_trans (h S hS) hε
966
967	/-- The halving iteration: starting from `Finset.univ` (a 0-approximation),
968	repeatedly apply `random_halving_step` until the size drops below `threshold`.
969
970	The accumulated error is bounded by `K · c · √(log m / m)` where `m` is
971	the threshold, using the fact that the error terms
972	`c · √(log\|Yᵢ\|/\|Yᵢ\|)` along the halving chain sum to at most
973	`K · c · √(log m / m)` (the terms decay because `√(log x / x)` is
974	eventually decreasing and sizes at least double going backwards).
975
976	Proof strategy: by strong induction on `Fintype.card α`.
977	- If `Fintype.card α ≤ threshold`: `Finset.univ` works.
978	- Otherwise: apply `random_halving_step` to get `W` with `\|W\| ≤ \|univ\|/2`,
979	and use `approx_transitive` to compose the step error with the recursive
980	error. The total error is bounded by the analytic sum bound. -/
981	private lemma iterate_halving_approx {c : ℝ} (hc : 0 ≤ c) {d : ℕ}
982	{α : Type*} [DecidableEq α] [Fintype α]
983	(step : ∀ (𝒜 : Finset (Finset α)), 𝒜.vcDim ≤ d → ∀ Y : Finset α, 2 ≤ Y.card →
984	∃ Z, Z ⊆ Y ∧ 0 < Z.card ∧ Z.card ≤ Y.card / 2 ∧
985	IsRelativeApprox 𝒜 Y Z (c * Real.sqrt (Real.log (↑Y.card) / ↑Y.card)))
986	(𝒜 : Finset (Finset α)) (hd : 𝒜.vcDim ≤ d) (threshold : ℕ) (ht : 1 ≤ threshold)
987	(B : ℕ → ℝ) (hB_nonneg : ∀ n, 0 ≤ B n)
988	(hB_step : ∀ n m : ℕ, threshold < n → 2 ≤ n → m ≤ n / 2 →
989	c * Real.sqrt (Real.log (n : ℝ) / n) + B m ≤ B n) :
990	∀ (Y₀ : Finset α), 0 < Y₀.card →
991	∀ ε₀ : ℝ, 0 ≤ ε₀ →
992	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 ε₀ Y₀ →
993	∃ Z : Finset α, Z ⊆ Y₀ ∧ 0 < Z.card ∧ Z.card ≤ threshold ∧
994	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 (ε₀ + B Y₀.card) Z := by
995	-- Strong induction on Y₀.card.
996	suffices h : ∀ (n : ℕ) (Y₀ : Finset α), Y₀.card = n → 0 < n →
997	∀ ε₀ : ℝ, 0 ≤ ε₀ →
998	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 ε₀ Y₀ →
999	∃ Z : Finset α, Z ⊆ Y₀ ∧ 0 < Z.card ∧ Z.card ≤ threshold ∧
1000	Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 (ε₀ + B Y₀.card) Z by
1001	intro Y₀ hY₀ ε₀ hε₀ hYε
1002	exact h Y₀.card Y₀ rfl hY₀ ε₀ hε₀ hYε
1003	intro n
1004	induction n using Nat.strong_induction_on with
1005	\| _ n ih =>
1006	intro Y₀ hYn hYpos ε₀ hε₀ hYε
1007	have hYpos' : 0 < Y₀.card := hYn ▸ hYpos
1008	by_cases hcase : n ≤ threshold
1009	· -- Base case: Y₀ already at or below threshold.
1010	refine ⟨Y₀, subset_refl _, hYpos', hYn ▸ hcase, ?_⟩
1011	exact isEpsilonApprox_mono hYε (by linarith [hB_nonneg Y₀.card])
1012	· -- Inductive case: halve Y₀.
1013	push_neg at hcase
1014	have hYcard_ge : 2 ≤ Y₀.card := by rw [hYn]; omega
1015	obtain ⟨W, hWY, hWpos, hWhalf, hWrel⟩ := step 𝒜 hd Y₀ hYcard_ge
1016	have hWlt : W.card < n := by
1017	rw [← hYn]
1018	exact lt_of_le_of_lt hWhalf (Nat.div_lt_self (by omega) (by norm_num))
1019	have hWnewε : Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜
1020	(ε₀ + c * Real.sqrt (Real.log (Y₀.card : ℝ) / Y₀.card)) W :=
1021	approx_transitive 𝒜 hYε hWrel
1022	have hsqrt_nonneg : 0 ≤ c * Real.sqrt (Real.log (Y₀.card : ℝ) / Y₀.card) :=
1023	mul_nonneg hc (Real.sqrt_nonneg _)
1024	have hε_new_nonneg : 0 ≤ ε₀ + c * Real.sqrt (Real.log (Y₀.card : ℝ) / Y₀.card) := by
1025	linarith
1026	obtain ⟨Z, hZW, hZpos, hZthresh, hZε⟩ :=
1027	ih W.card hWlt W rfl hWpos _ hε_new_nonneg hWnewε
1028	refine ⟨Z, hZW.trans hWY, hZpos, hZthresh, ?_⟩
1029	-- Combine: total error so far ≤ ε₀ + B Y₀.card via hB_step.
1030	have hbound :
1031	c * Real.sqrt (Real.log (Y₀.card : ℝ) / Y₀.card) + B W.card ≤ B Y₀.card :=
1032	hB_step Y₀.card W.card (by rw [hYn]; exact hcase) hYcard_ge hWhalf
1033	refine isEpsilonApprox_mono hZε ?_
1034	linarith
1035
1036	/-- Helper: monotonicity of `√(log x / x)` on `[3, ∞)`. -/
1037	private lemma sqrt_log_div_antitone {a b : ℝ} (ha : 3 ≤ a) (hab : a ≤ b) :
1038	Real.sqrt (Real.log b / b) ≤ Real.sqrt (Real.log a / a) := by
1039	apply Real.sqrt_le_sqrt
1040	have hexp_le : Real.exp 1 ≤ a := le_of_lt (lt_of_lt_of_le Real.exp_one_lt_three ha)
1041	exact Real.log_div_self_antitoneOn hexp_le (le_trans hexp_le hab) hab
1042
1043	/-- Analytic geometric tail estimate along a dyadic chain.
1044	For an absolute constant `Kchain`, for any threshold `T ≥ 3` and any `L`,
1045	`∑_{j=0}^{L-1} √(log(T·2^j)/(T·2^j)) ≤ Kchain · √(log T / T)`.
1046
1047	This is the geometric-decay analog of `geometric_error_sum`,
1048	parameterized by an arbitrary base `T` rather than `2`.
1049	The sum converges because `√(log(T·2^j)/(T·2^j))` decays like
1050	`2^{-j/2} · √(log(T·2^j))`, and the logarithmic factor is dominated
1051	by the geometric decay. -/
1052	private lemma dyadic_chain_geometric_bound :
1053	∃ Kchain : ℝ, 0 < Kchain ∧ ∀ T : ℕ, 4 ≤ T → ∀ L : ℕ,
1054	∑ j ∈ Finset.range L,
1055	Real.sqrt (Real.log ((T : ℝ) * 2^j) / ((T : ℝ) * 2^j))
1056	≤ Kchain * Real.sqrt (Real.log T / T) := by
1057	refine ⟨10, by norm_num, ?_⟩
1058	intro T hT L
1059	have hT_pos : (0 : ℝ) < T := by exact_mod_cast (by omega : 0 < T)
1060	have hT_ge4 : (4 : ℝ) ≤ (T : ℝ) := by exact_mod_cast hT
1061	have hT_ge3 : (3 : ℝ) ≤ (T : ℝ) := by linarith
1062	set f : ℕ → ℝ := fun j =>
1063	Real.sqrt (Real.log ((T : ℝ) * 2^j) / ((T : ℝ) * 2^j)) with hf_def
1064	have hf_nn : ∀ j, 0 ≤ f j := fun j => Real.sqrt_nonneg _
1065	have hXpos : ∀ j : ℕ, (0 : ℝ) < (T : ℝ) * 2^j := fun j => by positivity
1066	have hXge4 : ∀ j : ℕ, (4 : ℝ) ≤ (T : ℝ) * 2^j := fun j => by
1067	have h1 : (1 : ℝ) ≤ (2 : ℝ)^j := one_le_pow₀ (by norm_num : (1:ℝ) ≤ 2)
1068	nlinarith
1069	-- f(0) = √(log T / T)
1070	have hf0 : f 0 = Real.sqrt (Real.log T / T) := by
1071	simp [f]
1072	-- Two-step decay: f(j+2) ≤ (3/4) f(j)
1073	have hdecay : ∀ j : ℕ, f (j+2) ≤ (3/4 : ℝ) * f j := by
1074	intro j
1075	have hXg := hXge4 j
1076	have hX := hXpos j
1077	have hlogX_pos : 0 < Real.log ((T : ℝ) * 2^j) := by
1078	apply Real.log_pos; linarith
1079	have hlogX_ge_log4 : Real.log 4 ≤ Real.log ((T : ℝ) * 2^j) :=
1080	Real.log_le_log (by norm_num) hXg
1081	have hpow_eq : ((T : ℝ) * 2^(j+2)) = 4 * ((T : ℝ) * 2^j) := by
1082	rw [pow_add]; ring
1083	have h4Xpos : (0 : ℝ) < 4 * ((T : ℝ) * 2^j) := by positivity
1084	have hbase :
1085	Real.log ((T : ℝ) * 2^(j+2)) / ((T : ℝ) * 2^(j+2))
1086	≤ ((3/4 : ℝ)^2) * (Real.log ((T : ℝ) * 2^j) / ((T : ℝ) * 2^j)) := by
1087	rw [hpow_eq, Real.log_mul (by norm_num : (4:ℝ) ≠ 0) (ne_of_gt hX)]
1088	rw [div_le_iff₀ h4Xpos]
1089	have hX_ne : ((T : ℝ) * 2^j) ≠ 0 := ne_of_gt hX
1090	rw [show ((3/4 : ℝ))^2 * (Real.log ((T:ℝ) * 2^j) / ((T:ℝ) * 2^j)) * (4 * ((T:ℝ) * 2^j))
1091	= (9/4 : ℝ) * Real.log ((T:ℝ) * 2^j) from by
1092	field_simp; ring]
1093	have hlog4_pos : 0 < Real.log 4 := Real.log_pos (by norm_num)
1094	linarith [hlogX_ge_log4, hlog4_pos]
1095	have hsqrt34 : Real.sqrt ((3/4:ℝ)^2) = (3/4:ℝ) := by
1096	rw [Real.sqrt_sq_eq_abs]; norm_num
1097	show f (j+2) ≤ (3/4 : ℝ) * f j
1098	calc f (j+2)
1099	≤ Real.sqrt (((3/4:ℝ)^2) * (Real.log ((T:ℝ)2^j) / ((T:ℝ)2^j))) :=
1100	Real.sqrt_le_sqrt hbase
1101	_ = Real.sqrt ((3/4:ℝ)^2) * Real.sqrt (Real.log ((T:ℝ)2^j) / ((T:ℝ)2^j)) := by
1102	rw [Real.sqrt_mul (by positivity)]
1103	_ = (3/4 : ℝ) * f j := by rw [hsqrt34]
1104	-- f(1) ≤ f(0)
1105	have hf1_le_f0 : f 1 ≤ f 0 := by
1106	show Real.sqrt (Real.log ((T:ℝ) * 2^1) / ((T:ℝ) * 2^1)) ≤
1107	Real.sqrt (Real.log ((T:ℝ) * 2^0) / ((T:ℝ) * 2^0))
1108	simp only [pow_zero, pow_one, mul_one]
1109	exact sqrt_log_div_antitone hT_ge3 (by linarith)
1110	-- f(2k) ≤ (3/4)^k f(0)
1111	have hf_even : ∀ k, f (2k) ≤ (3/4 : ℝ)^k f 0 := by
1112	intro k
1113	induction k with
1114	\| zero => simp
1115	\| succ k ih =>
1116	have heq : 2 * (k+1) = 2*k + 2 := by ring
1117	rw [heq]
1118	have h34_nn : (0 : ℝ) ≤ 3/4 := by norm_num
1119	calc f (2*k+2)
1120	≤ (3/4 : ℝ) * f (2k) := hdecay (2k)
1121	_ ≤ (3/4 : ℝ) * ((3/4 : ℝ)^k * f 0) := by
1122	have := mul_le_mul_of_nonneg_left ih h34_nn
1123	linarith
1124	_ = (3/4 : ℝ)^(k+1) * f 0 := by rw [pow_succ]; ring
1125	-- f(2k+1) ≤ (3/4)^k f(0)
1126	have hf_odd : ∀ k, f (2k+1) ≤ (3/4 : ℝ)^k f 0 := by
1127	intro k
1128	induction k with
1129	\| zero => simpa using hf1_le_f0
1130	\| succ k ih =>
1131	have heq : 2 * (k+1) + 1 = (2*k+1) + 2 := by ring
1132	rw [heq]
1133	have h34_nn : (0 : ℝ) ≤ 3/4 := by norm_num
1134	calc f ((2*k+1)+2)
1135	≤ (3/4 : ℝ) * f (2k+1) := hdecay (2k+1)
1136	_ ≤ (3/4 : ℝ) * ((3/4 : ℝ)^k * f 0) := by
1137	have := mul_le_mul_of_nonneg_left ih h34_nn
1138	linarith
1139	_ = (3/4 : ℝ)^(k+1) * f 0 := by rw [pow_succ]; ring
1140	-- f(j) ≤ (3/4)^(j/2) f(0)
1141	have hf_floor : ∀ j, f j ≤ (3/4 : ℝ)^(j/2) * f 0 := by
1142	intro j
1143	by_cases hpar : j % 2 = 0
1144	· have hjk : j = 2 * (j/2) := by omega
1145	have h := hf_even (j/2)
1146	rw [← hjk] at h
1147	exact h
1148	· have hjk : j = 2 * (j/2) + 1 := by omega
1149	have h := hf_odd (j/2)
1150	rw [← hjk] at h
1151	exact h
1152	-- ∑_{j<2m} (3/4)^(j/2) = 2 · ∑_{k<m} (3/4)^k
1153	have hpair : ∀ m : ℕ, ∑ j ∈ Finset.range (2*m), (3/4 : ℝ)^(j/2) =
1154	2 * ∑ k ∈ Finset.range m, (3/4 : ℝ)^k := by
1155	intro m
1156	induction m with
1157	\| zero => simp
1158	\| succ m ih =>
1159	have heq : 2 * (m+1) = 2*m + 2 := by ring
1160	rw [heq, Finset.sum_range_succ, Finset.sum_range_succ, ih, Finset.sum_range_succ]
1161	have h1 : (2*m)/2 = m := by omega
1162	have h2 : (2*m+1)/2 = m := by omega
1163	rw [h1, h2]; ring
1164	-- Bound on ∑ (3/4)^(j/2)
1165	have hgeom_floor : ∑ j ∈ Finset.range L, (3/4 : ℝ)^(j/2) ≤ 8 := by
1166	have hext :
1167	∑ j ∈ Finset.range L, (3/4 : ℝ)^(j/2) ≤
1168	∑ j ∈ Finset.range (2*(L/2 + 1)), (3/4 : ℝ)^(j/2) := by
1169	apply Finset.sum_le_sum_of_subset_of_nonneg
1170	· intro x hx; simp at hx ⊢; omega
1171	· intros; positivity
1172	rw [hpair (L/2 + 1)] at hext
1173	have hgeom_4 : ∑ k ∈ Finset.range (L/2 + 1), (3/4 : ℝ)^k ≤ 4 := by
1174	have h := geom_sum_Ico_le_of_lt_one (x := (3/4 : ℝ)) (m := 0) (n := L/2 + 1)
1175	(by norm_num) (by norm_num)
1176	rw [← Finset.range_eq_Ico] at h
1177	have h4 : ((3/4 : ℝ))^0 / (1 - 3/4) = 4 := by norm_num
1178	rw [h4] at h
1179	exact h
1180	linarith
1181	-- Combine: ∑ f(j) ≤ ∑ (3/4)^(j/2) f(0) = f(0) · ∑(3/4)^(j/2) ≤ 8·f(0) ≤ 10·f(0)
1182	have hf0_nn : 0 ≤ f 0 := hf_nn 0
1183	calc ∑ j ∈ Finset.range L, f j
1184	≤ ∑ j ∈ Finset.range L, (3/4 : ℝ)^(j/2) * f 0 :=
1185	Finset.sum_le_sum (fun j _ => hf_floor j)
1186	_ = (∑ j ∈ Finset.range L, (3/4 : ℝ)^(j/2)) * f 0 := by
1187	rw [Finset.sum_mul]
1188	_ ≤ 8 * f 0 := by
1189	have := mul_le_mul_of_nonneg_right hgeom_floor hf0_nn
1190	linarith
1191	_ ≤ 10 * Real.sqrt (Real.log T / T) := by
1192	have h0 : 0 ≤ Real.sqrt (Real.log T / T) := Real.sqrt_nonneg _
1193	rw [hf0]; linarith
1194
1195	/-- Analytic helper for `halving_budget_exists`: for any positive `c` and `K`,
1196	there is a constant `C₀` such that for any `C ≥ C₀` and `r ≥ 2`,
1197	setting `T := ⌊C·r²·log r⌋` we have `T ≥ 4` and
1198	`K·c·√(log T/T) ≤ 1/r`. -/
1199	private lemma exists_threshold_const (c K : ℝ) (hc : 0 < c) (hK : 0 < K) :
1200	∃ C₀ : ℝ, 0 < C₀ ∧ ∀ C : ℝ, C₀ ≤ C → ∀ r : ℝ, 2 ≤ r →
1201	4 ≤ Nat.floor (C * r^2 * Real.log r) ∧
1202	K * c * Real.sqrt (Real.log (Nat.floor (C * r^2 * Real.log r) : ℝ) /
1203	(Nat.floor (C * r^2 * Real.log r) : ℝ)) ≤ 1 / r := by
1204	set A : ℝ := K^2 * c^2 with hA_def
1205	have hA_pos : 0 < A := by positivity
1206	have hlog2_pos : 0 < Real.log 2 := Real.log_pos one_lt_two
1207	have hlog2_half : (1 : ℝ) / 2 < Real.log 2 := by
1208	have := Real.log_two_gt_d9; linarith
1209	-- Step 1: log x / x → 0, so eventually log x ≤ x · (log 2)/(8A)
1210	have htend : Filter.Tendsto (fun x : ℝ => Real.log x / x) Filter.atTop (nhds 0) := by
1211	have h := Real.tendsto_pow_log_div_mul_add_atTop 1 0 1 one_ne_zero
1212	simpa using h
1213	have hε_pos : 0 < Real.log 2 / (8 * A) := by positivity
1214	have hev : ∀ᶠ x in Filter.atTop, Real.log x / x < Real.log 2 / (8 * A) :=
1215	htend.eventually (gt_mem_nhds hε_pos)
1216	rw [Filter.eventually_atTop] at hev
1217	obtain ⟨C₁, hC₁⟩ := hev
1218	refine ⟨max (max C₁ 8) (24 * A), ?_, ?_⟩
1219	· have : (0 : ℝ) < 8 := by norm_num
1220	have h1 : (8 : ℝ) ≤ max C₁ 8 := le_max_right _ _
1221	have h2 : max C₁ 8 ≤ max (max C₁ 8) (24 * A) := le_max_left _ _
1222	linarith
1223	intro C hC r hr
1224	have hC₁_le : C₁ ≤ C := le_trans (le_trans (le_max_left _ _) (le_max_left _ _)) hC
1225	have h8_le : (8 : ℝ) ≤ C :=
1226	le_trans (le_trans (le_max_right _ _) (le_max_left _ _)) hC
1227	have h24A_le : 24 * A ≤ C := le_trans (le_max_right _ _) hC
1228	have hC_pos : 0 < C := by linarith
1229	have hlogC_nn : 0 ≤ Real.log C := Real.log_nonneg (by linarith)
1230	have hlogr_pos : 0 < Real.log r := Real.log_pos (by linarith)
1231	have hlogr_ge : Real.log 2 ≤ Real.log r := Real.log_le_log (by norm_num) hr
1232	have hr_pos : 0 < r := by linarith
1233	have hr2 : (4 : ℝ) ≤ r^2 := by nlinarith
1234	-- log C / C < log 2 / (8A), so 8 A log C < C log 2
1235	have hlogC_bound : 8 * A * Real.log C ≤ C * Real.log 2 := by
1236	have hlt := hC₁ C hC₁_le
1237	have h8A : (0 : ℝ) < 8 * A := by positivity
1238	have h1 : Real.log C / C * (C * (8 * A)) < Real.log 2 / (8 * A) * (C * (8 * A)) :=
1239	mul_lt_mul_of_pos_right hlt (by positivity)
1240	have h2 : Real.log C * (8 * A) < Real.log 2 * C := by
1241	have e1 : Real.log C / C * (C * (8 * A)) = Real.log C * (8 * A) := by
1242	field_simp
1243	have e2 : Real.log 2 / (8 * A) * (C * (8 * A)) = Real.log 2 * C := by
1244	field_simp
1245	linarith [h1, e1.symm.le, e2.symm.le]
1246	linarith
1247	-- T setup
1248	set X : ℝ := C * r^2 * Real.log r with hX_def
1249	have hX_pos : 0 < X := by positivity
1250	-- X ≥ C * 4 * log 2 ≥ 8 * 4 * log 2 > 16
1251	have hX_ge16 : (16 : ℝ) ≤ X := by
1252	have h := mul_le_mul (a := C * 4) (b := C * r^2) (c := Real.log 2) (d := Real.log r)
1253	(by nlinarith) hlogr_ge hlog2_pos.le (by positivity)
1254	have hCge : C * 4 * Real.log 2 ≥ 16 := by
1255	have : 8 * 4 * Real.log 2 ≥ 16 := by nlinarith
1256	nlinarith
1257	linarith [h]
1258	set T : ℕ := Nat.floor X with hT_def
1259	have hT_le : (T : ℝ) ≤ X := Nat.floor_le hX_pos.le
1260	have hT_ge : X - 1 ≤ (T : ℝ) := by
1261	have := Nat.sub_one_lt_floor X
1262	linarith
1263	have hT_ge_half : X / 2 ≤ (T : ℝ) := by linarith
1264	have hT_pos_real : (0 : ℝ) < (T : ℝ) := by linarith
1265	have hT_ge4 : 4 ≤ T := by
1266	have : (4 : ℝ) ≤ (T : ℝ) := by linarith
1267	exact_mod_cast this
1268	refine ⟨hT_ge4, ?_⟩
1269	-- Bound on log T
1270	have hT_le_Cr3 : (T : ℝ) ≤ C * r^3 := by
1271	have hlogr_le_r : Real.log r ≤ r := (Real.log_le_self hr_pos.le)
1272	have : X ≤ C * r^2 * r := by
1273	have := mul_le_mul_of_nonneg_left hlogr_le_r (by positivity : (0 : ℝ) ≤ C * r^2)
1274	simpa [hX_def] using this
1275	have h2 : C * r^2 * r = C * r^3 := by ring
1276	linarith [hT_le, this, h2.le]
1277	have hCr3_pos : 0 < C * r^3 := by positivity
1278	have hlogT_le : Real.log T ≤ Real.log C + 3 * Real.log r := by
1279	have h1 : Real.log T ≤ Real.log (C * r^3) :=
1280	Real.log_le_log hT_pos_real hT_le_Cr3
1281	have h2 : Real.log (C * r^3) = Real.log C + 3 * Real.log r := by
1282	rw [Real.log_mul hC_pos.ne' (by positivity), Real.log_pow]; push_cast; ring
1283	linarith
1284	have hlogT_nn : 0 ≤ Real.log T := Real.log_nonneg (by
1285	have : (1 : ℝ) ≤ 4 := by norm_num
1286	have h4 : (4 : ℝ) ≤ T := by exact_mod_cast hT_ge4
1287	linarith)
1288	-- Main inequality: A * r² * log T ≤ T
1289	have hMain : A * r^2 * Real.log T ≤ (T : ℝ) := by
1290	have hstep1 : A * r^2 * Real.log T ≤ A * r^2 * (Real.log C + 3 * Real.log r) :=
1291	mul_le_mul_of_nonneg_left hlogT_le (by positivity)
1292	have hstep2 : A * r^2 * (Real.log C + 3 * Real.log r) ≤ X / 2 := by
1293	-- equivalent: 2 A (log C + 3 log r) ≤ C log r (after dividing by r²)
1294	have hgoal : 2 * A * (Real.log C + 3 * Real.log r) ≤ C * Real.log r := by
1295	-- 2 A log C + 6 A log r ≤ C log r
1296	-- We have 8 A log C ≤ C log 2 ≤ C log r, so 2 A log C ≤ C log r / 4
1297	have h1 : 2 * A * Real.log C ≤ C * Real.log r / 4 := by
1298	have : 8 * A * Real.log C ≤ C * Real.log r := by
1299	have := hlogC_bound
1300	nlinarith [mul_le_mul_of_nonneg_left hlogr_ge (by linarith : (0:ℝ) ≤ C)]
1301	linarith
1302	-- 6 A log r ≤ C log r / 4 since 24 A ≤ C
1303	have h2 : 6 * A * Real.log r ≤ C * Real.log r / 4 := by
1304	have : 24 * A * Real.log r ≤ C * Real.log r := by
1305	have := mul_le_mul_of_nonneg_right h24A_le hlogr_pos.le
1306	linarith
1307	linarith
1308	nlinarith
1309	-- multiply hgoal by r²/2
1310	have hX2 : X / 2 = C * r^2 * Real.log r / 2 := by simp [hX_def]
1311	rw [hX2]
1312	nlinarith [hgoal, sq_nonneg r, hr_pos]
1313	linarith [hT_ge_half]
1314	-- Now derive K c √(log T/T) ≤ 1/r
1315	have hKcr_pos : 0 < K * c * r := by positivity
1316	have hsq_le : (K * c * r * Real.sqrt (Real.log T / T))^2 ≤ 1 := by
1317	have hnn : (0 : ℝ) ≤ Real.log T / T := div_nonneg hlogT_nn hT_pos_real.le
1318	rw [mul_pow, Real.sq_sqrt hnn]
1319	have : (K * c * r)^2 * (Real.log T / T) = A * r^2 * Real.log T / T := by
1320	simp [hA_def]; ring
1321	rw [this, div_le_one hT_pos_real]
1322	exact hMain
1323	have hpos : 0 ≤ K * c * r * Real.sqrt (Real.log T / T) := by
1324	apply mul_nonneg hKcr_pos.le (Real.sqrt_nonneg _)
1325	have hKcr_le_1 : K * c * r * Real.sqrt (Real.log T / T) ≤ 1 := by
1326	have h := Real.sqrt_le_sqrt hsq_le
1327	rw [Real.sqrt_sq hpos, Real.sqrt_one] at h
1328	exact h
1329	rw [le_div_iff₀ hr_pos]
1330	have heq : K * c * Real.sqrt (Real.log T / T) * r =
1331	K * c * r * Real.sqrt (Real.log T / T) := by ring
1332	rw [heq]; exact hKcr_le_1
1333
1334	/-- Construct the analytic budget for the halving iteration. -/
1335	private lemma halving_budget_exists {c : ℝ} (hc : 0 < c) (Cgeom : ℝ) (hCgeom : 0 < Cgeom) :
1336	∃ C : ℝ, 0 < C ∧ (max 1 (c * Cgeom + 1)) ^ 2 ≤ C ∧
1337	∀ (r : ℝ), 2 ≤ r → ∀ (M : ℕ),
1338	∃ (threshold : ℕ) (B : ℕ → ℝ),
1339	1 ≤ threshold ∧
1340	((threshold : ℝ) ≤ C * r ^ 2 * Real.log r) ∧
1341	(∀ n, 0 ≤ B n) ∧
1342	B M ≤ 1 / r ∧
1343	(∀ n m : ℕ, threshold < n → 2 ≤ n → m ≤ n / 2 →
1344	c * Real.sqrt (Real.log (n : ℝ) / n) + B m ≤ B n) := by
1345	obtain ⟨Kchain, hKchain_pos, hdyadic⟩ := dyadic_chain_geometric_bound
1346	obtain ⟨C₀, hC₀_pos, hanalytic⟩ := exists_threshold_const c Kchain hc hKchain_pos
1347	refine ⟨max C₀ ((max 1 (c * Cgeom + 1)) ^ 2),
1348	lt_of_lt_of_le hC₀_pos (le_max_left _ _),
1349	le_max_right _ _, ?_⟩
1350	intro r hr M
1351	set Cmax := max C₀ ((max 1 (c * Cgeom + 1)) ^ 2) with hCmax_def
1352	have hC₀_le : C₀ ≤ Cmax := le_max_left _ _
1353	obtain ⟨hT_ge4, hanalytic_bnd⟩ := hanalytic Cmax hC₀_le r hr
1354	set T : ℕ := Nat.floor (Cmax * r^2 * Real.log r) with hT_def
1355	have hT_pos : 0 < T := by omega
1356	have hCmax_pos : 0 < Cmax := lt_of_lt_of_le hC₀_pos hC₀_le
1357	have hlogr_pos : 0 < Real.log r := Real.log_pos (by linarith)
1358	set L : ℕ → ℕ := fun n => if n ≤ T then 0 else Nat.log 2 (n / T) + 1 with hL_def
1359	set f : ℕ → ℝ := fun k =>
1360	Real.sqrt (Real.log ((T : ℝ) * 2^k) / ((T : ℝ) * 2^k)) with hf_def
1361	set B : ℕ → ℝ := fun n => c * ∑ k ∈ Finset.range (L n), f k with hB_def
1362	have hf_nn : ∀ k, 0 ≤ f k := fun k => Real.sqrt_nonneg _
1363	have hB_nn : ∀ n, 0 ≤ B n := fun n =>
1364	mul_nonneg (le_of_lt hc) (Finset.sum_nonneg (fun _ _ => hf_nn _))
1365	have hc_nn : 0 ≤ c := le_of_lt hc
1366	-- Key: For T < n, c√(log n/n) ≤ c f (L n - 1).
1367	have hkey : ∀ n : ℕ, T < n → c * Real.sqrt (Real.log (n : ℝ) / n) ≤ c * f (L n - 1) := by
1368	intro n hn
1369	have hL_n : L n = Nat.log 2 (n / T) + 1 := by
1370	simp only [hL_def]; rw [if_neg (not_le.mpr hn)]
1371	have hLn_pos : 0 < L n := by rw [hL_n]; omega
1372	have hk_eq : L n - 1 = Nat.log 2 (n / T) := by rw [hL_n]; omega
1373	have hnT_pos : 0 < n / T := Nat.div_pos (le_of_lt hn) hT_pos
1374	have hpow_le : 2 ^ (Nat.log 2 (n / T)) ≤ n / T :=
1375	Nat.pow_log_le_self 2 (Nat.pos_iff_ne_zero.mp hnT_pos)
1376	have hTpow_le_n : T * 2 ^ (L n - 1) ≤ n := by
1377	rw [hk_eq]
1378	calc T * 2 ^ (Nat.log 2 (n / T))
1379	≤ T * (n / T) := Nat.mul_le_mul_left T hpow_le
1380	_ ≤ n := Nat.mul_div_le n T
1381	have hT_le_Tpow : T ≤ T * 2 ^ (L n - 1) := by
1382	apply Nat.le_mul_of_pos_right
1383	exact Nat.two_pow_pos _
1384	have hTpow_ge3_nat : 3 ≤ T * 2 ^ (L n - 1) := le_trans (by omega) hT_le_Tpow
1385	have hTpow_ge3 : (3 : ℝ) ≤ ((T * 2 ^ (L n - 1) : ℕ) : ℝ) := by exact_mod_cast hTpow_ge3_nat
1386	have hTpow_le_n_real : ((T * 2 ^ (L n - 1) : ℕ) : ℝ) ≤ (n : ℝ) := by exact_mod_cast hTpow_le_n
1387	have hsqrt_le :
1388	Real.sqrt (Real.log (n : ℝ) / (n : ℝ))
1389	≤ Real.sqrt (Real.log ((T * 2 ^ (L n - 1) : ℕ) : ℝ) /
1390	((T * 2 ^ (L n - 1) : ℕ) : ℝ)) :=
1391	sqrt_log_div_antitone hTpow_ge3 hTpow_le_n_real
1392	have heq : f (L n - 1) =
1393	Real.sqrt (Real.log ((T * 2 ^ (L n - 1) : ℕ) : ℝ) /
1394	((T * 2 ^ (L n - 1) : ℕ) : ℝ)) := by
1395	simp only [hf_def]; push_cast; rfl
1396	rw [heq]
1397	exact mul_le_mul_of_nonneg_left hsqrt_le hc_nn
1398	refine ⟨T, B, by omega, ?_, hB_nn, ?_, ?_⟩
1399	· -- T ≤ Cmax·r²·log r
1400	have hprod_nn : 0 ≤ Cmax * r^2 * Real.log r := by positivity
1401	exact Nat.floor_le hprod_nn
1402	· -- B M ≤ 1/r
1403	have h1 : (∑ k ∈ Finset.range (L M), f k) ≤
1404	Kchain * Real.sqrt (Real.log (T : ℝ) / T) := hdyadic T hT_ge4 (L M)
1405	have h2 : B M ≤ c * (Kchain * Real.sqrt (Real.log (T : ℝ) / T)) := by
1406	show c * _ ≤ _
1407	exact mul_le_mul_of_nonneg_left h1 hc_nn
1408	have h3 : c * (Kchain * Real.sqrt (Real.log (T : ℝ) / T)) =
1409	Kchain * c * Real.sqrt (Real.log (T : ℝ) / T) := by ring
1410	rw [h3] at h2
1411	exact le_trans h2 hanalytic_bnd
1412	· -- recurrence
1413	intro n m hn_gt_T hn_ge2 hm_le_half
1414	have hL_n : L n = Nat.log 2 (n / T) + 1 := by
1415	simp only [hL_def]; rw [if_neg (not_le.mpr hn_gt_T)]
1416	have hLn_pos : 0 < L n := by rw [hL_n]; omega
1417	have hLm_lt_Ln : L m < L n := by
1418	by_cases hmT : m ≤ T
1419	· have hLm_zero : L m = 0 := by simp only [hL_def]; rw [if_pos hmT]
1420	rw [hLm_zero]; exact hLn_pos
1421	· push_neg at hmT
1422	have hL_m : L m = Nat.log 2 (m / T) + 1 := by
1423	simp only [hL_def]; rw [if_neg (not_le.mpr hmT)]
1424	have hmT_div : m / T ≤ (n / T) / 2 := by
1425	calc m / T ≤ (n / 2) / T := Nat.div_le_div_right hm_le_half
1426	_ = n / (2 * T) := Nat.div_div_eq_div_mul n 2 T
1427	_ = n / (T * 2) := by rw [mul_comm 2 T]
1428	_ = (n / T) / 2 := (Nat.div_div_eq_div_mul n T 2).symm
1429	have hnT_ge2 : 2 ≤ n / T := by
1430	have h2m : 2 * m ≤ n := by omega
1431	have hmge : T + 1 ≤ m := hmT
1432	have : 2 * T + 2 ≤ n := by omega
1433	calc 2 = (2 * T) / T := (Nat.mul_div_cancel 2 hT_pos).symm
1434	_ ≤ n / T := Nat.div_le_div_right (by omega)
1435	have hlog_div : Nat.log 2 ((n / T) / 2) = Nat.log 2 (n / T) - 1 :=
1436	Nat.log_div_base 2 (n / T)
1437	have hlog_le : Nat.log 2 (m / T) ≤ Nat.log 2 (n / T) - 1 := by
1438	calc Nat.log 2 (m / T) ≤ Nat.log 2 ((n / T) / 2) := Nat.log_mono_right hmT_div
1439	_ = Nat.log 2 (n / T) - 1 := hlog_div
1440	have hlog_n_pos : 1 ≤ Nat.log 2 (n / T) := by
1441	have h := Nat.log_mono_right (b := 2) hnT_ge2
1442	simpa using h
1443	rw [hL_m, hL_n]; omega
1444	have hLn_sub : L n - 1 < L n := by omega
1445	have hLm_le : L m ≤ L n - 1 := by omega
1446	have hsplit : ∑ k ∈ Finset.range (L n), f k =
1447	(∑ k ∈ Finset.range (L m), f k) +
1448	∑ k ∈ Finset.Ico (L m) (L n), f k := by
1449	have h := (Finset.sum_Ico_consecutive f (Nat.zero_le (L m)) (le_of_lt hLm_lt_Ln)).symm
1450	simp only [Finset.range_eq_Ico]
1451	exact h
1452	have hIco_ge : f (L n - 1) ≤ ∑ k ∈ Finset.Ico (L m) (L n), f k := by
1453	apply Finset.single_le_sum (f := f) (s := Finset.Ico (L m) (L n))
1454	(fun i _ => hf_nn i)
1455	rw [Finset.mem_Ico]
1456	exact ⟨hLm_le, hLn_sub⟩
1457	have hBn_eq : B n = c * (∑ k ∈ Finset.range (L m), f k) +
1458	c * ∑ k ∈ Finset.Ico (L m) (L n), f k := by
1459	show c * _ = _
1460	rw [hsplit, mul_add]
1461	have hBm_eq : B m = c * ∑ k ∈ Finset.range (L m), f k := rfl
1462	have hkeyN := hkey n hn_gt_T
1463	have hIco_mul : c * f (L n - 1) ≤ c * ∑ k ∈ Finset.Ico (L m) (L n), f k :=
1464	mul_le_mul_of_nonneg_left hIco_ge hc_nn
1465	calc c * Real.sqrt (Real.log (n : ℝ) / n) + B m
1466	≤ c * f (L n - 1) + B m := by linarith
1467	_ ≤ c * (∑ k ∈ Finset.Ico (L m) (L n), f k) + B m := by linarith
1468	_ = B n := by rw [hBn_eq, hBm_eq]; ring
1469
1470	/-- For any finite set family of VC-dimension at most `d`, and `r ≥ 2`,
1471	there exists a `(1/r)`-approximation of size `O(r² log r)`.
1472	The constant `C` depends only on `d`. (Lemma 5.13) -/
1473	theorem epsilonApproxBound (d : ℕ) : ∃ C : ℝ, 0 < C ∧
1474	∀ (α : Type*) [DecidableEq α] [Fintype α] (𝒜 : Finset (Finset α)),
1475	𝒜.vcDim ≤ d →
1476	∀ (r : ℝ), 2 ≤ r →
1477	∃ Y : Finset α, Catalog.VC.EpsilonApproximation.IsEpsilonApprox 𝒜 (1 / r) Y ∧
1478	(Y.card : ℝ) ≤ C * r ^ 2 * Real.log r := by
1479	-- Get the halving step constant and the geometric error sum constant
1480	obtain ⟨c, hc, step⟩ := random_halving_step d
1481	obtain ⟨Cgeom, hCgeom, geom_bound⟩ := geometric_error_sum
1482	obtain ⟨C, hCpos, _hCge, hbudget⟩ := halving_budget_exists hc Cgeom hCgeom
1483	refine ⟨C, hCpos, ?_⟩
1484	intro α inst1 inst2 𝒜 hd r hr
1485	-- Use step at this specific universe to fix the metavariable
1486	have hstep := @step α inst1 inst2
1487	by_cases h_small : (Fintype.card α : ℝ) ≤ C * r ^ 2 * Real.log r
1488	· -- Small ground set: Y = Finset.univ is already small enough
1489	refine ⟨Finset.univ, isEpsilonApprox_mono (univ_isEpsilonApprox 𝒜) ?_, ?_⟩
1490	· positivity
1491	· simp [Finset.card_univ]; linarith
1492	· -- Large ground set: iterate halving from univ.
1493	push_neg at h_small
1494	-- Obtain the analytic budget.
1495	obtain ⟨threshold, B, ht, hthresh_le, hB_nonneg, hB_top, hB_step⟩ :=
1496	hbudget r hr (Fintype.card α)
1497	-- Universe is non-empty (since \|α\| ≥ C·r²·log r ≥ 0 — actually we need ≥ 1).
1498	have h_univ_pos : 0 < (Finset.univ : Finset α).card := by
1499	rw [Finset.card_univ]
1500	have hCpos : (0 : ℝ) < C := by positivity
1501	have hlog2_pos : 0 < Real.log 2 := Real.log_pos (by norm_num)
1502	have hlogr_pos : 0 < Real.log r := Real.log_pos (by linarith)
1503	have h_prod_pos : 0 < C * r ^ 2 * Real.log r := by positivity
1504	have : (0 : ℝ) < (Fintype.card α : ℝ) := lt_of_lt_of_le h_prod_pos (le_of_lt h_small)
1505	exact_mod_cast this
1506	-- Apply iterate_halving_approx starting from univ (a 0-approx).
1507	obtain ⟨Z, hZsub, hZpos, hZthresh, hZε⟩ :=
1508	iterate_halving_approx (le_of_lt hc) hstep 𝒜 hd threshold ht B hB_nonneg hB_step
1509	Finset.univ h_univ_pos 0 le_rfl (univ_isEpsilonApprox 𝒜)
1510	refine ⟨Z, ?_, ?_⟩
1511	· -- IsEpsilonApprox 𝒜 (1/r) Z, using B (Fintype.card α) ≤ 1/r
1512	have hbound : (0 : ℝ) + B (Finset.univ : Finset α).card ≤ 1 / r := by
1513	rw [Finset.card_univ]; linarith [hB_top]
1514	exact isEpsilonApprox_mono hZε hbound
1515	· -- Size: Z.card ≤ threshold ≤ C·r²·log r
1516	calc (Z.card : ℝ) ≤ (threshold : ℝ) := by exact_mod_cast hZthresh
1517	_ ≤ C * r ^ 2 * Real.log r := hthresh_le
1518
1519	end Catalog.VC.EpsilonApproximationBound
1520