Instances For
theorem
MultiplicativeWeights.expert_penalty_split
{n : ℕ}
{P : Type u_1}
(M : Fin n → P → ℝ)
(outcomes : ℕ → P)
(i : Fin n)
(T : ℕ)
:
totalExpertPenalty M outcomes i T = totalNonnegPenalty M outcomes i T + totalNegPenalty M outcomes i T
theorem
MultiplicativeWeights.general_mw_regret_bound
{P : Type u_1}
{n : ℕ}
(hn : 0 < n)
(M : Fin n → P → ℝ)
(ρ ε : ℝ)
(outcomes : ℕ → P)
(hε_pos : 0 < ε)
(hε_le : ε ≤ 1 / 2)
(hρ_pos : 0 < ρ)
(hM : ∀ (i : Fin n) (j : P), M i j ∈ Set.Icc (-ρ) ρ)
(i : Fin n)
(T : ℕ)
:
totalExpectedPenalty M ρ ε outcomes T ≤ ρ * Real.log ↑n / ε + (1 + ε) * totalNonnegPenalty M outcomes i T + (1 - ε) * totalNegPenalty M outcomes i T
theorem
MultiplicativeWeights.corollary_algebraic_core
(totalExp expertTotal A B ρ logn δ : ℝ)
(T : ℕ)
(hT_pos : 0 < ↑T)
(hρ_pos : 0 < ρ)
(hδ_pos : 0 < δ)
(hAB : A + B = expertTotal)
(hAmB : A - B ≤ ↑T * ρ)
(hbound : totalExp ≤ ρ * logn / (δ / (4 * ρ)) + (1 + δ / (4 * ρ)) * A + (1 - δ / (4 * ρ)) * B)
(hT_big : 16 * ρ ^ 2 * logn / δ ^ 2 ≤ ↑T)
:
theorem
MultiplicativeWeights.mw_average_penalty_bound
{P : Type u_1}
{n : ℕ}
(hn : 0 < n)
(M : Fin n → P → ℝ)
{ρ : ℝ}
(outcomes : ℕ → P)
(hρ_pos : 0 < ρ)
(hM : ∀ (i : Fin n) (j : P), M i j ∈ Set.Icc (-ρ) ρ)
{δ : ℝ}
(hδ_pos : 0 < δ)
(hε_le : δ / (4 * ρ) ≤ 1 / 2)
{T : ℕ}
(hT_pos : 0 < T)
(hT_big : 16 * ρ ^ 2 * Real.log ↑n / δ ^ 2 ≤ ↑T)
(i : Fin n)
: