Documentation

MDP.Bellman

theorem iSup_iterate_succ' {α : Type u_1} [CompleteLattice α] (f : αα) :
⨆ (n : ), f^[n + 1] = ⨆ (n : ), f^[n]
theorem iSup_iterate_succ {α : Type u_1} [CompleteLattice α] (f : αα) :
⨆ (n : ), f^[n + 1] = ⨆ (n : ), f^[n]
noncomputable def MDP.Φf {State : Type u_1} {Act : Type u_2} {M : MDP State Act} (s : State) (α : Act) :
Equations
Instances For
    noncomputable def MDP.Φ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} (O : Optimization) (c : M.Costs) :

    The Bellman operator.

    Equations
    Instances For
      @[reducible, inline, deprecated "Φ 𝒟" (since := "2025-09-15")]
      noncomputable abbrev MDP. {State : Type u_1} {Act : Type u_2} {M : MDP State Act} (c : M.Costs) :

      The demonic Bellman operator.

      Equations
      Instances For
        @[reducible, inline, deprecated "Φ 𝒜" (since := "2025-09-15")]
        noncomputable abbrev MDP. {State : Type u_1} {Act : Type u_2} {M : MDP State Act} (c : M.Costs) :

        The angelic Bellman operator.

        Equations
        Instances For
          noncomputable def MDP.Φℒ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} ( : 𝔏[M]) (c : M.Costs) :

          The Bellman operator with a fixed scheduler (necessarily Markovian).

          Equations
          Instances For
            theorem MDP.Φ.monotone' {State : Type u_1} {Act : Type u_2} {M : MDP State Act} {O : Optimization} :
            theorem MDP.dΦ_le_Φℒ {State✝ : Type u_3} {Act✝ : Type u_4} {M✝ : MDP State✝ Act✝} { : 𝔏[M✝]} :
            @[deprecated "lfp (M.Φ O)" (since := "2025-09-15")]
            noncomputable def MDP.lfp_Φ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} :
            M.CostsM.Costs
            Equations
            Instances For
              theorem MDP.iSup_succ_Φ_eq_iSup_Φ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} (O : Optimization) (c : M.Costs) :
              ⨆ (n : ), (⇑(Φ O c))^[n + 1] = ⨆ (n : ), (⇑(Φ O c))^[n]
              theorem MDP.iSup_succ_Φ_eq_iSup_Φ_apply {State : Type u_1} {Act : Type u_2} {M : MDP State Act} {x : State} (O : Optimization) (c : M.Costs) :
              ⨆ (n : ), (⇑(Φ O c))^[n + 1] x = ⨆ (n : ), (⇑(Φ O c))^[n] x
              noncomputable def MDP.lfp_Φℒ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} ( : 𝔏[M]) :
              M.CostsM.Costs
              Equations
              Instances For
                theorem MDP.map_lfp_Φℒ {State✝ : Type u_3} {Act✝ : Type u_4} {M✝ : MDP State✝ Act✝} {c : 𝔏[M✝]} {𝒮 : M✝.Costs} :
                (Φℒ c 𝒮) (lfp_Φℒ c 𝒮) = lfp_Φℒ c 𝒮
                theorem MDP.Φf_ωScottContinuous {State : Type u_1} {Act : Type u_2} {M : MDP State Act} {s : State} {a : Act} :
                theorem MDP.Φℒ_ωScottContinuous {State : Type u_1} {Act : Type u_2} {M : MDP State Act} {c : 𝔏[M]} { : M.Costs} :
                theorem MDP.lfp_Φℒ_eq_iSup_Φℒ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} :
                lfp_Φℒ = fun (c : 𝔏[M]) ( : M.Costs) => ⨆ (n : ), (⇑(Φℒ c ))^[n]
                theorem MDP.lfp_Φℒ_eq_iSup_succ_Φℒ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} :
                lfp_Φℒ = fun (c : 𝔏[M]) ( : M.Costs) => ⨆ (n : ), (⇑(Φℒ c ))^[n + 1]
                class Optimization.ΦContinuous {S : Type u_3} {A : Type u_4} (O : Optimization) (M : MDP S A) :
                Instances
                  theorem MDP.lfp_Φ_eq_iSup_Φ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} {c : M.Costs} {O : Optimization} [i : O.ΦContinuous M] :
                  OrderHom.lfp (Φ O c) = ⨆ (n : ), (⇑(Φ O c))^[n]
                  theorem MDP.lfp_Φ_eq_iSup_succ_Φ {State : Type u_1} {Act : Type u_2} {M : MDP State Act} {c : M.Costs} {O : Optimization} [i : O.ΦContinuous M] :
                  OrderHom.lfp (Φ O c) = ⨆ (n : ), (⇑(Φ O c))^[n + 1]
                  instance MDP.instΦContinuousAngelic {State : Type u_1} {Act : Type u_2} {M : MDP State Act} :
                  instance MDP.instΦContinuousDemonic {State : Type u_1} {Act : Type u_2} {M : MDP State Act} [M.FiniteBranching] :
                  instance MDP.instΦContinuous {State : Type u_1} {Act : Type u_2} {M : MDP State Act} [M.FiniteBranching] {O : Optimization} :