Alternative forward models

This tutorial was generated using Literate.jl. Download the source as a .jl file. Download the source as a .ipynb file.

This example demonstrates how to train convex and non-convex models.

This example uses the following packages:

using SDDP
import Ipopt
import PowerModels
import Test

Formulation

For our model, we build a simple optimal power flow model with a single hydro-electric generator.

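The formulation of our optimal power flow problem depends on model_type, which must be one of the PowerModels formulations (in this tutorial, PowerModels.DCPPowerModel for the convex approximation and PowerModels.ACPPowerModel for the non-convex model).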

(To run locally, download pglib_opf_case5_pjm.m and update filename appropriately.)

"""
    build_model(model_type; filename = joinpath(@__DIR__, "pglib_opf_case5_pjm.m"))

Build an `SDDP.PolicyGraph` whose subproblem is a PowerModels optimal power
flow problem with one generator treated as hydro.

# Arguments
- `model_type`: forwarded to `PowerModels.instantiate_model`; it selects the
  power flow formulation (for example `PowerModels.DCPPowerModel` or
  `PowerModels.ACPPowerModel`).

# Keywords
- `filename`: path of the network case file handed to
  `PowerModels.parse_file`. Defaults to `pglib_opf_case5_pjm.m` in the
  directory of this source file, so existing `build_model(model_type)` calls
  behave exactly as before.

# Returns
The `SDDP.PolicyGraph` built on `SDDP.UnicyclicGraph(0.95)`, minimizing, with
a lower bound of `0.0` and `Ipopt.Optimizer` as the subproblem optimizer.
"""
function build_model(
    model_type;
    filename = joinpath(@__DIR__, "pglib_opf_case5_pjm.m"),
)
    data = PowerModels.parse_file(filename)
    return SDDP.PolicyGraph(
        SDDP.UnicyclicGraph(0.95);
        sense = :Min,
        lower_bound = 0.0,
        optimizer = Ipopt.Optimizer,
    ) do sp, t
        # Let PowerModels add the OPF variables, constraints, and objective
        # directly to the SDDP subproblem `sp`.
        power_model = PowerModels.instantiate_model(
            data,
            model_type,
            PowerModels.build_opf;
            jump_model = sp,
        )
        # Now add hydro power models. Assume that generator 5 is hydro, and the
        # rest are thermal.
        pg = power_model.var[:it][:pm][:nw][0][:pg][5]
        # Store the hydro generation variable in `sp` under the key `:pg`.
        sp[:pg] = pg
        # State variable linking consecutive stages; presumably the hydro
        # storage level (the tutorial text only says the generator is
        # hydro-electric) -- confirm before relying on this interpretation.
        @variable(sp, x >= 0, SDDP.State, initial_value = 10.0)
        @variable(sp, deficit >= 0)
        @constraint(sp, balance, x.out == x.in - pg + deficit)
        # Keep the objective that PowerModels built and add a 1e6 penalty per
        # unit of `deficit`.
        @stageobjective(sp, objective_function(sp) + 1e6 * deficit)
        # The random term ω enters as the right-hand side of `balance`, i.e.
        # x.out - x.in + pg - deficit == ω.
        SDDP.parameterize(sp, [0, 2, 5]) do ω
            return SDDP.set_normalized_rhs(balance, ω)
        end
        return
    end
end

build_model (generic function with 1 method)

Training a convex model

We can build and train a convex approximation of the optimal power flow problem.

The problem with the convex model is that it does not accurately simulate the true dynamics of the problem. Therefore, it under-estimates the true cost of operation.

# Build the policy graph with `DCPPowerModel`, the convex approximation used
# in this tutorial.
convex = build_model(PowerModels.DCPPowerModel)
# Train with a fixed budget of 10 iterations.
SDDP.train(convex; iteration_limit = 10)

-------------------------------------------------------------------
         SDDP.jl (c) Oscar Dowson and contributors, 2017-25
-------------------------------------------------------------------
problem
  nodes           : 1
  state variables : 1
  scenarios       : Inf
  existing cuts   : false
options
  solver          : serial mode
  risk measure    : SDDP.Expectation()
  sampling scheme : SDDP.InSampleMonteCarlo
subproblem structure
  VariableRef                             : [20, 20]
  AffExpr in MOI.EqualTo{Float64}         : [13, 13]
  AffExpr in MOI.Interval{Float64}        : [6, 6]
  VariableRef in MOI.GreaterThan{Float64} : [14, 14]
  VariableRef in MOI.LessThan{Float64}    : [11, 11]
numerical stability report
  matrix range     [1e+00, 2e+02]
  objective range  [1e+00, 1e+06]
  bounds range     [4e-01, 6e+00]
  rhs range        [5e-01, 5e+00]
-------------------------------------------------------------------
 iteration    simulation      bound        time (s)     solves  pid
-------------------------------------------------------------------
         1   1.274089e+06  5.017598e+04  1.711180e-01        43   1
         5   4.067898e+05  3.756841e+05  1.484169e+00       263   1
         7   2.048883e+06  4.074485e+05  2.768300e+00       465   1
        10   9.922528e+04  4.183036e+05  3.178887e+00       526   1
-------------------------------------------------------------------
status         : iteration_limit
total time (s) : 3.178887e+00
total solves   : 526
best bound     :  4.183036e+05
simulation ci  :  5.000171e+05 ± 4.034325e+05
numeric issues : 0
-------------------------------------------------------------------

To more accurately simulate the dynamics of the problem, a common approach is to write the cuts representing the policy to a file, and then read them into a non-convex model:

# Write the cuts of the trained convex model to the file "convex.cuts.json".
SDDP.write_cuts_to_file(convex, "convex.cuts.json")
# Build a separate policy graph that uses the non-convex formulation.
non_convex = build_model(PowerModels.ACPPowerModel)
# Read the convex model's cuts from that file into the non-convex model.
SDDP.read_cuts_from_file(non_convex, "convex.cuts.json")

Now we can simulate non_convex to evaluate the policy.

# Run one simulation of the non-convex model using the cuts read from file.
result = SDDP.simulate(non_convex, 1)

1-element Vector{Vector{Dict{Symbol, Any}}}:
 [Dict(:bellman_term => 395752.9890698975, :noise_term => 5, :node_index => 1, :stage_objective => 17624.178370710113, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 395098.97737876826, :noise_term => 5, :node_index => 1, :stage_objective => 17624.178370354402, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 403915.8545336708, :noise_term => 0, :node_index => 1, :stage_objective => 17624.178381568763, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 403261.84283321834, :noise_term => 5, :node_index => 1, :stage_objective => 17624.178379679088, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407935.1835426768, :noise_term => 0, :node_index => 1, :stage_objective => 22193.240772952922, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407281.1717919707, :noise_term => 5, :node_index => 1, :stage_objective => 17624.17842124894, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407935.1835427424, :noise_term => 2, :node_index => 1, :stage_objective => 22555.156273926947, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407281.17179202376, :noise_term => 5, :node_index => 1, :stage_objective => 17624.178421248937, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407935.18354274245, :noise_term => 2, :node_index => 1, :stage_objective => 22555.156274010125, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407281.1717920238, :noise_term => 5, :node_index => 1, :stage_objective => 17624.17842124894, :objective_state => nothing, :belief => Dict(1 => 1.0))  …  Dict(:bellman_term => 407281.1717921735, :noise_term => 5, :node_index => 1, :stage_objective => 17624.178421248944, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 406627.16007011646, :noise_term => 5, :node_index => 1, 
:stage_objective => 17624.178401286645, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 408056.5159874213, :noise_term => 0, :node_index => 1, :stage_objective => 27420.553470545066, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 412364.2715349417, :noise_term => 0, :node_index => 1, :stage_objective => 27420.553470545052, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407935.1829087369, :noise_term => 5, :node_index => 1, :stage_objective => 18380.454751017478, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 407281.1711662849, :noise_term => 5, :node_index => 1, :stage_objective => 17624.178421248896, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 410149.7254678595, :noise_term => 0, :node_index => 1, :stage_objective => 27420.553470545074, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 414457.4810153788, :noise_term => 0, :node_index => 1, :stage_objective => 27420.553470544877, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 421105.69013841165, :noise_term => 0, :node_index => 1, :stage_objective => 27420.553494386764, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 441205.3050071765, :noise_term => 0, :node_index => 1, :stage_objective => 27420.55350562847, :objective_state => nothing, :belief => Dict(1 => 1.0))]

A problem with reading and writing the cuts to file is that the cuts have been generated from trial points of the convex model. Therefore, the policy may be arbitrarily bad at points visited by the non-convex model.

Training a non-convex model

We can also build and train a non-convex formulation of the optimal power flow problem.

The problem with the non-convex model is that because it is non-convex, SDDP.jl may find a sub-optimal policy. Therefore, it may over-estimate the true cost of operation.

# Rebind `non_convex` to a newly built model; the previous one had the convex
# model's cuts read into it.
non_convex = build_model(PowerModels.ACPPowerModel)
# Train directly on the non-convex formulation with a budget of 10 iterations.
SDDP.train(non_convex; iteration_limit = 10)
# Run one simulation of the trained non-convex model.
result = SDDP.simulate(non_convex, 1)

1-element Vector{Vector{Dict{Symbol, Any}}}:
 [Dict(:bellman_term => 409498.53182866715, :noise_term => 5, :node_index => 1, :stage_objective => 17629.314309163234, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 414679.7096383052, :noise_term => 2, :node_index => 1, :stage_objective => 17629.31431083395, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 413999.9236977312, :noise_term => 5, :node_index => 1, :stage_objective => 17629.314310500416, :objective_state => nothing, :belief => Dict(1 => 1.0)), Dict(:bellman_term => 413320.1377574513, :noise_term => 5, :node_index => 1, :stage_objective => 17629.314310206475, :objective_state => nothing, :belief => Dict(1 => 1.0))]

Combining convex and non-convex models

To summarize, training with the convex model constructs cuts at points that may never be visited by the non-convex model, and training with the non-convex model may construct arbitrarily poor cuts because a key assumption of SDDP is convexity.

As a compromise, we can train a policy using a combination of the convex and non-convex models; we'll use the non-convex model to generate trial points on the forward pass, and we'll use the convex model to build cuts on the backward pass.

# Build a new convex model; this is the model passed to `SDDP.train` below.
convex = build_model(PowerModels.DCPPowerModel)

A policy graph with 1 nodes.
 Node indices: 1

# Build a new non-convex model; it is handed to the alternative forward pass
# and the post-iteration callback below.
non_convex = build_model(PowerModels.ACPPowerModel)

A policy graph with 1 nodes.
 Node indices: 1

To do so, we train convex using the SDDP.AlternativeForwardPass forward pass, which simulates the model using non_convex, and we use SDDP.AlternativePostIterationCallback as a post-iteration callback, which copies cuts from the convex model back into the non_convex model.

SDDP.train(
    convex;
    # Simulate the forward pass with `non_convex` rather than `convex`.
    forward_pass = SDDP.AlternativeForwardPass(non_convex),
    # Post-iteration callback that copies cuts from `convex` into `non_convex`.
    post_iteration_callback = SDDP.AlternativePostIterationCallback(non_convex),
    iteration_limit = 10,
)

-------------------------------------------------------------------
         SDDP.jl (c) Oscar Dowson and contributors, 2017-25
-------------------------------------------------------------------
problem
  nodes           : 1
  state variables : 1
  scenarios       : Inf
  existing cuts   : false
options
  solver          : serial mode
  risk measure    : SDDP.Expectation()
  sampling scheme : SDDP.InSampleMonteCarlo
subproblem structure
  VariableRef                             : [20, 20]
  AffExpr in MOI.EqualTo{Float64}         : [13, 13]
  AffExpr in MOI.Interval{Float64}        : [6, 6]
  VariableRef in MOI.GreaterThan{Float64} : [14, 14]
  VariableRef in MOI.LessThan{Float64}    : [11, 11]
numerical stability report
  matrix range     [1e+00, 2e+02]
  objective range  [1e+00, 1e+06]
  bounds range     [4e-01, 6e+00]
  rhs range        [5e-01, 5e+00]
-------------------------------------------------------------------
 iteration    simulation      bound        time (s)     solves  pid
-------------------------------------------------------------------
         1   2.595696e+05  8.441389e+04  2.821920e-01        42   1
         3   3.976417e+06  2.110723e+05  2.295910e+00       252   1
         8   3.016261e+05  3.211073e+05  3.582538e+00       381   1
         9   2.323392e+06  3.386967e+05  5.820411e+00       573   1
        10   5.893709e+05  3.508227e+05  6.750280e+00       657   1
-------------------------------------------------------------------
status         : iteration_limit
total time (s) : 6.750280e+00
total solves   : 657
best bound     :  3.508227e+05
simulation ci  :  8.044136e+05 ± 8.097506e+05
numeric issues : 0
-------------------------------------------------------------------

In practice, if we were to simulate non_convex now, we would expect its policy to perform better than the policies obtained from either of the two previous approaches.