slight code refactoring + docstrings + initial doc/obc.rst

murrayrm · murrayrm · commit 2456f365057c · 2021-02-26T22:46:34.000-08:00
diff --git a/control/obc.py b/control/obc.py
diff --git a/control/tests/obc_test.py b/control/tests/obc_test.py
@@ -13,7 +13,7 @@
 from control.tests.conftest import slycotonly
 
 
-def test_finite_horizon_mpc_simple():
+def test_finite_horizon_simple():
     # Define a linear system with constraints
     # Source: https://www.mpt3.org/UI/RegulationProblem
 
@@ -30,18 +30,13 @@ def test_finite_horizon_mpc_simple():
     R = [[1]]
     cost = obc.quadratic_cost(sys, Q, R)
 
-    # Create a model predictive controller system
+    # Set up the optimal control problem
     time = np.arange(0, 5, 1)
-    optctrl = obc.OptimalControlProblem(sys, time, cost, constraints)
-    mpc = optctrl.mpc
-
-    # Optimal control input for a given value of the initial state
     x0 = [4, 0]
-    u = mpc(x0)
-    np.testing.assert_almost_equal(u, -1)
 
     # Retrieve the full open-loop predictions
-    t, u_openloop = optctrl.compute_trajectory(x0, squeeze=True)
+    t, u_openloop = obc.compute_optimal_input(
+        sys, time, x0, cost, constraints, squeeze=True)
     np.testing.assert_almost_equal(
         u_openloop, [-1, -1, 0.1393, 0.3361, -5.204e-16], decimal=4)
 
@@ -54,7 +49,7 @@ def test_finite_horizon_mpc_simple():
 
 
 @slycotonly
-def test_finite_horizon_mpc_oscillator():
+def test_class_interface():
     # oscillator model defined in 2D
     # Source: https://www.mpt3.org/UI/RegulationProblem
     A = [[0.5403, -0.8415], [0.8415, 0.5403]]
@@ -124,11 +119,10 @@ def test_mpc_iosystem():
     cost = obc.quadratic_cost(model, Q, R, x0=xd, u0=ud)
 
     # online MPC controller object is constructed with a horizon 6
-    optctrl = obc.OptimalControlProblem(
+    ctrl = obc.create_mpc_iosystem(
         model, np.arange(0, 6) * 0.2, cost, constraints)
 
     # Define an I/O system implementing model predictive control
-    ctrl = optctrl.create_mpc_iosystem()
     loop = ct.feedback(sys, ctrl, 1)
 
     # Choose a nearby initial condition to speed up computation
diff --git a/doc/classes.rst b/doc/classes.rst
@@ -30,3 +30,14 @@ that allow for linear, nonlinear, and interconnected elements:
    LinearICSystem
    LinearIOSystem
    NonlinearIOSystem
+
+Additional classes
+==================
+.. autosummary::
+
+   flatsys.BasisFamily
+   flatsys.FlatSystem
+   flatsys.LinearFlatSystem
+   flatsys.PolyFamily
+   flatsys.SystemTrajectory
+   obc.OptimalControlProblem
diff --git a/doc/examples.rst b/doc/examples.rst
@@ -43,5 +43,6 @@ using running examples in FBS2e.
 
    cruise
    describing_functions
+   mpc_aircraft
    steering
    pvtol-lqr-nested
diff --git a/doc/index.rst b/doc/index.rst
@@ -30,6 +30,7 @@ implements basic operations for analysis and design of feedback control systems.
    flatsys
    iosys
    descfcn
+   obc
    examples
 
 * :ref:`genindex`
diff --git a/doc/mpc-overview.png b/doc/mpc-overview.png
diff --git a/doc/mpc_aircraft.ipynb b/doc/mpc_aircraft.ipynb
@@ -0,0 +1 @@
+../examples/mpc_aircraft.ipynb
diff --git a/doc/obc.rst b/doc/obc.rst
@@ -0,0 +1,140 @@
+.. _obc-module:
+
+**************************
+Optimization-based control
+**************************
+
+.. automodule:: control.obc
+   :no-members:
+   :no-inherited-members:
+
+Optimal control problem setup
+=============================
+
+Consider now the *optimal control problem*:
+
+.. math::
+
+  \min_{u(\cdot)} 
+  \int_0^T L(x,u)\, dt + V \bigl( x(T) \bigr)
+
+subject to the constraint
+
+.. math::
+
+  \dot x = f(x, u), \qquad x\in\mathbb{R}^n,\, u\in\mathbb{R}^m.
+
+Abstractly, this is a constrained optimization problem where we seek a
+*feasible trajectory* :math:`(x(t), u(t))` that minimizes the cost function
+
+.. math::
+
+  J(x, u) = \int_0^T L(x,u)\, dt + V \bigl( x(T) \bigr).
+
+More formally, this problem is equivalent to the "standard" problem of
+minimizing a cost function :math:`J(x, u)` where :math:`(x, u) \in L_2[0,T]`
+(the set of square integrable functions) and :math:`h(z) = \dot x(t) -
+f(x(t), u(t)) = 0` models the dynamics.  The term :math:`L(x, u)` is
+referred to as the integral (or trajectory) cost and :math:`V(x(T))` is the
+final (or terminal) cost.
+
+It is often convenient to ask that the final value of the trajectory,
+denoted :math:`x_\text{f}`, be specified.  We can do this by requiring that
+:math:`x(T) = x_\text{f}` or by using a more general form of constraint:
+
+.. math::
+   
+  \psi_i(x(T)) = 0, \qquad i = 1, \dots, q.
+
+The fully constrained case is obtained by setting :math:`q = n` and defining
+:math:`\psi_i(x(T)) = x_i(T) - x_{i,\text{f}}`.  For a control problem with
+a full set of terminal constraints, :math:`V(x(T))` can be omitted (since
+its value is fixed).
+
+Finally, we may wish to consider optimizations in which either the state or
+the inputs are constrained by a set of nonlinear functions of the form
+
+.. math::
+   
+  \text{lb}_i \leq g_i(x, u) \leq \text{ub}_i, \qquad i = 1, \dots, k,
+
+where :math:`\text{lb}_i` and :math:`\text{ub}_i` represent lower and upper
+bounds on the constraint function :math:`g_i`.  Note that these constraints
+can be on the input, the state, or combinations of input and state,
+depending on the form of :math:`g_i`.  Furthermore, these constraints are
+intended to hold at all instants in time along the trajectory.
+
+A common use of optimization-based control techniques is the implementation
+of model predictive control (also called receding horizon control).  In
+model predictive control, a finite horizon optimal control problem is solved,
+generating open-loop state and control trajectories.  The resulting control
+trajectory is applied to the system for a fraction of the horizon
+length. This process is then repeated, resulting in a sampled data feedback
+law.  This approach is illustrated in the following figure:
+
+.. image:: mpc-overview.png
+
+Every :math:`\Delta T` seconds, an optimal control problem is solved over a
+:math:`T` second horizon, starting from the current state.  The first
+:math:`\Delta T` seconds of the optimal control :math:`u_T^{\*}(\cdot;
+x(t))` is then applied to the system. If we let :math:`x_T^{\*}(\cdot;
+x(t))` represent the optimal trajectory starting from :math:`x(t)`, then the
+system state evolves from :math:`x(t)` at current time :math:`t` to
+:math:`x_T^{*}(\Delta T; x(t))` at the next sample time :math:`t + \Delta
+T`, assuming no model uncertainty.
+
+In reality, the system will not follow the predicted path exactly, so that
+the red (computed) and blue (actual) trajectories will diverge.  We thus
+recompute the optimal path from the new state at time :math:`t + \Delta T`,
+extending our horizon by an additional :math:`\Delta T` units of time.  This
+approach can be shown to generate stabilizing control laws under suitable
+conditions (see, for example, the FBS2e supplement on `Optimization-Based
+Control <https://fbswiki.org/wiki/index.php/OBC>`_).
+  
+Module usage
+============
+
+The `obc` module provides a means of computing optimal trajectories for
+nonlinear systems and implementing optimization-based controllers, including
+model predictive control.  It follows the basic problem setup described
+above, but carries out all computations in *discrete time* (so that
+integrals become sums) and over a *finite horizon*.
+
+To describe an optimal control problem we need an input/output system, a
+time horizon, a cost function, and (optionally) a set of constraints on the
+state and/or input, either along the trajectory or at the terminal time.
+The `obc` module operates by converting the optimal control problem into a
+standard optimization problem that can be solved by
+:func:`scipy.optimize.minimize`.  The optimal control problem can be solved
+by using the `~control.obc.compute_optimal_input` function::
+
+  import control.obc as obc
+  inputs = obc.compute_optimal_input(sys, horizon, X0, cost, constraints)
+
+The `sys` parameter should be a :class:`~control.InputOutputSystem` and the
+`horizon` parameter should represent a time vector that gives the list of
+times at which the `cost` and `constraints` should be evaluated. By default,
+`constraints` are taken to be trajectory constraints holding at all points
+on the trajectory.  The `terminal_constraint` parameter can be used to
+specify a constraint that only holds at the final point of the trajectory
+and the `terminal_cost` parameter can be used to specify a terminal cost
+function.
+
+
+Example
+=======
+
+Module classes and functions
+============================
+.. autosummary::
+   :toctree: generated/
+
+   ~control.obc.OptimalControlProblem
+   ~control.obc.compute_optimal_input
+   ~control.obc.create_mpc_iosystem
+   ~control.obc.input_poly_constraint
+   ~control.obc.input_range_constraint
+   ~control.obc.output_poly_constraint
+   ~control.obc.output_range_constraint
+   ~control.obc.state_poly_constraint
+   ~control.obc.state_range_constraint
diff --git a/examples/mpc_aircraft.ipynb b/examples/mpc_aircraft.ipynb
@@ -78,7 +78,7 @@
     "cost = obc.quadratic_cost(model, Q, R, x0=xd, u0=ud)\n",
     "\n",
     "# online MPC controller object is constructed with a horizon 6\n",
-    "optctrl = obc.OptimalControlProblem(model, np.arange(0, 6) * 0.2, cost, constraints)"
+    "ctrl = obc.create_mpc_iosystem(model, np.arange(0, 6) * 0.2, cost, constraints)"
    ]
   },
   {
@@ -99,7 +99,6 @@
    ],
    "source": [
     "# Define an I/O system implementing model predictive control\n",
-    "ctrl = optctrl.create_mpc_iosystem()\n",
     "loop = ct.feedback(sys, ctrl, 1)\n",
     "print(loop)"
    ]

Original file line number	Diff line number	Diff line change
`@@ -78,7 +78,7 @@`
`78`	`78`	`"cost = obc.quadratic_cost(model, Q, R, x0=xd, u0=ud)\n",`
`79`	`79`	`"\n",`
`80`	`80`	`"# online MPC controller object is constructed with a horizon 6\n",`
`81`		`- "optctrl = obc.OptimalControlProblem(model, np.arange(0, 6) * 0.2, cost, constraints)"`
	`81`	`+ "ctrl = obc.create_mpc_iosystem(model, np.arange(0, 6) * 0.2, cost, constraints)"`
`82`	`82`	`]`
`83`	`83`	`},`
`84`	`84`	`{`
`@@ -99,7 +99,6 @@`
`99`	`99`	`],`
`100`	`100`	`"source": [`
`101`	`101`	`"# Define an I/O system implementing model predictive control\n",`
`102`		`- "ctrl = optctrl.create_mpc_iosystem()\n",`
`103`	`102`	`"loop = ct.feedback(sys, ctrl, 1)\n",`
`104`	`103`	`"print(loop)"`
`105`	`104`	`]`