slight refactoring of cost functions + example tweaks

murrayrm · murrayrm · commit ea2884d0287a · 2021-02-26T22:46:34.000-08:00
diff --git a/control/obc.py b/control/obc.py
@@ -55,7 +55,7 @@ class OptimalControlProblem():
     def __init__(
             self, sys, time_vector, integral_cost, trajectory_constraints=[],
             terminal_cost=None, terminal_constraints=[], initial_guess=None,
-            log=False, options={}):
+            log=False, **kwargs):
         """Set up an optimal control problem
 
         To describe an optimal control problem we need an input/output system,
@@ -90,8 +90,8 @@ def __init__(
             extension of the time axis.
         log : bool, optional
             If `True`, turn on logging messages (using Python logging module).
-        options : dict, optional
-            Solver options (passed to :func:`scipy.optimal.minimize`).
+        kwargs : dict, optional
+            Additional parameters (passed to :func:`scipy.optimize.minimize`).
 
         Returns
         -------
@@ -107,7 +107,7 @@ def __init__(
         self.trajectory_constraints = trajectory_constraints
         self.terminal_cost = terminal_cost
         self.terminal_constraints = terminal_constraints
-        self.options = options
+        self.kwargs = kwargs
 
         #
         # Compute and store constraints
@@ -251,7 +251,15 @@ def _cost_function(self, inputs):
         # TODO: vectorize
         cost = 0
         for i, t in enumerate(self.time_vector):
-            cost += self.integral_cost(states[:,i], inputs[:,i])
+            if ct.isctime(self.system):
+                # Approximate the integral using trapezoidal rule
+                if i > 0:
+                    cost += 0.5 * (
+                        self.integral_cost(states[:, i-1], inputs[:, i-1]) +
+                        self.integral_cost(states[:, i], inputs[:, i])) * (
+                            self.time_vector[i] - self.time_vector[i-1])
+            else:
+                cost += self.integral_cost(states[:,i], inputs[:,i])
 
         # Terminal cost
         if self.terminal_cost is not None:
@@ -573,7 +581,7 @@ def compute_trajectory(
         # Call ScipPy optimizer
         res = sp.optimize.minimize(
             self._cost_function, self.initial_guess,
-            constraints=self.constraints, options=self.options)
+            constraints=self.constraints, **self.kwargs)
 
         # Process and return the results
         return OptimalControlResult(
@@ -676,7 +684,7 @@ def __init__(
 def compute_optimal_input(
         sys, horizon, X0, cost, constraints=[], terminal_cost=None,
         terminal_constraints=[], initial_guess=None, squeeze=None,
-        transpose=None, return_x=None, log=False, options={}):
+        transpose=None, return_x=None, log=False, **kwargs):
 
     """Compute the solution to an optimal control problem
 
@@ -743,8 +751,8 @@ def compute_optimal_input(
         If True, assume that 2D input arrays are transposed from the standard
         format.  Used to convert MATLAB-style inputs to our format.
 
-    options : dict, optional
-        Solver options (passed to :func:`scipy.optimal.minimize`).
+    kwargs : dict, optional
+        Additional parameters (passed to :func:`scipy.optimize.minimize`).
 
     Returns
     -------
@@ -763,7 +771,7 @@ def compute_optimal_input(
     ocp = OptimalControlProblem(
         sys, horizon, cost, trajectory_constraints=constraints,
         terminal_cost=terminal_cost, terminal_constraints=terminal_constraints,
-        initial_guess=initial_guess, log=log, options=options)
+        initial_guess=initial_guess, log=log, **kwargs)
 
     # Solve for the optimal input from the current state
     return ocp.compute_trajectory(
@@ -773,7 +781,7 @@ def compute_optimal_input(
 # Create a model predictive controller for an optimal control problem
 def create_mpc_iosystem(
         sys, horizon, cost, constraints=[], terminal_cost=None,
-        terminal_constraints=[], dt=True, log=False, options={}):
+        terminal_constraints=[], dt=True, log=False, **kwargs):
     """Create a model predictive I/O control system
 
     This function creates an input/output system that implements a model
@@ -805,8 +813,8 @@ def create_mpc_iosystem(
         List of constraints that should hold at the end of the trajectory.
         Same format as `constraints`.
 
-    options : dict, optional
-        Solver options (passed to :func:`scipy.optimal.minimize`).
+    kwargs : dict, optional
+        Additional parameters (passed to :func:`scipy.optimize.minimize`).
 
     Returns
     -------
@@ -821,7 +829,7 @@ def create_mpc_iosystem(
     ocp = OptimalControlProblem(
         sys, horizon, cost, trajectory_constraints=constraints,
         terminal_cost=terminal_cost, terminal_constraints=terminal_constraints,
-        log=log, options=options)
+        log=log, **kwargs)
 
     # Return an I/O system implementing the model predictive controller
     return ocp._create_mpc_iosystem(dt=dt)
@@ -863,8 +871,28 @@ def quadratic_cost(sys, Q, R, x0=0, u0=0):
         input.  The call signature of the function is cost_fun(x, u).
 
     """
-    Q = np.atleast_2d(Q)
-    R = np.atleast_2d(R)
+    # Process the input arguments
+    if Q is not None:
+        Q = np.atleast_2d(Q)
+        if Q.size == 1:         # allow scalar weights
+            Q = np.eye(sys.nstates) * Q.item()
+        elif Q.shape != (sys.nstates, sys.nstates):
+            raise ValueError("Q matrix is the wrong shape")
+
+    if R is not None:
+        R = np.atleast_2d(R)
+        if R.size == 1:         # allow scalar weights
+            R = np.eye(sys.ninputs) * R.item()
+        elif R.shape != (sys.ninputs, sys.ninputs):
+            raise ValueError("R matrix is the wrong shape")
+
+    if Q is None:
+        return lambda x, u: ((u-u0) @ R @ (u-u0)).item()
+
+    if R is None:
+        return lambda x, u: ((x-x0) @ Q @ (x-x0)).item()
+
+    # Received both Q and R matrices
     return lambda x, u: ((x-x0) @ Q @ (x-x0) + (u-u0) @ R @ (u-u0)).item()
 
 
diff --git a/examples/steering-optimal.py b/examples/steering-optimal.py
@@ -92,60 +92,101 @@ def plot_results(t, y, u, figure=None, yf=None):
 xf = [100., 2., 0.]; uf = [10., 0.]
 Tf = 10
 
-# Set up the cost functions
-Q = np.diag([0.1, 1, 0.1])      # keep lateral error low
-R = np.eye(2)                   # minimize applied inputs
-cost = obc.quadratic_cost(vehicle, Q, R, x0=xf, u0=uf)
-
 #
-# Set up different types of constraints to demonstrate
+# Approach 1: standard quadratic cost
+#
+# We can set up the optimal control problem as trying to minimize the
+# distance from the desired final point while at the same time not
+# exerting too much control effort to achieve our goal.
+#
+# Note: depending on what version of SciPy you are using, you might get a
+# warning message about precision loss, but the solution is pretty good.
 #
 
-# Input constraints
-constraints = [ obc.input_range_constraint(vehicle, [8, -0.1], [12, 0.1]) ]
-
-# Terminal constraints (optional)
-terminal = [ obc.state_range_constraint(vehicle, xf, xf) ]
+# Set up the cost functions
+Q = np.diag([1, 10, 1])     # keep lateral error low
+R = np.diag([1, 1])         # minimize applied inputs
+cost1 = obc.quadratic_cost(vehicle, Q, R, x0=xf, u0=uf)
 
-# Time horizon and possible initial guessses
+# Define the time horizon (and spacing) for the optimization
 horizon = np.linspace(0, Tf, 10, endpoint=True)
-straight = [10, 0]              # straight trajectory
-bend_left = [10, 0.01]          # slight left veer
 
-#
-# Solve the optimal control problem in dififerent ways
-#
+# Provide an initial guess (will be extended to entire horizon)
+bend_left = [10, 0.01]          # slight left veer
 
-# Basic setup: quadratic cost, no terminal constraint, straight initial path
+# Turn on debug level logging so that we can see what the optimizer is doing
 logging.basicConfig(
-    level=logging.DEBUG, filename="steering-straight.log",
+    level=logging.DEBUG, filename="steering-integral_cost.log",
     filemode='w', force=True)
-result = obc.compute_optimal_input(
-    vehicle, horizon, x0, cost, initial_guess=straight,
-    log=True, options={'eps': 0.01})
-t1, u1 = result.time, result.inputs
+
+# Compute the optimal control, setting step size for gradient calculation (eps)
+result1 = obc.compute_optimal_input(
+    vehicle, horizon, x0, cost1, initial_guess=bend_left, log=True,
+    options={'eps': 0.01})
+
+# Extract and plot the results (+ state trajectory)
+t1, u1 = result1.time, result1.inputs
 t1, y1 = ct.input_output_response(vehicle, horizon, u1, x0)
 plot_results(t1, y1, u1, figure=1, yf=xf[0:2])
 
-# Add constraint on the input to avoid high steering angles
+#
+# Approach 2: input cost, input constraints, terminal cost
+#
+# The previous solution integrates the position error for the entire
+# horizon, and so the car changes lanes very quickly (at the cost of larger
+# inputs).  Instead, we can penalize the final state and impose a higher
+# cost on the inputs, resulting in a more gradual lane change.
+#
+# We also set the solver explicitly (it's actually the default one, but
+# this shows how to do it).
+#
+
+# Add input constraint, input cost, terminal cost
+constraints = [ obc.input_range_constraint(vehicle, [8, -0.1], [12, 0.1]) ]
+traj_cost = obc.quadratic_cost(vehicle, None, np.diag([0.1, 1]), u0=uf)
+term_cost = obc.quadratic_cost(vehicle, np.diag([1, 10, 10]), None, x0=xf)
+
+# Change logging to keep less information
 logging.basicConfig(
-    level=logging.INFO, filename="./steering-bendleft.log",
+    level=logging.INFO, filename="./steering-terminal_cost.log",
     filemode='w', force=True)
-result = obc.compute_optimal_input(
-    vehicle, horizon, x0, cost, constraints, initial_guess=bend_left,
-    log=True, options={'eps': 0.01})
-t2, u2 = result.time, result.inputs
+
+# Compute the optimal control
+result2 = obc.compute_optimal_input(
+    vehicle, horizon, x0, traj_cost, constraints, terminal_cost=term_cost,
+    initial_guess=bend_left, log=True,
+    method='SLSQP', options={'eps': 0.01})
+
+# Extract and plot the results (+ state trajectory)
+t2, u2 = result2.time, result2.inputs
 t2, y2 = ct.input_output_response(vehicle, horizon, u2, x0)
 plot_results(t2, y2, u2, figure=2, yf=xf[0:2])
 
-# Resolve with a terminal constraint (starting with previous result)
-logging.basicConfig(
-    level=logging.WARN, filename="./steering-terminal.log",
-    filemode='w', force=True)
-result = obc.compute_optimal_input(
-    vehicle, horizon, x0, cost, constraints,
-    terminal_constraints=terminal, initial_guess=u2,
-    log=True, options={'eps': 0.01})
-t3, u3 = result.time, result.inputs
+#
+# Approach 3: terminal constraints and new solver
+#
+# As a final example, we can remove the cost function on the state and
+# replace it with a terminal *constraint* on the state.  If a solution is
+# found, it guarantees we get to exactly the final state.
+#
+# To speed things up a bit, we initialize the problem using the previous
+# optimal controller (which didn't quite hit the final value).
+#
+
+# Input cost and terminal constraints
+cost3 = obc.quadratic_cost(vehicle, np.zeros((3,3)), R, u0=uf)
+terminal = [ obc.state_range_constraint(vehicle, xf, xf) ]
+
+# Reset logging to its default values
+logging.basicConfig(level=logging.WARN, force=True)
+
+# Compute the optimal control
+result3 = obc.compute_optimal_input(
+    vehicle, horizon, x0, cost3, constraints,
+    terminal_constraints=terminal, initial_guess=u2, log=True,
+    options={'eps': 0.01})
+
+# Extract and plot the results (+ state trajectory)
+t3, u3 = result3.time, result3.inputs
 t3, y3 = ct.input_output_response(vehicle, horizon, u3, x0)
 plot_results(t3, y3, u3, figure=3, yf=xf[0:2])