ilqgames
A new real-time solver for large-scale differential games.
quadratic_cost_approximation.h
1 /*
2  * Copyright (c) 2019, The Regents of the University of California (Regents).
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are
7  * met:
8  *
9  * 1. Redistributions of source code must retain the above copyright
10  * notice, this list of conditions and the following disclaimer.
11  *
12  * 2. Redistributions in binary form must reproduce the above
13  * copyright notice, this list of conditions and the following
14  * disclaimer in the documentation and/or other materials provided
15  * with the distribution.
16  *
17  * 3. Neither the name of the copyright holder nor the names of its
18  * contributors may be used to endorse or promote products derived
19  * from this software without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS AS IS
22  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31  * POSSIBILITY OF SUCH DAMAGE.
32  *
33  * Please contact the author(s) of this library if you have any questions.
34  * Authors: David Fridovich-Keil ( dfk@eecs.berkeley.edu )
35  */
36 
37 ///////////////////////////////////////////////////////////////////////////////
38 //
39 // Container to store a quadratic approximation of a single player's cost at a
40 // particular moment in time. That is, each player should have a time-indexed
41 // set of these QuadraticApproximations.
42 //
43 // Notation is taken from Basar and Olsder, Corollary 6.1.
44 // -- Q is the Hessian with respect to state
45 // -- l is the gradient with respect to state
46 // -- Rs[ii] is the Hessian with respect to the control input of player ii
47 // -- rs[ii] is the gradient with respect to the control input of player ii
48 //
49 ///////////////////////////////////////////////////////////////////////////////
50 
51 #ifndef ILQGAMES_UTILS_QUADRATIC_COST_APPROXIMATION_H
52 #define ILQGAMES_UTILS_QUADRATIC_COST_APPROXIMATION_H
53 
54 #include <ilqgames/utils/types.h>
55 
56 #include <glog/logging.h>
57 #include <unordered_map>
58 
59 namespace ilqgames {
60 
62  MatrixXf hess;
63  VectorXf grad;
64 
65  // Construct from matrix/vector directly.
66  SingleCostApproximation(const MatrixXf& hessian, const VectorXf& gradient)
67  : hess(hessian), grad(gradient) {
68  CHECK_EQ(hess.rows(), hess.cols());
69  CHECK_EQ(hess.rows(), grad.size());
70  }
71 
72  // Construct with zeros.
73  SingleCostApproximation(Dimension dim, float regularization = 0.0)
74  : hess(regularization * MatrixXf::Identity(dim, dim)),
75  grad(VectorXf::Zero(dim)) {}
76 }; // struct SingleCostApproximation
77 
80  PlayerMap<SingleCostApproximation> control;
81 
82  // Construct from state dimension.
83  explicit QuadraticCostApproximation(Dimension xdim,
84  float regularization = 0.0)
85  : state(xdim, regularization) {}
86 }; // struct QuadraticCostApproximation
87 
88 } // namespace ilqgames
89 
90 #endif