ilqgames
A new real-time solver for large-scale differential games.
compute_strategy_costs.cpp
1 /*
2  * Copyright (c) 2020, The Regents of the University of California (Regents).
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are
7  * met:
8  *
9  * 1. Redistributions of source code must retain the above copyright
10  * notice, this list of conditions and the following disclaimer.
11  *
12  * 2. Redistributions in binary form must reproduce the above
13  * copyright notice, this list of conditions and the following
14  * disclaimer in the documentation and/or other materials provided
15  * with the distribution.
16  *
17  * 3. Neither the name of the copyright holder nor the names of its
18  * contributors may be used to endorse or promote products derived
19  * from this software without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS AS IS
22  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31  * POSSIBILITY OF SUCH DAMAGE.
32  *
33  * Please contact the author(s) of this library if you have any questions.
34  * Authors: David Fridovich-Keil ( dfk@eecs.berkeley.edu )
35  */
36 
37 ///////////////////////////////////////////////////////////////////////////////
38 //
39 // Compute costs for each player associated with this set of strategies and
40 // operating point.
41 //
42 ///////////////////////////////////////////////////////////////////////////////
43 
44 #include <ilqgames/cost/player_cost.h>
45 #include <ilqgames/dynamics/multi_player_flat_system.h>
46 #include <ilqgames/dynamics/multi_player_integrable_system.h>
47 #include <ilqgames/utils/compute_strategy_costs.h>
48 #include <ilqgames/utils/operating_point.h>
49 #include <ilqgames/utils/quadratic_cost_approximation.h>
50 #include <ilqgames/utils/strategy.h>
51 #include <ilqgames/utils/types.h>
52 
53 #include <glog/logging.h>
54 #include <Eigen/Dense>
55 #include <random>
56 #include <vector>
57 
58 namespace ilqgames {
59 
60 // Compute cost of a set of strategies for each player.
61 std::vector<float> ComputeStrategyCosts(
62  const std::vector<PlayerCost>& player_costs,
63  const std::vector<Strategy>& strategies,
64  const OperatingPoint& operating_point,
65  const MultiPlayerIntegrableSystem& dynamics, const VectorXf& x0,
66  bool open_loop) {
67  // Start at the initial state.
68  VectorXf x(x0);
69  Time t = 0.0;
70 
71  // Walk forward along the trajectory and accumulate total cost.
72  std::vector<VectorXf> us(dynamics.NumPlayers());
73  std::vector<float> total_costs(dynamics.NumPlayers(), 0.0);
74  const size_t num_time_steps =
75  (open_loop) ? strategies[0].Ps.size() - 1 : strategies[0].Ps.size();
76  for (size_t kk = 0; kk < num_time_steps; kk++) {
77  // Update controls.
78  for (PlayerIndex ii = 0; ii < dynamics.NumPlayers(); ii++) {
79  if (open_loop)
80  us[ii] = strategies[ii](kk, VectorXf::Zero(x.size()),
81  operating_point.us[kk][ii]);
82  else
83  us[ii] = strategies[ii](kk, x - operating_point.xs[kk],
84  operating_point.us[kk][ii]);
85  }
86 
87  const VectorXf next_x = dynamics.Integrate(t, time::kTimeStep, x, us);
88  const Time next_t = t + time::kTimeStep;
89 
90  // Update costs.
91  for (PlayerIndex ii = 0; ii < dynamics.NumPlayers(); ii++) {
92  const float cost =
93  (open_loop) ? player_costs[ii].EvaluateOffset(t, next_t, next_x, us)
94  : player_costs[ii].Evaluate(t, x, us);
95 
96  total_costs[ii] += cost;
97  }
98 
99  // Update state and time
100  x = next_x;
101  t = next_t;
102  }
103 
104  return total_costs;
105 }
106 
107 std::vector<float> ComputeStrategyCosts(const Problem& problem,
108  bool open_loop) {
109  return ComputeStrategyCosts(
110  problem.PlayerCosts(), problem.CurrentStrategies(),
111  problem.CurrentOperatingPoint(), *problem.Dynamics(),
112  problem.InitialState(), open_loop);
113 }
114 
115 } // namespace ilqgames