aGrUM  0.20.3
a C++ library for (probabilistic) graphical models
E_GreedyDecider.h
Go to the documentation of this file.
1 /**
2  *
3  * Copyright (c) 2005-2021 by Pierre-Henri WUILLEMIN(@LIP6) & Christophe GONZALES(@AMU)
4  * info_at_agrum_dot_org
5  *
6  * This library is free software: you can redistribute it and/or modify
7  * it under the terms of the GNU Lesser General Public License as published by
8  * the Free Software Foundation, either version 3 of the License, or
9  * (at your option) any later version.
10  *
11  * This library is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14  * GNU Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public License
17  * along with this library. If not, see <http://www.gnu.org/licenses/>.
18  *
19  */
20 
21 
22 /**
23  * @file
24  * @brief Headers of the epsilon-greedy decision maker class.
25  *
26  * @author Pierre-Henri WUILLEMIN(@LIP6) and Jean-Christophe MAGNAN and Christophe
27  * GONZALES(@AMU)
28  */
29 
30 
31 // =========================================================================
32 #ifndef GUM_E_GREEDY_DECIDER_H
33 #define GUM_E_GREEDY_DECIDER_H
34 // =========================================================================
35 #include <agrum/tools/core/types.h>
36 // =========================================================================
37 #include <agrum/FMDP/SDyna/Strategies/IDecisionStrategy.h>
38 #include <agrum/FMDP/SDyna/Strategies/IPlanningStrategy.h>
39 #include <agrum/FMDP/fmdp.h>
40 #include <agrum/FMDP/planning/actionSet.h>
41 #include <agrum/FMDP/simulation/statesChecker.h>
42 // =========================================================================
43 #include <agrum/tools/variables/discreteVariable.h>
44 // =========================================================================
45 
46 namespace gum {
47 
48  /**
49  * @class E_GreedyDecider E_GreedyDecider.h
50  * <agrum/FMDP/decision/E_GreedyDecider.h>
51  * @brief Class to make decision following an epsilon-greedy compromise
52  * between exploration and exploitation
53  *
54  *
55  */
57  // ###################################################################
58  /// @name Constructor & destructor.
59  // ###################################################################
60  /// @{
61  public:
62  // ==========================================================================
63  /// Constructor
64  // ==========================================================================
66 
67  // ==========================================================================
68  /// Destructor
69  // ==========================================================================
70  ~E_GreedyDecider();
71 
72  /// @}
73 
74  // ###################################################################
75  /// @name Initialization
76  // ###################################################################
77  /// @{
78  public:
79  // ==========================================================================
80  /// Initializes the learner
81  // ==========================================================================
82  void initialize(const FMDP< double >* fmdp);
83 
84  /// @}
85 
86 
87  // ###################################################################
88  /// @name Incremental methods
89  // ###################################################################
90  /// @{
91  public:
92  void checkState(const Instantiation& newState, Idx actionId);
93 
95 
96  /// @}
97 
98  private:
100  double _sss_;
101  };
102 } // namespace gum
103 #endif // GUM_E_GREEDY_DECIDER_H
void initialize(const FMDP< double > *fmdp)
Initializes the learner.
INLINE void emplace(Args &&... args)
Definition: set_tpl.h:643
ActionSet stateOptimalPolicy(const Instantiation &curState)
void checkState(const Instantiation &newState, Idx actionId)
StatesChecker _statecpt_
E_GreedyDecider()
Constructor.
<agrum/FMDP/decision/E_GreedyDecider.h>
~E_GreedyDecider()
Destructor.