31 #ifndef GUM_ADAPTIVE_RMAX_PLANER_H 32 #define GUM_ADAPTIVE_RMAX_PLANER_H 66 double discountFactor = 0.9,
67 double epsilon = 0.00001,
68 bool verbose =
true) {
80 double discountFactor = 0.9,
81 double epsilon = 0.00001,
82 bool verbose =
true) {
101 double discountFactor,
219 #endif // GUM_ADAPTIVE_RMAX_PLANER_H void makePlanning(Idx nbStep=1000000)
Performs a value iteration.
HashTable< Idx, StatesCounter *> __counterTable
HashTable< Idx, MultiDimFunctionGraph< double > *> __actionsBoolTable
<agrum/FMDP/planning/structuredPlaner.h>
~AdaptiveRMaxPlaner()
Default destructor.
virtual MultiDimFunctionGraph< double > * _valueIteration()
Performs a single step of value iteration.
Copyright 2005-2019 Pierre-Henri WUILLEMIN et Christophe GONZALES (LIP6) {prenom.nom}_at_lip6.fr.
<agrum/FMDP/SDyna/IDecisionStrategy.h>
static AdaptiveRMaxPlaner * ReducedAndOrderedInstance(const ILearningStrategy *learner, double discountFactor=0.9, double epsilon=0.00001, bool verbose=true)
std::pair< NodeId, NodeId > __visitLearner(const IVisitableGraphLearner *, NodeId currentNodeId, MultiDimFunctionGraph< double > *, MultiDimFunctionGraph< double > *)
<agrum/FMDP/SDyna/IVisitableGraphLearner.h>
const ILearningStrategy * __fmdpLearner
AdaptiveRMaxPlaner(IOperatorStrategy< double > *opi, double discountFactor, double epsilon, const ILearningStrategy *learner, bool verbose)
Default constructor.
<agrum/FMDP/planning/mddOperatorStrategy.h>
Copyright 2005-2019 Pierre-Henri WUILLEMIN et Christophe GONZALES (LIP6) {prenom.nom}_at_lip6.fr.
The class for generic Hash Tables.
HashTable< Idx, bool > __initializedTable
Copyright 2005-2019 Pierre-Henri WUILLEMIN et Christophe GONZALES (LIP6) {prenom.nom}_at_lip6.fr.
Copyright 2005-2019 Pierre-Henri WUILLEMIN et Christophe GONZALES (LIP6) {prenom.nom}_at_lip6.fr.
Copyright 2005-2019 Pierre-Henri WUILLEMIN et Christophe GONZALES (LIP6) {prenom.nom}_at_lip6.fr.
<agrum/FMDP/SDyna/ILearningStrategy.h>
void __makeRMaxFunctionGraphs()
<agrum/FMDP/planning/treeOperatorStrategy.h>
HashTable< Idx, MultiDimFunctionGraph< double > *> __actionsRMaxTable
static AdaptiveRMaxPlaner * TreeInstance(const ILearningStrategy *learner, double discountFactor=0.9, double epsilon=0.00001, bool verbose=true)
Class for assigning/browsing values to tuples of discrete variables.
<agrum/FMDP/planning/adaptiveRMaxPlaner.h>
void initialize(const FMDP< double > *fmdp)
Initializes the data structures needed for planning.
INLINE const FMDP< double > * fmdp()
Returns a const pointer to the Factored Markov Decision Process on which planning is performed.
virtual void _initVFunction()
Initializes the value function.
Size Idx
Type for indexes.
void checkState(const Instantiation &newState, Idx actionId)
Copyright 2005-2019 Pierre-Henri WUILLEMIN et Christophe GONZALES (LIP6) {prenom.nom}_at_lip6.fr.
Size NodeId
Type for node ids.
virtual void _evalPolicy()
Performs the tasks required to extract an optimal policy.