![]() |
aGrUM
0.16.0
|
#include <agrum/FMDP/learning/fmdpLearner.h>
Miscellaneous methods | |
double | __rmax |
learnerSize More... | |
double | __modaMax |
learnerSize More... | |
Size | size () |
learnerSize More... | |
const IVisitableGraphLearner * | varLearner (Idx actionId, const DiscreteVariable *var) const |
extractCount More... | |
virtual double | rMax () const |
learnerSize More... | |
virtual double | modaMax () const |
learnerSize More... | |
Definition at line 60 of file fmdpLearner.h.
|
private |
Definition at line 70 of file fmdpLearner.h.
|
private |
Definition at line 65 of file fmdpLearner.h.
|
private |
Definition at line 73 of file fmdpLearner.h.
gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::FMDPLearner | ( | double | learningThreshold, |
bool | actionReward, | ||
double | similarityThreshold = 0.05 |
||
) |
Default constructor.
Definition at line 48 of file fmdpLearner_tpl.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rewardLearner.
gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::~FMDPLearner | ( | ) |
Default destructor.
Definition at line 66 of file fmdpLearner_tpl.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionRewardLearners, and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rewardLearner.
|
inline |
Initializes the learner.
Definition at line 108 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize().
|
inline |
Initializes the learner.
Definition at line 113 of file fmdpLearner.h.
References gum::MultiDimFunctionGraph< GUM_SCALAR, TerminalNodePolicy >::getReducedAndOrderedInstance().
|
inline |
Initializes the learner.
Definition at line 119 of file fmdpLearner.h.
|
inline |
Initializes the learner.
Definition at line 162 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize().
|
inline |
Initializes the learner.
Definition at line 169 of file fmdpLearner.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__learningThreshold, and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__similarityThreshold.
|
inline |
Initializes the learner.
Definition at line 177 of file fmdpLearner.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__learningThreshold, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::size(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::updateFMDP().
|
inline |
Initializes the learner.
Definition at line 129 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize().
|
inline |
Initializes the learner.
Definition at line 137 of file fmdpLearner.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__learningThreshold, and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__similarityThreshold.
|
inline |
Initializes the learner.
Definition at line 149 of file fmdpLearner.h.
|
virtual |
Gives the learner a new transition.
actionId | : the action on which the transition was made |
obs | : the observed transition |
Implements gum::ILearningStrategy.
Definition at line 158 of file fmdpLearner_tpl.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionReward, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionRewardLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__fmdp, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rewardLearner, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rmax, gum::FMDP< GUM_SCALAR >::beginVariables(), gum::FMDP< GUM_SCALAR >::endVariables(), and gum::Observation::reward().
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateRewardLearner().
|
virtual |
Initializes the learner.
Implements gum::ILearningStrategy.
Definition at line 97 of file fmdpLearner_tpl.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionReward, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionRewardLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__fmdp, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateFunctionGraph(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateRewardLearner(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateVarLearner(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__modaMax, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rewardLearner, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rmax, gum::FMDP< GUM_SCALAR >::actionName(), gum::FMDP< GUM_SCALAR >::addReward(), gum::FMDP< GUM_SCALAR >::addRewardForAction(), gum::FMDP< GUM_SCALAR >::addTransitionForAction(), gum::FMDP< GUM_SCALAR >::beginActions(), gum::FMDP< GUM_SCALAR >::beginVariables(), gum::FMDP< GUM_SCALAR >::endActions(), gum::FMDP< GUM_SCALAR >::endVariables(), gum::Set< Key, Alloc >::insert(), gum::FMDP< GUM_SCALAR >::main2prime(), and gum::MultiDimFunctionGraph< GUM_SCALAR, TerminalNodePolicy >::setTableName().
|
inline virtual |
learnerSize
Implements gum::ILearningStrategy.
Definition at line 240 of file fmdpLearner.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__modaMax.
|
inline virtual |
learnerSize
Implements gum::ILearningStrategy.
Definition at line 234 of file fmdpLearner.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rmax.
|
virtual |
learnerSize
Implements gum::ILearningStrategy.
Definition at line 192 of file fmdpLearner_tpl.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionReward, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionRewardLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__fmdp, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rewardLearner, gum::FMDP< GUM_SCALAR >::beginActions(), gum::FMDP< GUM_SCALAR >::beginVariables(), gum::FMDP< GUM_SCALAR >::endActions(), and gum::FMDP< GUM_SCALAR >::endVariables().
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateRewardLearner().
|
virtual |
Starts an update of the data structure in the associated FMDP.
Implements gum::ILearningStrategy.
Definition at line 221 of file fmdpLearner_tpl.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionReward, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionRewardLearners, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__fmdp, gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__rewardLearner, gum::FMDP< GUM_SCALAR >::beginActions(), gum::FMDP< GUM_SCALAR >::beginVariables(), gum::FMDP< GUM_SCALAR >::endActions(), and gum::FMDP< GUM_SCALAR >::endVariables().
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateRewardLearner().
|
inline virtual |
extractCount
Implements gum::ILearningStrategy.
Definition at line 229 of file fmdpLearner.h.
References gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__actionLearners.
|
private |
Definition at line 252 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::size(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::updateFMDP(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::varLearner(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::~FMDPLearner().
|
private |
Definition at line 254 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::size(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::updateFMDP().
|
private |
Definition at line 255 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::size(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::updateFMDP(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::~FMDPLearner().
|
private |
The FMDP to store the learned model.
Definition at line 250 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::size(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::updateFMDP().
|
private |
Definition at line 258 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateRewardLearner(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateVarLearner().
|
private |
learnerSize
Definition at line 243 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::modaMax().
|
private |
Definition at line 256 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::FMDPLearner(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::size(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::updateFMDP(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::~FMDPLearner().
|
private |
learnerSize
Definition at line 237 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::addObservation(), gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::initialize(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::rMax().
|
private |
Definition at line 259 of file fmdpLearner.h.
Referenced by gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateRewardLearner(), and gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::__instantiateVarLearner().