d8/d30/fmdpLearner_8h_source.html

 /**
  *
  *   Copyright 2005-2020 Pierre-Henri WUILLEMIN(@LIP6) & Christophe GONZALES(@AMU)
  *   info_at_agrum_dot_org
  *
  *  This library is free software: you can redistribute it and/or modify
  *  it under the terms of the GNU Lesser General Public License as published by
  *  the Free Software Foundation, either version 3 of the License, or
  *  (at your option) any later version.
  *
  *  This library is distributed in the hope that it will be useful,
  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  *  GNU Lesser General Public License for more details.
  *
  *  You should have received a copy of the GNU Lesser General Public License
  *  along with this library.  If not, see <http://www.gnu.org/licenses/>.
  *
  */


 /**
  * @file
  * @brief Headers of the FMDPLearner class.
  *
  * @author Jean-Christophe MAGNAN
  */

 // =========================================================================
 #ifndef GUM_FMDP_LEARNER_H
 #define GUM_FMDP_LEARNER_H
 // =========================================================================
 #include <agrum/tools/core/hashTable.h>
 // =========================================================================
 #include <agrum/FMDP/SDyna/Strategies/ILearningStrategy.h>
 #include <agrum/FMDP/fmdp.h>
 #include <agrum/FMDP/learning/datastructure/imddi.h>
 #include <agrum/FMDP/learning/datastructure/iti.h>
 #include <agrum/FMDP/learning/observation.h>
 // =========================================================================
 #include <agrum/tools/variables/discreteVariable.h>
 // =========================================================================

 namespace gum {

   /**
    * @class FMDPLearner
    * @headerfile fmdpLearner.h <agrum/FMDP/learning/fmdpLearner.h>
    * @brief Learning strategy that feeds observed transitions to one learner
    * per (action, variable) pair and to reward learner(s), and stores the
    * learned model in an FMDP.
    * @ingroup fmdp_group
    *
    * @tparam VariableAttributeSelection test forwarded to the IMDDI / ITI
    * learners of the variables.
    * @tparam RewardAttributeSelection test forwarded to the IMDDI / ITI
    * learners of the reward.
    * @tparam LearnerSelection selects, through LearnerSelect and the
    * Int2Type overloads below, between the IMDDILEARNER and ITILEARNER
    * variants.
    */
   template < TESTNAME    VariableAttributeSelection,
              TESTNAME    RewardAttributeSelection,
              LEARNERNAME LearnerSelection >
   class FMDPLearner: public ILearningStrategy {
     /// Type of the learners attached to the variables (IMDDI or ITI flavour,
     /// as resolved by LearnerSelect).
     using VariableLearnerType =
        typename LearnerSelect< LearnerSelection,
                                IMDDI< VariableAttributeSelection, false >,
                                ITI< VariableAttributeSelection, false > >::type;

     /// Type of the learners attached to the reward (IMDDI or ITI flavour,
     /// as resolved by LearnerSelect).
     using RewardLearnerType =
        typename LearnerSelect< LearnerSelection,
                                IMDDI< RewardAttributeSelection, true >,
                                ITI< RewardAttributeSelection, true > >::type;

     /// Table mapping a variable to its learner.
     using VarLearnerTable
        = HashTable< const DiscreteVariable*, VariableLearnerType* >;

     public:
     // ==========================================================================
     /// @name Constructor & destructor.
     // ==========================================================================
     /// @{

     // ###################################################################
     /**
      * @brief Constructor.
      * @param learningThreshold threshold handed to every learner created by
      * the instantiate*__ helpers (through learningThreshold__).
      * @param actionReward presumably selects between one reward learner per
      * action and a single shared one -- TODO confirm in fmdpLearner_tpl.h.
      * @param similarityThreshold threshold handed to the IMDDI learners only
      * (through similarityThreshold__); defaults to 0.05.
      */
     // ###################################################################
     FMDPLearner(double learningThreshold,
                 bool   actionReward,
                 double similarityThreshold = 0.05);

     // ###################################################################
     /// Destructor (defined in fmdpLearner_tpl.h)
     // ###################################################################
     ~FMDPLearner();

     /// @}

     // ###################################################################
     /// @name Initialization
     // ###################################################################
     /// @{

     // ==========================================================================
     /// Initializes the learner
     /// @param fmdp the FMDP handed to the learner
     // ==========================================================================
     void initialize(FMDP< double >* fmdp);

     // NOTE(review): the instantiate*__ helpers below carry the "__" suffix
     // used for private members in this class but are declared public; they
     // are left public here so that the interface stays unchanged.

     // ==========================================================================
     /// Creates the function graph matching LearnerSelection (tag dispatch on
     /// Int2Type< LearnerSelection >).
     // ==========================================================================
     MultiDimFunctionGraph< double >* instantiateFunctionGraph__() {
       return instantiateFunctionGraph__(Int2Type< LearnerSelection >());
     }

     /// IMDDI variant: returns a reduced and ordered function graph instance.
     MultiDimFunctionGraph< double >*
        instantiateFunctionGraph__(Int2Type< IMDDILEARNER >) {
       return MultiDimFunctionGraph< double, ExactTerminalNodePolicy >::
          getReducedAndOrderedInstance();
     }

     /// ITI variant: returns a tree function graph instance.
     MultiDimFunctionGraph< double >*
        instantiateFunctionGraph__(Int2Type< ITILEARNER >) {
       return MultiDimFunctionGraph< double,
                                     ExactTerminalNodePolicy >::getTreeInstance();
     }


     // ==========================================================================
     /// Creates, with new, the learner of variable learnedVar (tag dispatch
     /// on Int2Type< LearnerSelection >).
     /// @param target the function graph handed to the learner
     /// @param mainVariables the set of variables handed to the learner
     /// @param learnedVar the variable handed to the learner as learned
     /// variable
     /// @return a raw pointer on the newly allocated learner
     // ==========================================================================
     VariableLearnerType*
        instantiateVarLearner__(MultiDimFunctionGraph< double >* target,
                                Set< const DiscreteVariable* >&  mainVariables,
                                const DiscreteVariable*          learnedVar) {
       return instantiateVarLearner__(target,
                                      mainVariables,
                                      learnedVar,
                                      Int2Type< LearnerSelection >());
     }

     /// IMDDI variant: the learner receives both the learning and the
     /// similarity thresholds.
     VariableLearnerType*
        instantiateVarLearner__(MultiDimFunctionGraph< double >* target,
                                Set< const DiscreteVariable* >&  mainVariables,
                                const DiscreteVariable*          learnedVar,
                                Int2Type< IMDDILEARNER >) {
       return new VariableLearnerType(target,
                                      learningThreshold__,
                                      similarityThreshold__,
                                      mainVariables,
                                      learnedVar);
     }

     /// ITI variant: the learner receives the learning threshold only.
     VariableLearnerType*
        instantiateVarLearner__(MultiDimFunctionGraph< double >* target,
                                Set< const DiscreteVariable* >&  mainVariables,
                                const DiscreteVariable*          learnedVar,
                                Int2Type< ITILEARNER >) {
       return new VariableLearnerType(target,
                                      learningThreshold__,
                                      mainVariables,
                                      learnedVar);
     }


     // ==========================================================================
     /// Creates, with new, a reward learner (tag dispatch on
     /// Int2Type< LearnerSelection >).
     /// @param target the function graph handed to the learner
     /// @param mainVariables the set of variables handed to the learner
     /// @return a raw pointer on the newly allocated learner
     // ==========================================================================
     RewardLearnerType*
        instantiateRewardLearner__(MultiDimFunctionGraph< double >* target,
                                   Set< const DiscreteVariable* >&  mainVariables) {
       return instantiateRewardLearner__(target,
                                         mainVariables,
                                         Int2Type< LearnerSelection >());
     }

     /// IMDDI variant: the learner receives both the learning and the
     /// similarity thresholds.
     RewardLearnerType*
        instantiateRewardLearner__(MultiDimFunctionGraph< double >* target,
                                   Set< const DiscreteVariable* >&  mainVariables,
                                   Int2Type< IMDDILEARNER >) {
       return new RewardLearnerType(target,
                                    learningThreshold__,
                                    similarityThreshold__,
                                    mainVariables);
     }

     /// ITI variant: the learner receives the learning threshold only.
     RewardLearnerType*
        instantiateRewardLearner__(MultiDimFunctionGraph< double >* target,
                                   Set< const DiscreteVariable* >&  mainVariables,
                                   Int2Type< ITILEARNER >) {
       return new RewardLearnerType(target, learningThreshold__, mainVariables);
     }

     /// @}


     // ###################################################################
     /// @name Incremental methods
     // ###################################################################
     /// @{

     // ==========================================================================
     /**
      * Gives to the learner a new transition
      * @param actionId : the action on which the transition was made
      * @param obs : the observed transition
      * @return true if learning this transition implies structural changes
      * (can trigger a new planning)
      */
     // ==========================================================================
     bool addObservation(Idx actionId, const Observation* obs);


     // ==========================================================================
     /**
      * Starts an update of datastructure in the associated FMDP
      */
     // ==========================================================================
     void updateFMDP();

     /// @}


     // ###################################################################
     /// @name Miscellaneous methods
     // ###################################################################
     /// @{

     // ==========================================================================
     /**
      * @brief Size of the learner (defined in fmdpLearner_tpl.h).
      * @return the size of the learner
      */
     // ==========================================================================
     Size size();

     // ==========================================================================
     /**
      * @brief Gives access to the learner of a variable for a given action.
      * @param actionId the action whose learner table is searched
      * @param var the variable whose learner is requested
      * @return the learner stored for var, or nullptr if the table of
      * actionId holds no entry for var
      */
     // ==========================================================================
     const IVisitableGraphLearner* varLearner(Idx                     actionId,
                                              const DiscreteVariable* var) const {
       const VarLearnerTable* learners = actionLearners__[actionId];
       // Plain lookup instead of getWithDefault(): per the aGrUM HashTable
       // documentation, getWithDefault() inserts the default value when the
       // key is missing, which would make this const accessor add nullptr
       // entries to the table.
       if (!learners->exists(var)) return nullptr;
       return (*learners)[var];
     }

     /// Returns rmax__
     virtual double rMax() const { return rmax__; }

     /// Returns modaMax__
     virtual double modaMax() const { return modaMax__; }

     /// @}


     private:
     // The data members are kept in their original declaration order, which
     // is also the order in which they are initialized.
     // NOTE(review): the class stores raw pointers and declares no copy
     // operations; check the destructor in fmdpLearner_tpl.h before copying
     // instances.

     /// Value returned by rMax()
     double rmax__;

     /// Value returned by modaMax()
     double modaMax__;

     /// The FMDP to store the learned model
     FMDP< double >* fmdp__;

     /// For each action id, the table of the learners of the variables
     HashTable< Idx, VarLearnerTable* > actionLearners__;

     /// Reward-related members; how actionReward__ arbitrates between the
     /// per-action table and the single learner is decided in
     /// fmdpLearner_tpl.h.
     bool                                 actionReward__;
     HashTable< Idx, RewardLearnerType* > actionRewardLearners__;
     RewardLearnerType*                   rewardLearner__;

     /// Threshold handed to every learner created by this class
     const double learningThreshold__;
     /// Threshold handed to the IMDDI learners only
     const double similarityThreshold__;
   };


 } /* namespace gum */

 #include <agrum/FMDP/learning/fmdpLearner_tpl.h>

 #endif   // GUM_FMDP_LEARNER_H
gum::FMDPLearner::rewardLearner__
RewardLearnerType * rewardLearner__
Definition: fmdpLearner.h:262

gum::FMDPLearner::actionReward__
bool actionReward__
Definition: fmdpLearner.h:260

gum::FMDPLearner::initialize
void initialize(FMDP< double > *fmdp)
Initializes the learner.
Definition: fmdpLearner_tpl.h:96

gum::Set::emplace
INLINE void emplace(Args &&... args)
Definition: set_tpl.h:669

gum::FMDPLearner::instantiateFunctionGraph__
MultiDimFunctionGraph< double > * instantiateFunctionGraph__(Int2Type< ITILEARNER >)
Returns a tree function graph instance (ITI learner overload).
Definition: fmdpLearner.h:118

gum::FMDPLearner::varLearner
const IVisitableGraphLearner * varLearner(Idx actionId, const DiscreteVariable *var) const
Gives access to the learner of a variable for a given action.
Definition: fmdpLearner.h:235

gum::FMDPLearner::instantiateVarLearner__
VariableLearnerType * instantiateVarLearner__(MultiDimFunctionGraph< double > *target, Set< const DiscreteVariable * > &mainVariables, const DiscreteVariable *learnedVar)
Creates the learner of a variable, dispatching on LearnerSelection.
Definition: fmdpLearner.h:128

gum::FMDPLearner::actionLearners__
HashTable< Idx, VarLearnerTable *> actionLearners__
Definition: fmdpLearner.h:258

gum::FMDPLearner::FMDPLearner
FMDPLearner(double learningThreshold, bool actionReward, double similarityThreshold=0.05)
Default constructor.
Definition: fmdpLearner_tpl.h:47

gum::FMDPLearner::modaMax__
double modaMax__
Value returned by modaMax().
Definition: fmdpLearner.h:249

gum::FMDPLearner::~FMDPLearner
~FMDPLearner()
Default destructor.
Definition: fmdpLearner_tpl.h:65

gum::FMDPLearner::instantiateVarLearner__
VariableLearnerType * instantiateVarLearner__(MultiDimFunctionGraph< double > *target, Set< const DiscreteVariable * > &mainVariables, const DiscreteVariable *learnedVar, Int2Type< ITILEARNER >)
Creates the learner of a variable (ITI learner overload).
Definition: fmdpLearner.h:150

gum::FMDPLearner::addObservation
bool addObservation(Idx actionId, const Observation *obs)
Gives to the learner a new transition.
Definition: fmdpLearner_tpl.h:159

gum::FMDPLearner::modaMax
virtual double modaMax() const
Returns modaMax__.
Definition: fmdpLearner.h:246

gum::FMDPLearner::instantiateRewardLearner__
RewardLearnerType * instantiateRewardLearner__(MultiDimFunctionGraph< double > *target, Set< const DiscreteVariable * > &mainVariables, Int2Type< ITILEARNER >)
Creates a reward learner (ITI learner overload).
Definition: fmdpLearner.h:183

gum::FMDPLearner::size
Size size()
learnerSize
Definition: fmdpLearner_tpl.h:193

gum::FMDPLearner::VarLearnerTable
HashTable< const DiscreteVariable *, VariableLearnerType *> VarLearnerTable
Definition: fmdpLearner.h:72

gum::FMDPLearner::instantiateFunctionGraph__
MultiDimFunctionGraph< double > * instantiateFunctionGraph__()
Creates the function graph, dispatching on LearnerSelection.
Definition: fmdpLearner.h:107

gum::FMDPLearner::instantiateRewardLearner__
RewardLearnerType * instantiateRewardLearner__(MultiDimFunctionGraph< double > *target, Set< const DiscreteVariable * > &mainVariables)
Creates a reward learner, dispatching on LearnerSelection.
Definition: fmdpLearner.h:165

gum::FMDPLearner::RewardLearnerType
LearnerSelect< LearnerSelection, IMDDI< RewardAttributeSelection, true >, ITI< RewardAttributeSelection, true > >::type RewardLearnerType
Definition: fmdpLearner.h:69

gum::FMDPLearner::rmax__
double rmax__
Value returned by rMax().
Definition: fmdpLearner.h:243

gum::FMDPLearner::updateFMDP
void updateFMDP()
Starts an update of datastructure in the associated FMDP.
Definition: fmdpLearner_tpl.h:222

gum::FMDPLearner::similarityThreshold__
const double similarityThreshold__
Definition: fmdpLearner.h:265

gum::FMDPLearner::rMax
virtual double rMax() const
Returns rmax__.
Definition: fmdpLearner.h:240

gum::FMDPLearner::fmdp__
FMDP< double > * fmdp__
The FMDP to store the learned model.
Definition: fmdpLearner.h:256

gum::FMDPLearner::learningThreshold__
const double learningThreshold__
Definition: fmdpLearner.h:264

gum::FMDPLearner::actionRewardLearners__
HashTable< Idx, RewardLearnerType *> actionRewardLearners__
Definition: fmdpLearner.h:261