aGrUM  0.14.2
DAG2BNLearner_tpl.h
Go to the documentation of this file.
1 /***************************************************************************
2  * Copyright (C) 2005 by Christophe GONZALES and Pierre-Henri WUILLEMIN *
3  * {prenom.nom}@lip6.fr *
4  * *
5  * This program is free software; you can redistribute it and/or modify *
6  * it under the terms of the GNU General Public License as published by *
7  * the Free Software Foundation; either version 2 of the License, or *
8  * (at your option) any later version. *
9  * *
10  * This program is distributed in the hope that it will be useful, *
11  * but WITHOUT ANY WARRANTY; without even the implied warranty of *
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
13  * GNU General Public License for more details. *
14  * *
15  * You should have received a copy of the GNU General Public License *
16  * along with this program; if not, write to the *
17  * Free Software Foundation, Inc., *
18  * 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. *
19  ***************************************************************************/
28 #include <algorithm>
29 #include <string>
30 #include <vector>
31 
32 namespace gum {
33 
34  namespace learning {
35 
37  template < template < typename > class ALLOC >
40  return *this;
41  }
42 
43 
45  template < template < typename > class ALLOC >
47  const typename DAG2BNLearner< ALLOC >::allocator_type& alloc) :
48  ALLOC< NodeId >(alloc) {
49  GUM_CONSTRUCTOR(DAG2BNLearner);
50  }
51 
52 
54  template < template < typename > class ALLOC >
56  const DAG2BNLearner< ALLOC >& from,
57  const typename DAG2BNLearner< ALLOC >::allocator_type& alloc) :
58  ApproximationScheme(from),
59  ALLOC< NodeId >(alloc) {
60  GUM_CONS_CPY(DAG2BNLearner);
61  }
62 
63 
65  template < template < typename > class ALLOC >
67  DAG2BNLearner(from, from.getAllocator()) {}
68 
69 
71  template < template < typename > class ALLOC >
74  const typename DAG2BNLearner< ALLOC >::allocator_type& alloc) :
75  ApproximationScheme(std::move(from)),
76  ALLOC< NodeId >(alloc) {
77  GUM_CONS_MOV(DAG2BNLearner);
78  }
79 
80 
82  template < template < typename > class ALLOC >
84  DAG2BNLearner(std::move(from), from.getAllocator()) {}
85 
86 
88  template < template < typename > class ALLOC >
90  const typename DAG2BNLearner< ALLOC >::allocator_type& alloc) const {
91  ALLOC< DAG2BNLearner< ALLOC > > allocator(alloc);
92  DAG2BNLearner< ALLOC >* new_learner = allocator.allocate(1);
93  try {
94  allocator.construct(new_learner, *this, alloc);
95  } catch (...) {
96  allocator.deallocate(new_learner, 1);
97  throw;
98  }
99 
100  return new_learner;
101  }
102 
103 
105  template < template < typename > class ALLOC >
107  return clone(this->getAllocator());
108  }
109 
110 
112  template < template < typename > class ALLOC >
114  GUM_DESTRUCTOR(DAG2BNLearner);
115  }
116 
117 
119  template < template < typename > class ALLOC >
122  ApproximationScheme::operator=(from);
123  return *this;
124  }
125 
126 
128  template < template < typename > class ALLOC >
131  ApproximationScheme::operator=(std::move(from));
132  return *this;
133  }
134 
135 
137  template < template < typename > class ALLOC >
138  template < typename GUM_SCALAR >
141  const gum::Potential< GUM_SCALAR >& other_pot) {
142  // check that the variables are identical
143  if (!pot.variablesSequence()
144  .diffSet(other_pot.variablesSequence())
145  .empty()) {
146  GUM_ERROR(gum::CPTError, "the potentials do not have the same variables");
147  }
148 
149  // perform the copy
150  Instantiation i(other_pot);
151  Instantiation j(pot);
152  for (i.setFirst(); !i.end(); ++i) {
153  j.setVals(i);
154  pot.set(j, other_pot[i]);
155  }
156  }
157 
159  template < template < typename > class ALLOC >
160  template < typename GUM_SCALAR >
163  const DAG& dag) {
165 
166  // create a bn with dummy parameters corresponding to the dag
167  const auto& node2cols = estimator.nodeId2Columns();
168  const auto& database = estimator.database();
169  if (node2cols.empty()) {
170  for (const auto id : dag) {
171  bn.add(dynamic_cast< const DiscreteVariable& >(database.variable(id)),
172  id);
173  }
174  } else {
175  for (const auto id : dag) {
176  const std::size_t col = node2cols.second(id);
177  bn.add(dynamic_cast< const DiscreteVariable& >(database.variable(col)),
178  id);
179  }
180  }
181 
182  // add the arcs
184  for (const auto& arc : dag.arcs()) {
185  bn.addArc(arc.tail(), arc.head());
186  }
188 
189  // estimate the parameters
190  const VariableNodeMap& varmap = bn.variableNodeMap();
191  for (const auto id : dag) {
192  try {
193  // get the sequence of variables and make the targets be the last
195  const_cast< Potential< GUM_SCALAR >& >(bn.cpt(id));
196 
197  // get the variables of the CPT of id in the correct order
199  pot.variablesSequence();
200 
201  // setup the estimation
202  std::vector< NodeId > conditioning_ids(vars.size() - 1);
203  for (std::size_t i = std::size_t(1); i < vars.size(); ++i) {
204  conditioning_ids[i - 1] = varmap.get(*(vars[i]));
205  }
206  estimator.setParameters(id, conditioning_ids, pot);
207  } catch (DatabaseError&) { bn.generateCPT(id); }
208  }
209 
210  return bn;
211  }
212 
214  template < template < typename > class ALLOC >
215  template < typename GUM_SCALAR >
217  ParamEstimator< ALLOC >& bootstrap_estimator,
218  ParamEstimator< ALLOC >& general_estimator,
219  const DAG& dag) {
220  // bootstrap EM by learning an initial model
221  BayesNet< GUM_SCALAR > bn = createBN< GUM_SCALAR >(bootstrap_estimator, dag);
222  general_estimator.setBayesNet(bn);
223 
224  // perform EM
226 
227  GUM_SCALAR delta;
228  do {
229  // bugfix for parallel execution of VariableElimination
230  const auto& xdag = bn.dag();
231  for (const auto node : xdag) {
232  xdag.parents(node);
233  xdag.children(node);
234  }
235 
236  BayesNet< GUM_SCALAR > new_bn =
237  createBN< GUM_SCALAR >(general_estimator, dag);
239 
240  delta = GUM_SCALAR(0.0);
241  for (const auto node : dag) {
242  const auto& old_cpt = bn.cpt(node);
243  const auto& new_cpt = new_bn.cpt(node);
244 
245  Instantiation old_inst(old_cpt);
246  Instantiation new_inst(new_cpt);
247 
248  for (; !old_inst.end(); ++old_inst, ++new_inst) {
249  const GUM_SCALAR old_val = old_cpt.get(old_inst);
250  if (old_val > 0.0) {
251  const GUM_SCALAR new_val = new_cpt.get(new_inst);
252  const GUM_SCALAR diff = new_val - old_val;
253  const auto diffrel =
254  (diff < 0.0) ? (-diff / old_val) : (diff / old_val);
255  if (delta < diffrel) delta = diffrel;
256  }
257  }
258  }
259 
260  bn = std::move(new_bn);
261  } while (continueApproximationScheme(double(delta)));
262 
263  stopApproximationScheme(); // just to be sure of the approximationScheme
264  // has been notified of the end of loop
265 
266  return bn;
267  } // namespace learning
268 
269 
271  template < template < typename > class ALLOC >
273  return *this;
274  }
275 
276 
277  } // namespace learning
278 
279 } /* namespace gum */
void addArc(NodeId tail, NodeId head)
Add an arc in the BN, and update arc.head's CPT.
Definition: BayesNet_tpl.h:345
aGrUM's Potential is a multi-dimensional array with tensor operators.
Definition: potential.h:57
Class representing a Bayesian Network.
Definition: BayesNet.h:76
static BayesNet< GUM_SCALAR > createBN(ParamEstimator< ALLOC > &estimator, const DAG &dag)
create a BN from a DAG using a one pass generator (typically ML)
const Bijection< NodeId, std::size_t, ALLOC< std::size_t > > & nodeId2Columns() const
returns the mapping from ids to column positions in the database
void setParameters(const NodeId target_node, const std::vector< NodeId, ALLOC< NodeId > > &conditioning_nodes, Potential< GUM_SCALAR > &pot)
sets the CPT's parameters corresponding to a given Potential
Approximation Scheme.
NodeId add(const DiscreteVariable &var)
Add a variable to the gum::BayesNet.
Definition: BayesNet_tpl.h:229
The generic class for storing (ordered) sequences of objects.
Definition: sequence.h:1019
Container used to map discrete variables with nodes.
STL namespace.
virtual ~DAG2BNLearner()
destructor
void generateCPT(NodeId node) const
randomly generate CPT for a given node in a given structure
Definition: BayesNet_tpl.h:641
void initApproximationScheme()
Initialise the scheme.
gum is the global namespace for all aGrUM entities
Definition: agrum.h:25
Instantiation & setVals(const Instantiation &i)
Assign the values from i in the Instantiation.
void setBayesNet(const BayesNet< GUM_SCALAR > &new_bn)
assign a new Bayes net to all the counter's generators depending on a BN
void beginTopologyTransformation()
When inserting/removing arcs, node CPTs change their dimension with a cost in time.
Definition: BayesNet_tpl.h:591
allocator_type getAllocator() const
returns the allocator used by the score
ALLOC< NodeId > allocator_type
type for the allocators passed in arguments of methods
Definition: DAG2BNLearner.h:54
bool continueApproximationScheme(double error)
Update the scheme w.r.t the new error.
const VariableNodeMap & variableNodeMap() const final
Returns a map between variables and nodes of this gum::BayesNet.
Definition: BayesNet_tpl.h:317
DAG2BNLearner< ALLOC > & operator=(const DAG2BNLearner< ALLOC > &from)
copy operator
void stopApproximationScheme()
Stop the approximation scheme.
ApproximationScheme & approximationScheme()
returns the approximation policy of the learning algorithm
const Potential< GUM_SCALAR > & cpt(NodeId varId) const final
Returns the CPT of a variable.
Definition: BayesNet_tpl.h:312
const DatabaseTable< ALLOC > & database() const
returns the database on which we perform the counts
Class for assigning/browsing values to tuples of discrete variables.
Definition: instantiation.h:80
const ArcSet & arcs() const
returns the set of arcs stored within the ArcGraphPart
virtual DAG2BNLearner< ALLOC > * clone() const
virtual copy constructor
virtual void set(const Instantiation &i, const GUM_SCALAR &value) const final
Default implementation of MultiDimContainer::set().
void setFirst()
Assign the first values to the tuple of the Instantiation.
void endTopologyTransformation()
terminates a sequence of insertions/deletions of arcs by adjusting all CPTs dimensions.
Definition: BayesNet_tpl.h:598
A class that, given a structure and a parameter estimator returns a full Bayes net.
Definition: DAG2BNLearner.h:49
virtual const Sequence< const DiscreteVariable *> & variablesSequence() const final
Returns a const ref to the sequence of DiscreteVariable*.
The base class for estimating parameters of CPTs.
Base class for dag.
Definition: DAG.h:99
const DAG & dag() const
Returns a constant reference to the dag of this Bayes Net.
Definition: DAGmodel_inl.h:60
#define GUM_ERROR(type, msg)
Definition: exceptions.h:52
const DiscreteVariable & get(NodeId id) const
Returns a discrete variable given its node id.
bool end() const
Returns true if the Instantiation reached the end.
void updateApproximationScheme(unsigned int incr=1)
Update the scheme w.r.t the new error and increment steps.
DAG2BNLearner(const allocator_type &alloc=allocator_type())
default constructor