aGrUM 2.3.2
a C++ library for (probabilistic) graphical models
DAG2BNLearner_tpl.h
Go to the documentation of this file.
1/****************************************************************************
2 * This file is part of the aGrUM/pyAgrum library. *
3 * *
4 * Copyright (c) 2005-2025 by *
5 * - Pierre-Henri WUILLEMIN(_at_LIP6) *
6 * - Christophe GONZALES(_at_AMU) *
7 * *
8 * The aGrUM/pyAgrum library is free software; you can redistribute it *
9 * and/or modify it under the terms of either : *
10 * *
11 * - the GNU Lesser General Public License as published by *
12 * the Free Software Foundation, either version 3 of the License, *
13 * or (at your option) any later version, *
14 * - the MIT license (MIT), *
15 * - or both in dual license, as here. *
16 * *
17 * (see https://agrum.gitlab.io/articles/dual-licenses-lgplv3mit.html) *
18 * *
19 * This aGrUM/pyAgrum library is distributed in the hope that it will be *
20 * useful, but WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, *
21 * INCLUDING BUT NOT LIMITED TO THE WARRANTIES MERCHANTABILITY or FITNESS *
22 * FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE *
23 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER *
24 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, *
25 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR *
26 * OTHER DEALINGS IN THE SOFTWARE. *
27 * *
28 * See LICENCES for more details. *
29 * *
30 * SPDX-FileCopyrightText: Copyright 2005-2025 *
31 * - Pierre-Henri WUILLEMIN(_at_LIP6) *
32 * - Christophe GONZALES(_at_AMU) *
33 * SPDX-License-Identifier: LGPL-3.0-or-later OR MIT *
34 * *
35 * Contact : info_at_agrum_dot_org *
36 * homepage : http://agrum.gitlab.io *
37 * gitlab : https://gitlab.com/agrumery/agrum *
38 * *
39 ****************************************************************************/
40#pragma once
41
48
49namespace gum {
50
51 namespace learning {
52
54 template < typename GUM_SCALAR >
55 void DAG2BNLearner::_probaVarReordering_(gum::Tensor< GUM_SCALAR >& pot,
56 const gum::Tensor< GUM_SCALAR >& other_pot) {
57 // check that the variables are identical
58 if (!pot.variablesSequence().diffSet(other_pot.variablesSequence()).empty()) {
59 GUM_ERROR(gum::CPTError, "the tensors do not have the same variables")
60 }
61
62 // perform the copy
63 Instantiation i(other_pot);
64 Instantiation j(pot);
65 for (i.setFirst(); !i.end(); ++i) {
66 j.setVals(i);
67 pot.set(j, other_pot[i]);
68 }
69 }
70
72 template < typename GUM_SCALAR >
73 INLINE BayesNet< GUM_SCALAR > DAG2BNLearner::createBN(ParamEstimator& estimator,
74 const DAG& dag) {
75 return DAG2BNLearner()._createBN_(estimator, dag, false);
76 }
77
79 template < typename GUM_SCALAR >
80 BayesNet< GUM_SCALAR > DAG2BNLearner::_createBN_(ParamEstimator& estimator,
81 const DAG& dag,
82 const bool compute_log_likelihood) {
83 BayesNet< GUM_SCALAR > bn;
84 log_likelihood_EM_ = 0.0;
85
86 // create a bn with dummy parameters corresponding to the dag
87 const auto& node2cols = estimator.nodeId2Columns();
88 const auto& database = estimator.database();
89 if (node2cols.empty()) {
90 for (const auto id: dag) {
91 bn.add(dynamic_cast< const DiscreteVariable& >(database.variable(id)), id);
92 }
93 } else {
94 for (const auto id: dag) {
95 const std::size_t col = node2cols.second(id);
96 bn.add(dynamic_cast< const DiscreteVariable& >(database.variable(col)), id);
97 }
98 }
99
100 // add the arcs
101 bn.beginTopologyTransformation();
102 for (const auto& arc: dag.arcs()) {
103 bn.addArc(arc.tail(), arc.head());
104 }
105 bn.endTopologyTransformation();
106
107 // estimate the parameters
108 const VariableNodeMap& varmap = bn.variableNodeMap();
109 for (const auto id: dag) {
110 // get the CPT of node id and its variables in the correct order
111 auto& pot = const_cast< Tensor< GUM_SCALAR >& >(bn.cpt(id));
112 const auto& vars = pot.variablesSequence();
113
114 // get the conditioning variables: they are all the variables except
115 // the last one in pot
116 std::vector< NodeId > conditioning_ids(vars.size() - 1);
117 for (auto i = std::size_t(1); i < vars.size(); ++i) {
118 conditioning_ids[i - 1] = varmap.get(*(vars[i]));
119 }
120
121 log_likelihood_EM_
122 += estimator.setParameters(id, conditioning_ids, pot, compute_log_likelihood);
123 }
124
125 return bn;
126 }
127
129 template < typename GUM_SCALAR >
130 INLINE BayesNet< GUM_SCALAR > DAG2BNLearner::createBNwithEM(ParamEstimator& bootstrap_estimator,
131 ParamEstimator& EM_estimator,
132 const DAG& dag) {
133 // for EM estimations, we need to disable caches
134 bootstrap_estimator.clear();
135 EM_estimator.clear();
136
137 // bootstrap EM by learning an initial model
138 BayesNet< GUM_SCALAR > bn = createBN< GUM_SCALAR >(bootstrap_estimator, dag);
139
140 return _performEM_(bootstrap_estimator, EM_estimator, std::move(bn));
141 }
142
144 template < typename GUM_SCALAR >
145 INLINE BayesNet< GUM_SCALAR > DAG2BNLearner::createBNwithEM(ParamEstimator& bootstrap_estimator,
146 ParamEstimator& EM_estimator,
147 const BayesNet< GUM_SCALAR >& bn) {
148 // for EM estimations, we need to disable caches
149 bootstrap_estimator.clear();
150 EM_estimator.clear();
151
152 auto bn_copy(bn);
153 return createBNwithEM(bootstrap_estimator, EM_estimator, std::move(bn_copy));
154 }
155
157 template < typename GUM_SCALAR >
158 BayesNet< GUM_SCALAR > DAG2BNLearner::createBNwithEM(ParamEstimator& bootstrap_estimator,
159 ParamEstimator& EM_estimator,
160 BayesNet< GUM_SCALAR >&& bn) {
161 // estimate the parameters of the fully zeroed CPTs using the bootstrap estimator
162 const VariableNodeMap& varmap = bn.variableNodeMap();
163 for (const auto id: bn.dag()) {
164 // get the CPT of node id and its variables in the correct order
165 auto& pot = const_cast< Tensor< GUM_SCALAR >& >(bn.cpt(id));
166
167 // check if the CPT contains only zeroes
168 bool all_zeroed = true;
169 for (gum::Instantiation inst(pot); !inst.end(); inst.inc()) {
170 if (pot[inst] != 0.0) {
171 all_zeroed = false;
172 break;
173 }
174 }
175
176 // estimate the initial parameters of pot if all_zeroed
177 if (all_zeroed) {
178 // get the conditioning variables: they are all the variables except
179 // the first one in pot
180 const auto& vars = pot.variablesSequence();
181 std::vector< NodeId > conditioning_ids(vars.size() - 1);
182 for (auto i = std::size_t(1); i < vars.size(); ++i) {
183 conditioning_ids[i - 1] = varmap.get(*(vars[i]));
184 }
185
186 // estimate the initial parameters of pot
187 bootstrap_estimator.setParameters(id, conditioning_ids, pot, false);
188 }
189 }
190
191 return _performEM_(bootstrap_estimator, EM_estimator, std::move(bn));
192 }
193
195 template < typename GUM_SCALAR >
196 BayesNet< GUM_SCALAR > DAG2BNLearner::_performEM_(ParamEstimator& bootstrap_estimator,
197 ParamEstimator& EM_estimator,
198 BayesNet< GUM_SCALAR >&& bn) {
199 // if there exist no missing value, there is no need to apply EM
200 if (!EM_estimator.database().hasMissingValues()) {
201 // here we start/stop the approx scheme to be able to display the number
202 // of EM iterations
205
206 auto bn_copy(bn);
207 return bn_copy;
208 }
209
210 if (!this->isEnabledMinEpsilonRate() && !this->isEnabledEpsilon() && !this->isEnabledMaxIter()
211 && !this->isEnabledMaxTime()) {
213 "EM cannot be executed because no stopping criterion among "
214 << "{min rate, min diff, max iter, max time} has been selected")
215 }
216
217 // as bn will be modified, be sure that the DAG is kept unchanged
218 const DAG dag = bn.dag();
219
220 // perturb the CPTs to initialize EM
221 if (noiseEM_ != 0.0) {
222 for (const auto& node: bn.nodes()) {
223 bn.cpt(node).noising(noiseEM_).normalizeAsCPT();
224 }
225 }
226
227 // perform EM
228 EM_estimator.setBayesNet(bn);
230
231 // compute the initial value of the log-likelihood
232 log_likelihood_EM_ = 0.0;
233 const VariableNodeMap& varmap = bn.variableNodeMap();
234 EM_estimator.counter_.clear(); // for EM estimations, we need to disable caches
235 for (const auto& node: bn.nodes()) {
236 // get node's CPT and its conditioning variables: they are all the
237 // variables except the first one in pot
238 const auto& pot = const_cast< Tensor< GUM_SCALAR >& >(bn.cpt(node));
239 const auto& vars = pot.variablesSequence();
240 std::vector< NodeId > conditioning_ids(vars.size() - 1);
241 for (auto i = std::size_t(1); i < vars.size(); ++i) {
242 conditioning_ids[i - 1] = varmap.get(*(vars[i]));
243 }
244
245 // compute the log-likelihood
246 IdCondSet idset(node, conditioning_ids, true);
247 const auto& N_ijk = EM_estimator.counter_.counts(idset, true);
248 Instantiation inst(pot);
249 for (std::size_t k = 0, end = pot.domainSize(); k < end; ++k, inst.inc()) {
250 if (N_ijk[k]) { log_likelihood_EM_ += N_ijk[k] * std::log(pot[inst]); }
251 }
252 }
253 double current_log_likelihood = log_likelihood_EM_;
254
255 // it may happen (luckily very seldom) that EM will decrease the
256 // log-likelihood instead of increasing it (see Table 5 on p28 of
257 // https://faculty.washington.edu/fxia/courses/LING572/EM_collins97.pdf
258 // for an example of such a behavior). In this case, instead of iterating
259 // EM and producing worst and worst Bayes nets, we stop the iterations
260 // early and we return the best Bayes net found so far.
261 BayesNet< GUM_SCALAR > best_bn;
262 bool must_return_best_bn = false;
263 unsigned int nb_dec_likelihood_iter = 0;
264 double delta = 0;
265
266 do {
267 // bugfix for parallel execution of VariableElimination
268 const auto& xdag = bn.dag();
269 for (const auto node: xdag) {
270 xdag.parents(node);
271 xdag.children(node);
272 }
273
274 EM_estimator.counter_.clear(); // for EM estimations, we need to disable caches
275 BayesNet< GUM_SCALAR > new_bn = _createBN_< GUM_SCALAR >(EM_estimator, dag, true);
277
278 if (log_likelihood_EM_ >= current_log_likelihood) {
279 // here, we increased the log-likelihood, it is fine
280 nb_dec_likelihood_iter = 0;
281 must_return_best_bn = false;
282 } else {
283 // here, we decreased the log-likelihood, so we should keep track of the
284 // best Bayes net found so far. If we decreased too many times the
285 // log-likelihood, we should even stop EM
286 ++nb_dec_likelihood_iter;
287 if (nb_dec_likelihood_iter == 1) {
288 best_bn = bn; // bn is the Bayes net computed at the previous step
289 must_return_best_bn = true;
290 }
291 if (nb_dec_likelihood_iter > max_nb_dec_likelihood_iter_) {
293 return best_bn;
294 }
295 }
296
297 // compute the difference in log-likelihood
298 delta = log_likelihood_EM_ - current_log_likelihood;
299 current_log_likelihood = log_likelihood_EM_;
300
301 bn = std::move(new_bn);
302 } while (continueApproximationScheme(this->isEnabledMinEpsilonRate() ? -log_likelihood_EM_
303 : delta));
304
305 stopApproximationScheme(); // just to be sure of the approximationScheme
306 // has been notified of the end of loop
307
308 return must_return_best_bn ? best_bn : bn;
309 }
310
311 } // namespace learning
312
313} /* namespace gum */
void updateApproximationScheme(unsigned int incr=1)
Update the scheme w.r.t the new error and increment steps.
bool isEnabledEpsilon() const override
Returns true if stopping criterion on epsilon is enabled, false otherwise.
bool isEnabledMaxTime() const override
Returns true if stopping criterion on timeout is enabled, false otherwise.
bool isEnabledMinEpsilonRate() const override
Returns true if stopping criterion on epsilon rate is enabled, false otherwise.
void initApproximationScheme()
Initialise the scheme.
void stopApproximationScheme()
Stop the approximation scheme.
bool isEnabledMaxIter() const override
Returns true if stopping criterion on max iterations is enabled, false otherwise.
bool continueApproximationScheme(double error)
Update the scheme w.r.t the new error.
Base class for dag.
Definition DAG.h:121
Base class for discrete random variable.
Class for assigning/browsing values to tuples of discrete variables.
bool end() const
Returns true if the Instantiation reached the end.
virtual const Sequence< const DiscreteVariable * > & variablesSequence() const final
Returns a const ref to the sequence of DiscreteVariable*.
virtual Size domainSize() const final
Returns the product of the variables domain size.
virtual void set(const Instantiation &i, const GUM_SCALAR &value) const final
Default implementation of MultiDimContainer::set().
Exception : operation not allowed.
Container used to map discrete variables with nodes.
const DiscreteVariable & get(NodeId id) const
Returns a discrete variable given it's node id.
DAG2BNLearner()
default constructor
static BayesNet< GUM_SCALAR > createBN(ParamEstimator &estimator, const DAG &dag)
create a BN from a DAG using a one pass generator (typically ML)
BayesNet< GUM_SCALAR > createBNwithEM(ParamEstimator &bootstrap_estimator, ParamEstimator &EM_estimator, const DAG &dag)
creates a BN with a given structure (dag) using the EM algorithm
bool hasMissingValues() const
indicates whether the database contains some missing values
The base class for estimating parameters of CPTs.
RecordCounter counter_
the record counter used to parse the database
const Bijection< NodeId, std::size_t > & nodeId2Columns() const
returns the mapping from ids to column positions in the database
double setParameters(const NodeId target_node, const std::vector< NodeId > &conditioning_nodes, Tensor< GUM_SCALAR > &pot, const bool compute_log_likelihood=false)
sets a CPT's parameters and, possibly, returns its log-likelihood
virtual void clear()
clears all the data structures from memory
void setBayesNet(const BayesNet< GUM_SCALAR > &new_bn)
assign a new Bayes net to all the counter's generators depending on a BN
const DatabaseTable & database() const
returns the database on which we perform the counts
void clear()
clears all the last database-parsed counting from memory
const std::vector< double > & counts(const IdCondSet &ids, const bool check_discrete_vars=false)
returns the counts over all the variables in an IdCondSet
#define GUM_ERROR(type, msg)
Definition exceptions.h:72
include the inlined functions if necessary
Definition CSVParser.h:54
gum is the global namespace for all aGrUM entities
Definition agrum.h:46