53#ifndef DOXYGEN_SHOULD_SKIP_THIS
62 template <
typename GUM_SCALAR >
64 const std::vector< std::string >& missingSymbols,
65 const bool induceTypes) :
66 IBNLearner(filename, missingSymbols, induceTypes) {
67 GUM_CONSTRUCTOR(BNLearner);
70 template <
typename GUM_SCALAR >
71 BNLearner< GUM_SCALAR >::BNLearner(
const DatabaseTable& db) : IBNLearner(db) {
72 GUM_CONSTRUCTOR(BNLearner);
75 template <
typename GUM_SCALAR >
76 BNLearner< GUM_SCALAR >::BNLearner(
const std::string& filename,
78 const std::vector< std::string >& missing_symbols) :
79 IBNLearner(filename, bn, missing_symbols) {
80 GUM_CONSTRUCTOR(BNLearner);
84 template <
typename GUM_SCALAR >
85 BNLearner< GUM_SCALAR >::BNLearner(
const BNLearner< GUM_SCALAR >& src) : IBNLearner(src) {
86 GUM_CONSTRUCTOR(BNLearner);
90 template <
typename GUM_SCALAR >
91 BNLearner< GUM_SCALAR >::BNLearner(BNLearner< GUM_SCALAR >&& src) : IBNLearner(src) {
92 GUM_CONSTRUCTOR(BNLearner);
96 template <
typename GUM_SCALAR >
97 BNLearner< GUM_SCALAR >::~BNLearner() {
98 GUM_DESTRUCTOR(BNLearner);
109 template <
typename GUM_SCALAR >
110 BNLearner< GUM_SCALAR >&
111 BNLearner< GUM_SCALAR >::operator=(
const BNLearner< GUM_SCALAR >& src) {
112 IBNLearner::operator=(src);
117 template <
typename GUM_SCALAR >
118 BNLearner< GUM_SCALAR >&
119 BNLearner< GUM_SCALAR >::operator=(BNLearner< GUM_SCALAR >&& src)
noexcept {
120 IBNLearner::operator=(std::move(src));
125 template <
typename GUM_SCALAR >
126 BayesNet< GUM_SCALAR > BNLearner< GUM_SCALAR >::learnBN() {
128 auto notification = checkScorePriorCompatibility();
129 if (notification !=
"") { std::cout <<
"[aGrUM notification] " << notification << std::endl; }
133 std::unique_ptr< ParamEstimator > param_estimator(
134 createParamEstimator_(scoreDatabase_.parser(),
true));
136 return dag2BN_.createBN< GUM_SCALAR >(*(param_estimator.get()), learnDag_());
// Checks that every node id of the dag corresponds to a column of the
// score database; builds an explanatory error message otherwise.
// NOTE(review): this block is damaged by extraction — the leading integers
// fused into the lines are the original file's line numbers, and several
// statements (the ids.push_back in the first loop, the GUM_ERROR raise,
// `deja` handling, closing braces) are missing from this view. Do not
// assume the visible text is the complete function.
140 template <
typename GUM_SCALAR >
141 void BNLearner< GUM_SCALAR >::_checkDAGCompatibility_(
const DAG& dag) {
// an empty dag is trivially compatible
143 if (dag.size() == 0)
return;
// collect and sort the dag's node ids to find the largest one
146 std::vector< NodeId > ids;
147 ids.reserve(dag.sizeNodes());
148 for (
const auto node: dag)
150 std::sort(ids.begin(), ids.end());
// if some id exceeds the number of database columns, report all bad ids
152 if (ids.back() >= scoreDatabase_.names().size()) {
153 std::stringstream str;
154 str <<
"Learning parameters corresponding to the dag is impossible "
155 <<
"because the database does not contain the following nodeID";
156 std::vector< NodeId > bad_ids;
157 for (
const auto node: ids) {
158 if (node >= scoreDatabase_.names().size()) bad_ids.push_back(node);
// pluralize the message when several ids are out of range
160 if (bad_ids.size() > 1) str <<
's';
163 for (
const auto node: bad_ids) {
// `deja` presumably tracks whether a separator is needed — TODO confirm,
// its declaration is not visible in this view
164 if (deja) str <<
", ";
// Learns the parameters of a BN whose structure is given by `dag`, without
// EM: refuses databases containing missing values.
// NOTE(review): extraction damage — the opening of the GUM_ERROR(...) call
// (its macro name and exception type, around original line 190) and
// closing braces are missing from this view.
173 template <
typename GUM_SCALAR >
174 BayesNet< GUM_SCALAR > BNLearner< GUM_SCALAR >::_learnParameters_(
const DAG& dag,
175 bool takeIntoAccountScore) {
// an empty dag yields an empty BN
177 if (dag.size() == 0)
return BayesNet< GUM_SCALAR >();
// make sure the dag's node ids all exist in the database
180 _checkDAGCompatibility_(dag);
// missing values (in the score database or a Dirichlet prior database)
// cannot be handled here: the user must enable EM instead
186 if (scoreDatabase_.databaseTable().hasMissingValues()
187 || ((priorDatabase_ !=
nullptr)
188 && (priorType_ == BNLearnerPriorType::DIRICHLET_FROM_DATABASE)
189 && priorDatabase_->databaseTable().hasMissingValues())) {
191 "In general, the BNLearner is unable to cope with "
192 <<
"missing values in databases. To learn parameters in "
193 <<
"such situations, you should first use method " <<
"useEM()");
// parse the database without any row generator and estimate parameters
197 DBRowGeneratorParser parser(scoreDatabase_.databaseTable().handler(), DBRowGeneratorSet());
198 std::unique_ptr< ParamEstimator > param_estimator(
199 createParamEstimator_(parser, takeIntoAccountScore));
201 return dag2BN_.createBN< GUM_SCALAR >(*(param_estimator.get()), dag);
// Builds the two parameter estimators needed by EM: a "bootstrap"
// estimator working only on complete rows, and an "EM" estimator whose
// row generator fills missing values from a BN.
// NOTE(review): extraction damage — the initializer of `col_types`
// (original lines 223-226) and several closing braces are missing from
// this view.
205 template <
typename GUM_SCALAR >
206 std::pair< std::shared_ptr< ParamEstimator >, std::shared_ptr< ParamEstimator > >
207 BNLearner< GUM_SCALAR >::_initializeEMParameterLearning_(
const DAG& dag,
208 bool takeIntoAccountScore) {
// make sure the dag's node ids all exist in the database
210 _checkDAGCompatibility_(dag);
220 const auto& database = scoreDatabase_.databaseTable();
221 const std::size_t nb_vars = database.nbVariables();
// column types of the database (initializer lost in extraction)
222 const std::vector< gum::learning::DBTranslatedValueType > col_types(
// bootstrap estimator: only the complete rows of the database are used
227 DBRowGenerator4CompleteRows generator_bootstrap(col_types);
228 DBRowGeneratorSet genset_bootstrap;
229 genset_bootstrap.insertGenerator(generator_bootstrap);
230 DBRowGeneratorParser parser_bootstrap(database.handler(), genset_bootstrap);
231 std::shared_ptr< ParamEstimator > param_estimator_bootstrap(
232 createParamEstimator_(parser_bootstrap, takeIntoAccountScore));
// EM estimator: missing cells are completed by a DBRowGeneratorEM; the
// dummy BN is presumably replaced later by the EM loop — TODO confirm
235 BayesNet< GUM_SCALAR > dummy_bn;
236 DBRowGeneratorEM< GUM_SCALAR > generator_EM(col_types, dummy_bn);
237 DBRowGenerator& gen_EM = generator_EM;
238 DBRowGeneratorSet genset_EM;
239 genset_EM.insertGenerator(gen_EM);
240 DBRowGeneratorParser parser_EM(database.handler(), genset_EM);
241 std::shared_ptr< ParamEstimator > param_estimator_EM(
242 createParamEstimator_(parser_EM, takeIntoAccountScore));
244 return {param_estimator_bootstrap, param_estimator_EM};
// Learns the parameters of the BN whose structure is `dag` using EM.
// NOTE(review): extraction damage — the trailing arguments of the
// createBNwithEM call (original lines 261+) and the closing braces are
// missing from this view.
248 template <
typename GUM_SCALAR >
249 BayesNet< GUM_SCALAR >
250 BNLearner< GUM_SCALAR >::_learnParametersWithEM_(
const DAG& dag,
251 bool takeIntoAccountScore) {
// an empty dag yields an empty BN
253 if (dag.size() == 0)
return BayesNet< GUM_SCALAR >();
// get the bootstrap and EM estimators, then run EM
256 auto estimators = _initializeEMParameterLearning_(dag, takeIntoAccountScore);
259 return dag2BN_.createBNwithEM< GUM_SCALAR >(*(estimators.first.get()),
260 *(estimators.second.get()),
// Learns the parameters of `bn` (structure taken from bn.dag()) using EM.
// NOTE(review): extraction damage — the trailing arguments of the
// createBNwithEM call (original lines 277+) and the closing braces are
// missing from this view.
265 template <
typename GUM_SCALAR >
266 BayesNet< GUM_SCALAR >
267 BNLearner< GUM_SCALAR >::_learnParametersWithEM_(
const BayesNet< GUM_SCALAR >& bn,
268 bool takeIntoAccountScore) {
// an empty BN yields an empty BN
270 if (bn.dag().size() == 0)
return BayesNet< GUM_SCALAR >();
// get the bootstrap and EM estimators, then run EM
273 auto estimators = _initializeEMParameterLearning_(bn.dag(), takeIntoAccountScore);
275 return dag2BN_.createBNwithEM< GUM_SCALAR >(*(estimators.first.get()),
276 *(estimators.second.get()),
281 template <
typename GUM_SCALAR >
282 BayesNet< GUM_SCALAR > BNLearner< GUM_SCALAR >::learnParameters(
const DAG& dag,
283 bool takeIntoAccountScore) {
284 if (!scoreDatabase_.databaseTable().hasMissingValues() || !useEM_) {
286 return _learnParameters_(dag, takeIntoAccountScore);
289 return _learnParametersWithEM_(dag, takeIntoAccountScore);
294 template <
typename GUM_SCALAR >
295 BayesNet< GUM_SCALAR >
296 BNLearner< GUM_SCALAR >::learnParameters(
const BayesNet< GUM_SCALAR >& bn,
297 bool takeIntoAccountScore) {
298 if (!scoreDatabase_.databaseTable().hasMissingValues() || !useEM_) {
300 const auto& db = scoreDatabase_.databaseTable();
301 for (
const auto n: bn.nodes()) {
302 dag.addNodeWithId(db.columnFromVariableName(bn.variable(n).name()));
304 for (
const auto& arc: bn.arcs()) {
305 dag.addArc(db.columnFromVariableName(bn.variable(arc.tail()).name()),
306 db.columnFromVariableName(bn.variable(arc.head()).name()));
310 return _learnParameters_(dag, takeIntoAccountScore);
312 return _learnParametersWithEM_(bn, takeIntoAccountScore);
317 template <
typename GUM_SCALAR >
318 BayesNet< GUM_SCALAR > BNLearner< GUM_SCALAR >::learnParameters(
bool take_into_account_score) {
319 return learnParameters(initialDag_, take_into_account_score);
// Reads the header of the CSV file `filename` and, for each column whose
// name matches a variable of `src`, collects that variable's labels.
// NOTE(review): extraction damage — the `try` block opening, the lookup
// that sets `graphId` (presumably src.idFromName on the column name —
// TODO confirm), the catch body and closing braces are missing from this
// view.
322 template <
typename GUM_SCALAR >
323 NodeProperty< Sequence< std::string > >
324 BNLearner< GUM_SCALAR >::_labelsFromBN_(
const std::string& filename,
325 const BayesNet< GUM_SCALAR >& src) {
// open the CSV file; raise IOError if it cannot be read
326 std::ifstream in(filename, std::ifstream::in);
328 if ((in.rdstate() & std::ifstream::failbit) != 0) {
329 GUM_ERROR(gum::IOError,
"File " << filename <<
" not found")
// the first CSV row gives the column (variable) names
332 CSVParser parser(in, filename);
334 auto names = parser.current();
336 NodeProperty< Sequence< std::string > > modals;
338 for (
gum::Idx col = 0; col < names.size(); col++) {
// copy all labels of the matching BN variable into modals[col]
343 for (
gum::Size i = 0; i < src.variable(graphId).domainSize(); ++i)
344 modals[col].insert(src.variable(graphId).label(i));
345 }
// columns with no matching variable in src are skipped
catch (
const gum::NotFound&) {
// Pretty-prints the learner's state() as aligned "key : value (comment)"
// lines.
// NOTE(review): extraction damage — the declarations of `maxkey` and of
// the output stream `s`, the end-of-line emission, the final return and
// closing braces are missing from this view.
353 template <
typename GUM_SCALAR >
354 std::string BNLearner< GUM_SCALAR >::toString()
const {
355 const auto st = state();
// first pass: find the widest key so values can be column-aligned
358 for (
const auto& tuple: st)
359 if (std::get< 0 >(tuple).length() > maxkey) maxkey = std::get< 0 >(tuple).length();
// second pass: emit "key : value" plus an optional "(comment)" suffix
362 for (
const auto& tuple: st) {
363 s << std::setiosflags(std::ios::left) << std::setw(maxkey) << std::get< 0 >(tuple) <<
" : "
364 << std::get< 1 >(tuple);
365 if (std::get< 2 >(tuple) !=
"") s <<
" (" << std::get< 2 >(tuple) <<
")";
// Returns the learner's configuration as (key, value, comment) tuples:
// database summary, selected algorithm, score, MIIC correction, prior,
// weights, EM settings and all structural constraints.
// NOTE(review): this block is heavily damaged by extraction — the leading
// integers fused into the lines are the original file's line numbers, and
// many statements are missing from this view: the declarations of `key`,
// `comment`, the stringstream `s`, `res`, `first`/`nofirst`, numerous
// `break`s and closing braces, and several `vals.emplace_back` argument
// lists. Do not assume the visible text is the complete function.
371 template <
typename GUM_SCALAR >
372 std::vector< std::tuple< std::string, std::string, std::string > >
373 BNLearner< GUM_SCALAR >::state()
const {
374 std::vector< std::tuple< std::string, std::string, std::string > > vals;
// ---- database summary -------------------------------------------------
378 const auto& db = database();
380 vals.emplace_back(
"Filename", filename_,
"");
381 vals.emplace_back(
"Size",
382 "(" + std::to_string(nbRows()) +
"," + std::to_string(nbCols()) +
")",
// list every variable with its domain size
385 std::string vars =
"";
386 for (NodeId i = 0; i < db.nbVariables(); i++) {
387 if (i > 0) vars +=
", ";
388 vars += nameFromId(i) +
"[" + std::to_string(db.domainSize(i)) +
"]";
390 vals.emplace_back(
"Variables", vars,
"");
391 vals.emplace_back(
"Induced types", inducedTypes_ ?
"True" :
"False",
"");
392 vals.emplace_back(
"Missing values", hasMissingValues() ?
"True" :
"False",
"");
// ---- structure-learning algorithm -------------------------------------
395 switch (selectedAlgo_) {
396 case AlgoType::GREEDY_HILL_CLIMBING :
397 vals.emplace_back(key,
"Greedy Hill Climbing",
"");
399 case AlgoType::K2 : {
400 vals.emplace_back(key,
"K2",
"");
// also report the node ordering imposed on K2
401 const auto& k2order = algoK2_.order();
403 for (NodeId i = 0; i < k2order.size(); i++) {
404 if (i > 0) vars +=
", ";
405 vars += nameFromId(k2order.atPos(i));
407 vals.emplace_back(
"K2 order", vars,
"");
409 case AlgoType::LOCAL_SEARCH_WITH_TABU_LIST :
410 vals.emplace_back(key,
"Local Search with Tabu List",
"");
411 vals.emplace_back(
"Tabu list size", std::to_string(nbDecreasingChanges_),
"");
413 case AlgoType::MIIC : vals.emplace_back(key,
"MIIC",
"");
break;
414 default : vals.emplace_back(key,
"(unknown)",
"?");
break;
// ---- score (only meaningful for score-based algorithms) ---------------
419 if (isScoreBased()) {
420 switch (scoreType_) {
421 case ScoreType::K2 : vals.emplace_back(key,
"K2",
"");
break;
422 case ScoreType::AIC : vals.emplace_back(key,
"AIC",
"");
break;
423 case ScoreType::BIC : vals.emplace_back(key,
"BIC",
"");
break;
424 case ScoreType::BD : vals.emplace_back(key,
"BD",
"");
break;
425 case ScoreType::BDeu : vals.emplace_back(key,
"BDeu",
"");
break;
426 case ScoreType::LOG2LIKELIHOOD : vals.emplace_back(key,
"Log2Likelihood",
"");
break;
427 default : vals.emplace_back(key,
"(unknown)",
"?");
break;
// ---- MIIC mutual-information correction (constraint-based only) -------
431 if (isConstraintBased()) {
433 switch (kmodeMiic_) {
434 case CorrectedMutualInformation::KModeTypes::MDL :
435 vals.emplace_back(key,
"MDL",
"");
437 case CorrectedMutualInformation::KModeTypes::NML :
438 vals.emplace_back(key,
"NML",
"");
440 case CorrectedMutualInformation::KModeTypes::NoCorr :
441 vals.emplace_back(key,
"No correction",
"");
443 default : vals.emplace_back(key,
"(unknown)",
"?");
break;
// ---- prior -------------------------------------------------------------
// the comment column warns about score/prior incompatibilities
448 comment = checkScorePriorCompatibility();
449 switch (priorType_) {
450 case BNLearnerPriorType::NO_prior : vals.emplace_back(key,
"-", comment);
break;
451 case BNLearnerPriorType::DIRICHLET_FROM_DATABASE :
452 vals.emplace_back(key,
"Dirichlet", comment);
453 vals.emplace_back(
"Dirichlet from database", priorDbname_,
"");
455 case BNLearnerPriorType::DIRICHLET_FROM_BAYESNET :
456 vals.emplace_back(key,
"Dirichlet", comment);
457 vals.emplace_back(
"Dirichlet from Bayesian network : ", _prior_bn_.toString(),
"");
459 case BNLearnerPriorType::BDEU : vals.emplace_back(key,
"BDEU", comment);
break;
460 case BNLearnerPriorType::SMOOTHING : vals.emplace_back(key,
"Smoothing", comment);
break;
461 default : vals.emplace_back(key,
"(unknown)",
"?");
break;
464 if (priorType_ != BNLearnerPriorType::NO_prior)
465 vals.emplace_back(
"Prior weight", std::to_string(priorWeight_),
"");
// ---- database weight (only when it differs from the row count) --------
467 if (databaseWeight() !=
double(nbRows())) {
468 vals.emplace_back(
"Database weight", std::to_string(databaseWeight()),
"");
// ---- EM settings -------------------------------------------------------
473 if (!hasMissingValues()) comment =
"But no missing values in this database";
474 vals.emplace_back(
"use EM",
"True",
"");
// describe every enabled EM stopping criterion, comma-separated
478 if (dag2BN_.isEnabledMinEpsilonRate()) {
479 s <<
"MinRate: " << dag2BN_.minEpsilonRate();
482 if (dag2BN_.isEnabledEpsilon()) {
483 if (!first) s <<
", ";
485 s <<
"MinDiff: " << dag2BN_.epsilon();
487 if (dag2BN_.isEnabledMaxIter()) {
488 if (!first) s <<
", ";
490 s <<
"MaxIter: " << dag2BN_.maxIter();
492 if (dag2BN_.isEnabledMaxTime()) {
493 if (!first) s <<
", ";
495 s <<
"MaxTime: " << dag2BN_.maxTime();
498 vals.emplace_back(
"EM stopping criteria", s.str(), comment);
// ---- structural constraints -------------------------------------------
503 if (constraintIndegree_.maxIndegree() < std::numeric_limits< Size >::max()) {
504 vals.emplace_back(
"Constraint Max InDegree",
505 std::to_string(constraintIndegree_.maxIndegree()),
508 if (!constraintForbiddenArcs_.arcs().empty()) {
511 for (
const auto& arc: constraintForbiddenArcs_.arcs()) {
512 if (nofirst) res +=
", ";
514 res += nameFromId(arc.tail()) +
"->" + nameFromId(arc.head());
517 vals.emplace_back(
"Constraint Forbidden Arcs", res,
"");
519 if (!constraintMandatoryArcs_.arcs().empty()) {
522 for (
const auto& arc: constraintMandatoryArcs_.arcs()) {
523 if (nofirst) res +=
", ";
525 res += nameFromId(arc.tail()) +
"->" + nameFromId(arc.head());
528 vals.emplace_back(
"Constraint Mandatory Arcs", res,
"");
530 if (!constraintPossibleEdges_.edges().empty()) {
533 for (
const auto& edge: constraintPossibleEdges_.edges()) {
534 if (nofirst) res +=
", ";
536 res += nameFromId(edge.first()) +
"--" + nameFromId(edge.second());
539 vals.emplace_back(
"Constraint Possible Edges", res,
"");
541 if (!constraintSliceOrder_.sliceOrder().empty()) {
544 const auto& order = constraintSliceOrder_.sliceOrder();
545 for (
const auto& p: order) {
546 if (nofirst) res +=
", ";
548 res += nameFromId(p.first) +
":" + std::to_string(p.second);
551 vals.emplace_back(
"Constraint Slice Order", res,
"");
553 if (!constraintNoParentNodes_.nodes().empty()) {
556 for (
const auto& node: constraintNoParentNodes_.nodes()) {
557 if (nofirst) res +=
", ";
559 res += nameFromId(node);
562 vals.emplace_back(
"Constraint No Parent Nodes", res,
"");
564 if (!constraintNoChildrenNodes_.nodes().empty()) {
567 for (
const auto& node: constraintNoChildrenNodes_.nodes()) {
568 if (nofirst) res +=
", ";
570 res += nameFromId(node);
573 vals.emplace_back(
"Constraint No Children Nodes", res,
"");
// ---- initial DAG -------------------------------------------------------
575 if (initialDag_.size() != 0) {
576 vals.emplace_back(
"Initial DAG",
"True", initialDag_.toDot());
// Copies another learner's configuration (algorithm, score, correction,
// prior, EM settings and constraints) into this learner, translating node
// ids through variable names so both learners may use different databases.
// NOTE(review): extraction damage — several `break`s and the closing
// braces of the switches/loops are missing from this view.
582 template <
typename GUM_SCALAR >
583 void BNLearner< GUM_SCALAR >::copyState(
const BNLearner< GUM_SCALAR >& learner) {
// replicate the structure-learning algorithm selection
584 switch (learner.selectedAlgo_) {
585 case AlgoType::GREEDY_HILL_CLIMBING : useGreedyHillClimbing();
break;
586 case AlgoType::K2 : useK2(learner.algoK2_.order());
break;
587 case AlgoType::LOCAL_SEARCH_WITH_TABU_LIST :
588 useLocalSearchWithTabuList(learner.nbDecreasingChanges_);
590 case AlgoType::MIIC : useMIIC();
break;
// replicate the score selection
593 switch (learner.scoreType_) {
594 case ScoreType::K2 : useScoreK2();
break;
595 case ScoreType::AIC : useScoreAIC();
break;
596 case ScoreType::BIC : useScoreBIC();
break;
597 case ScoreType::BD : useScoreBD();
break;
598 case ScoreType::BDeu : useScoreBDeu();
break;
599 case ScoreType::LOG2LIKELIHOOD : useScoreLog2Likelihood();
break;
// replicate the MIIC mutual-information correction
602 switch (learner.kmodeMiic_) {
603 case CorrectedMutualInformation::KModeTypes::MDL : useMDLCorrection();
break;
604 case CorrectedMutualInformation::KModeTypes::NML : useNMLCorrection();
break;
605 case CorrectedMutualInformation::KModeTypes::NoCorr : useNoCorrection();
break;
// replicate the prior selection
608 switch (learner.priorType_) {
609 case BNLearnerPriorType::NO_prior : useNoPrior();
break;
610 case BNLearnerPriorType::DIRICHLET_FROM_DATABASE :
611 useDirichletPrior(learner.priorDbname_, learner.priorWeight_);
613 case BNLearnerPriorType::DIRICHLET_FROM_BAYESNET :
614 useDirichletPrior(learner._prior_bn_);
616 case BNLearnerPriorType::BDEU : useBDeuPrior(learner.priorWeight_);
break;
617 case BNLearnerPriorType::SMOOTHING : useSmoothingPrior(learner.priorWeight_);
break;
// replicate EM settings
620 useEM_ = learner.useEM_;
621 noiseEM_ = learner.noiseEM_;
622 dag2BN_ = learner.dag2BN_;
// replicate all structural constraints, translating ids via names
624 setMaxIndegree(learner.constraintIndegree_.maxIndegree());
625 for (
const auto src: learner.constraintNoParentNodes_.nodes()) {
627 const auto dst = idFromName(learner.nameFromId(src));
628 addNoParentNode(dst);
633 for (
const auto src: learner.constraintNoChildrenNodes_.nodes()) {
635 const auto dst = idFromName(learner.nameFromId(src));
636 addNoChildrenNode(dst);
641 for (
const auto& arc: learner.constraintForbiddenArcs_.arcs()) {
643 const auto src = idFromName(learner.nameFromId(arc.tail()));
644 const auto dst = idFromName(learner.nameFromId(arc.head()));
645 addForbiddenArc(src, dst);
650 for (
const auto& arc: learner.constraintMandatoryArcs_.arcs()) {
652 const auto src = idFromName(learner.nameFromId(arc.tail()));
653 const auto dst = idFromName(learner.nameFromId(arc.head()));
654 addMandatoryArc(src, dst);
659 for (
const auto& edge: learner.constraintPossibleEdges_.edges()) {
661 const auto src = idFromName(learner.nameFromId(edge.first()));
662 const auto dst = idFromName(learner.nameFromId(edge.second()));
663 addPossibleEdge(src, dst);
668 if (!learner.constraintSliceOrder_.sliceOrder().empty()) {
669 NodeProperty< NodeId > slice_order;
670 for (
const auto& p: learner.constraintSliceOrder_.sliceOrder()) {
672 slice_order.insert(idFromName(learner.nameFromId(p.first)), p.second);
677 setSliceOrder(slice_order);
// (Re)creates the prior object matching priorType_, sets its weight, and
// deletes the previously owned prior.
// NOTE(review): extraction damage — the left-hand sides of several
// assignments (the bare `=` lines presumably assign `prior_` or
// `priorDatabase_` — TODO confirm), the `break`s and the closing braces
// are missing from this view.
681 template <
typename GUM_SCALAR >
682 void BNLearner< GUM_SCALAR >::createPrior_() {
// keep the old prior alive until the new one is built (exception safety)
684 Prior* old_prior = prior_;
687 switch (priorType_) {
688 case BNLearnerPriorType::NO_prior :
689 prior_ =
new NoPrior(scoreDatabase_.databaseTable(), scoreDatabase_.nodeId2Columns());
692 case BNLearnerPriorType::SMOOTHING :
694 =
new SmoothingPrior(scoreDatabase_.databaseTable(), scoreDatabase_.nodeId2Columns());
697 case BNLearnerPriorType::DIRICHLET_FROM_DATABASE :
// drop any previously loaded prior database before reloading it
698 if (priorDatabase_ !=
nullptr) {
699 delete priorDatabase_;
700 priorDatabase_ =
nullptr;
704 =
new Database(priorDbname_, scoreDatabase_, scoreDatabase_.missingSymbols());
706 prior_ =
new DirichletPriorFromDatabase(scoreDatabase_.databaseTable(),
707 priorDatabase_->parser(),
708 priorDatabase_->nodeId2Columns());
711 case BNLearnerPriorType::DIRICHLET_FROM_BAYESNET :
713 =
new DirichletPriorFromBN< GUM_SCALAR >(scoreDatabase_.databaseTable(), &_prior_bn_);
716 case BNLearnerPriorType::BDEU :
717 prior_ =
new BDeuPrior(scoreDatabase_.databaseTable(), scoreDatabase_.nodeId2Columns());
// apply the user-selected weight to the freshly created prior
724 prior_->setWeight(priorWeight_);
727 if (old_prior !=
nullptr)
delete old_prior;
730 template <
typename GUM_SCALAR >
731 INLINE std::ostream&
operator<<(std::ostream& output,
const BNLearner< GUM_SCALAR >& learner) {
732 output << learner.toString();
A listener that allows BNLearner to be used as a proxy for its inner algorithms.
A basic pack of learning algorithms that can easily be used.
Class representing a Bayesian network.
Error: The database contains some missing values.
Error: A name of variable is not found in the database.
Exception : operation not allowed.
BNLearner(const std::string &filename, const std::vector< std::string > &missingSymbols={"?"}, const bool induceTypes=true)
default constructor
A pack of learning algorithms that can easily be used.
#define GUM_ERROR(type, msg)
std::size_t Size
In aGrUM, hashed values are unsigned long int.
Size Idx
Type for indexes.
Size NodeId
Type for node ids.
include the inlined functions if necessary
gum is the global namespace for all aGrUM entities
std::ostream & operator<<(std::ostream &out, const TiXmlNode &base)