d8/d30/fmdpLearner_8h_source.html

/****************************************************************************

 *   This file is part of the aGrUM/pyAgrum library.                        *

 *                                                                          *

 *   Copyright (c) 2005-2025 by                                             *

 *       - Pierre-Henri WUILLEMIN(_at_LIP6)                                 *

 *       - Christophe GONZALES(_at_AMU)                                     *

 *                                                                          *

 *   The aGrUM/pyAgrum library is free software; you can redistribute it    *

 *   and/or modify it under the terms of either :                           *

 *                                                                          *

 *    - the GNU Lesser General Public License as published by               *

 *      the Free Software Foundation, either version 3 of the License,      *

 *      or (at your option) any later version,                              *

 *    - the MIT license (MIT),                                              *

 *    - or both in dual license, as here.                                   *

 *                                                                          *

 *   (see https://agrum.gitlab.io/articles/dual-licenses-lgplv3mit.html)    *

 *                                                                          *

 *   This aGrUM/pyAgrum library is distributed in the hope that it will be  *

 *   useful, but WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,          *

 *   INCLUDING BUT NOT LIMITED TO THE WARRANTIES MERCHANTABILITY or FITNESS *

 *   FOR A PARTICULAR PURPOSE  AND NONINFRINGEMENT. IN NO EVENT SHALL THE   *

 *   AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER *

 *   LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,        *

 *   ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR  *

 *   OTHER DEALINGS IN THE SOFTWARE.                                        *

 *                                                                          *

 *   See LICENCES for more details.                                         *

 *                                                                          *

 *   SPDX-FileCopyrightText: Copyright 2005-2025                            *

 *       - Pierre-Henri WUILLEMIN(_at_LIP6)                                 *

 *       - Christophe GONZALES(_at_AMU)                                     *

 *   SPDX-License-Identifier: LGPL-3.0-or-later OR MIT                      *

 *                                                                          *

 *   Contact  : info_at_agrum_dot_org                                       *

 *   homepage : http://agrum.gitlab.io                                      *

 *   gitlab   : https://gitlab.com/agrumery/agrum                           *

 *                                                                          *

 ****************************************************************************/


// =========================================================================

#ifndef GUM_FMDP_LEARNER_H

#define GUM_FMDP_LEARNER_H

// =========================================================================

// =========================================================================

#include <agrum/FMDP/learning/datastructure/imddi.h>

#include <agrum/FMDP/learning/datastructure/iti.h>

#include <agrum/FMDP/SDyna/Strategies/ILearningStrategy.h>


// =========================================================================

// =========================================================================


namespace gum {


  template < TESTNAME    VariableAttributeSelection,

             TESTNAME    RewardAttributeSelection,

             LEARNERNAME LearnerSelection >


  class FMDPLearner: public ILearningStrategy {

    using VariableLearnerType =

        typename LearnerSelect< LearnerSelection,

                                IMDDI< VariableAttributeSelection, false >,

                                ITI< VariableAttributeSelection, false > >::type;


    using RewardLearnerType = typename LearnerSelect< LearnerSelection,

                                                      IMDDI< RewardAttributeSelection, true >,

                                                      ITI< RewardAttributeSelection, true > >::type;


    using VarLearnerTable = HashTable< const DiscreteVariable*, VariableLearnerType* >;


    public:

    // ==========================================================================

    // ==========================================================================


    // ###################################################################

    // ###################################################################

    FMDPLearner(double learningThreshold, bool actionReward, double similarityThreshold = 0.05);


    // ###################################################################

    // ###################################################################

    ~FMDPLearner();


    // ###################################################################

    // ###################################################################


    public:

    // ==========================================================================

    // ==========================================================================

    void initialize(FMDP< double >* fmdp);


    // ==========================================================================

    // ==========================================================================


    MultiDimFunctionGraph< double >* _instantiateFunctionGraph_() {

      return _instantiateFunctionGraph_(Int2Type< LearnerSelection >());

    }


    MultiDimFunctionGraph< double >* _instantiateFunctionGraph_(Int2Type< IMDDILEARNER >) {

      return MultiDimFunctionGraph< double,

                                    ExactTerminalNodePolicy >::getReducedAndOrderedInstance();

    }


    MultiDimFunctionGraph< double >* _instantiateFunctionGraph_(Int2Type< ITILEARNER >) {

      return MultiDimFunctionGraph< double, ExactTerminalNodePolicy >::getTreeInstance();

    }


    // ==========================================================================

    // ==========================================================================


    VariableLearnerType* _instantiateVarLearner_(MultiDimFunctionGraph< double >* target,

                                                 gum::VariableSet&                mainVariables,

                                                 const DiscreteVariable*          learnedVar) {

      return _instantiateVarLearner_(target,

                                     mainVariables,

                                     learnedVar,

                                     Int2Type< LearnerSelection >());

    }


    VariableLearnerType* _instantiateVarLearner_(MultiDimFunctionGraph< double >* target,

                                                 gum::VariableSet&                mainVariables,

                                                 const DiscreteVariable*          learnedVar,

                                                 Int2Type< IMDDILEARNER >) {

      return new VariableLearnerType(target,

                                     _learningThreshold_,

                                     _similarityThreshold_,

                                     mainVariables,

                                     learnedVar);

    }


    VariableLearnerType* _instantiateVarLearner_(MultiDimFunctionGraph< double >* target,

                                                 gum::VariableSet&                mainVariables,

                                                 const DiscreteVariable*          learnedVar,

                                                 Int2Type< ITILEARNER >) {

      return new VariableLearnerType(target, _learningThreshold_, mainVariables, learnedVar);

    }


    // ==========================================================================

    // ==========================================================================


    RewardLearnerType* _instantiateRewardLearner_(MultiDimFunctionGraph< double >* target,

                                                  gum::VariableSet&                mainVariables) {

      return _instantiateRewardLearner_(target, mainVariables, Int2Type< LearnerSelection >());

    }


    RewardLearnerType* _instantiateRewardLearner_(MultiDimFunctionGraph< double >* target,

                                                  gum::VariableSet&                mainVariables,

                                                  Int2Type< IMDDILEARNER >) {

      return new RewardLearnerType(target,

                                   _learningThreshold_,

                                   _similarityThreshold_,

                                   mainVariables);

    }


    RewardLearnerType* _instantiateRewardLearner_(MultiDimFunctionGraph< double >* target,

                                                  gum::VariableSet&                mainVariables,

                                                  Int2Type< ITILEARNER >) {

      return new RewardLearnerType(target, _learningThreshold_, mainVariables);

    }


    // ###################################################################

    // ###################################################################


    public:

    // ==========================================================================

    // ==========================================================================

    bool addObservation(Idx actionId, const Observation* obs);


    // ==========================================================================

    // ==========================================================================

    void updateFMDP();


    // ###################################################################

    // ###################################################################


    public:

    // ==========================================================================

    // ==========================================================================

    Size size();


    // ==========================================================================

    // ==========================================================================


    const IVisitableGraphLearner* varLearner(Idx actionId, const DiscreteVariable* var) const {

      return _actionLearners_[actionId]->getWithDefault(var, nullptr);

    }


    virtual double rMax() const { return _rmax_; }


    private:

    double _rmax_;


    public:

    virtual double modaMax() const { return _modaMax_; }


    private:

    double _modaMax_;


    private:

    FMDP< double >* _fmdp_;


    HashTable< Idx, VarLearnerTable* > _actionLearners_;


    bool                                 _actionReward_;

    HashTable< Idx, RewardLearnerType* > _actionRewardLearners_;

    RewardLearnerType*                   _rewardLearner_;


    const double _learningThreshold_;

    const double _similarityThreshold_;

  };


} /* namespace gum */


#include <agrum/FMDP/learning/fmdpLearner_tpl.h>


#endif   // GUM_FMDP_LEARNER_H

ILearningStrategy.h
Headers of the Learning Strategy interface.

double

gum::DiscreteVariable
Base class for discrete random variable.
Definition discreteVariable.h:78

gum::ExactTerminalNodePolicy
Implementation of a Terminal Node Policy that maps nodeid directly to value.
Definition ExactTerminalNodePolicy.h:70

gum::FMDPLearner::_instantiateVarLearner_
VariableLearnerType * _instantiateVarLearner_(MultiDimFunctionGraph< double > *target, gum::VariableSet &mainVariables, const DiscreteVariable *learnedVar, Int2Type< ITILEARNER >)
Initializes the learner.
Definition fmdpLearner.h:156

gum::FMDPLearner::_instantiateRewardLearner_
RewardLearnerType * _instantiateRewardLearner_(MultiDimFunctionGraph< double > *target, gum::VariableSet &mainVariables, Int2Type< ITILEARNER >)
Initializes the learner.
Definition fmdpLearner.h:180

gum::FMDPLearner::RewardLearnerType
typename LearnerSelect< LearnerSelection, IMDDI< RewardAttributeSelection, true >, ITI< RewardAttributeSelection, true > >::type RewardLearnerType
Definition fmdpLearner.h:82

gum::FMDPLearner::_actionRewardLearners_
HashTable< Idx, RewardLearnerType * > _actionRewardLearners_
Definition fmdpLearner.h:259

gum::FMDPLearner::_similarityThreshold_
const double _similarityThreshold_
Definition fmdpLearner.h:263

gum::FMDPLearner::_instantiateRewardLearner_
RewardLearnerType * _instantiateRewardLearner_(MultiDimFunctionGraph< double > *target, gum::VariableSet &mainVariables)
Initializes the learner.
Definition fmdpLearner.h:166

gum::FMDPLearner::~FMDPLearner
~FMDPLearner()
Default destructor.
Definition fmdpLearner_tpl.h:81

gum::FMDPLearner::_instantiateVarLearner_
VariableLearnerType * _instantiateVarLearner_(MultiDimFunctionGraph< double > *target, gum::VariableSet &mainVariables, const DiscreteVariable *learnedVar, Int2Type< IMDDILEARNER >)
Initializes the learner.
Definition fmdpLearner.h:145

gum::FMDPLearner::rMax
virtual double rMax() const
learnerSize
Definition fmdpLearner.h:238

gum::FMDPLearner::_instantiateFunctionGraph_
MultiDimFunctionGraph< double > * _instantiateFunctionGraph_()
Initializes the learner.
Definition fmdpLearner.h:120

gum::FMDPLearner::modaMax
virtual double modaMax() const
learnerSize
Definition fmdpLearner.h:244

gum::FMDPLearner::_modaMax_
double _modaMax_
learnerSize
Definition fmdpLearner.h:247

gum::FMDPLearner::size
Size size()
learnerSize
Definition fmdpLearner_tpl.h:189

gum::FMDPLearner::_instantiateFunctionGraph_
MultiDimFunctionGraph< double > * _instantiateFunctionGraph_(Int2Type< ITILEARNER >)
Initializes the learner.
Definition fmdpLearner.h:129

gum::FMDPLearner::updateFMDP
void updateFMDP()
Starts an update of the data structures in the associated FMDP.
Definition fmdpLearner_tpl.h:213

gum::FMDPLearner::_fmdp_
FMDP< double > * _fmdp_
The FMDP to store the learned model.
Definition fmdpLearner.h:254

gum::FMDPLearner::_rmax_
double _rmax_
learnerSize
Definition fmdpLearner.h:241

gum::FMDPLearner::_actionReward_
bool _actionReward_
Definition fmdpLearner.h:258

gum::FMDPLearner::VarLearnerTable
HashTable< const DiscreteVariable *, VariableLearnerType * > VarLearnerTable
Definition fmdpLearner.h:86

gum::FMDPLearner::varLearner
const IVisitableGraphLearner * varLearner(Idx actionId, const DiscreteVariable *var) const
extractCount
Definition fmdpLearner.h:234

gum::FMDPLearner::_learningThreshold_
const double _learningThreshold_
Definition fmdpLearner.h:262

gum::FMDPLearner::_rewardLearner_
RewardLearnerType * _rewardLearner_
Definition fmdpLearner.h:260

gum::FMDPLearner::FMDPLearner
FMDPLearner(double learningThreshold, bool actionReward, double similarityThreshold=0.05)
Default constructor.
Definition fmdpLearner_tpl.h:68

gum::FMDPLearner::initialize
void initialize(FMDP< double > *fmdp)
Initializes the learner.
Definition fmdpLearner_tpl.h:109

gum::FMDPLearner::_actionLearners_
HashTable< Idx, VarLearnerTable * > _actionLearners_
Definition fmdpLearner.h:256

gum::FMDPLearner::_instantiateRewardLearner_
RewardLearnerType * _instantiateRewardLearner_(MultiDimFunctionGraph< double > *target, gum::VariableSet &mainVariables, Int2Type< IMDDILEARNER >)
Initializes the learner.
Definition fmdpLearner.h:171

gum::FMDPLearner::VariableLearnerType
typename LearnerSelect< LearnerSelection, IMDDI< VariableAttributeSelection, false >, ITI< VariableAttributeSelection, false > >::type VariableLearnerType
Definition fmdpLearner.h:77

gum::FMDPLearner::_instantiateFunctionGraph_
MultiDimFunctionGraph< double > * _instantiateFunctionGraph_(Int2Type< IMDDILEARNER >)
Initializes the learner.
Definition fmdpLearner.h:124

gum::FMDPLearner::_instantiateVarLearner_
VariableLearnerType * _instantiateVarLearner_(MultiDimFunctionGraph< double > *target, gum::VariableSet &mainVariables, const DiscreteVariable *learnedVar)
Initializes the learner.
Definition fmdpLearner.h:136

gum::FMDPLearner::addObservation
bool addObservation(Idx actionId, const Observation *obs)
Gives the learner a new transition.
Definition fmdpLearner_tpl.h:161

gum::FMDP< double >

gum::HashTable
The class for generic Hash Tables.
Definition hashTable.h:637

gum::ILearningStrategy
<agrum/FMDP/SDyna/ILearningStrategy.h>
Definition ILearningStrategy.h:74

gum::IMDDI
Definition imddi.h:74

gum::ITI
Learn a graphical representation of a function as a decision tree.
Definition iti.h:79

gum::IVisitableGraphLearner
<agrum/FMDP/SDyna/IVisitableGraphLearner.h>
Definition IVisitableGraphLearner.h:71

gum::MultiDimFunctionGraph< double >

gum::MultiDimFunctionGraph::getTreeInstance
static MultiDimFunctionGraph< GUM_SCALAR, TerminalNodePolicy > * getTreeInstance()
Returns an arborescent instance.
Definition multiDimFunctionGraph_tpl.h:616

gum::Observation
Definition observation.h:73

fmdpLearner_tpl.h
Template Implementations of the FMDPLearner class.

gum::Size
std::size_t Size
In aGrUM, hashed values are unsigned long int.
Definition types.h:74

gum::Idx
Size Idx
Type for indexes.
Definition types.h:79

imddi.h
Headers of the IMDDI class.

iti.h
Headers of the ITI class.

gum
gum is the global namespace for all aGrUM entities
Definition agrum.h:46

gum::VariableSet
Set< const DiscreteVariable * > VariableSet
Definition discreteVariable.h:187

gum::LEARNERNAME
LEARNERNAME
Definition templateStrategy.h:87

gum::TESTNAME
TESTNAME
Definition templateStrategy.h:60

gum::Int2Type
Definition templateStrategy.h:56

gum::LearnerSelect
Definition templateStrategy.h:90