![]() |
aGrUM 2.3.2
a C++ library for (probabilistic) graphical models
|
#include <agrum/FMDP/learning/fmdpLearner.h>
Private Types | |
| using | VariableLearnerType |
| using | RewardLearnerType |
| using | VarLearnerTable = HashTable< const DiscreteVariable*, VariableLearnerType* > |
Private Attributes | |
| FMDP< double > * | _fmdp_ |
| The FMDP to store the learned model. | |
| HashTable< Idx, VarLearnerTable * > | _actionLearners_ |
| bool | _actionReward_ |
| HashTable< Idx, RewardLearnerType * > | _actionRewardLearners_ |
| RewardLearnerType * | _rewardLearner_ |
| const double | _learningThreshold_ |
| const double | _similarityThreshold_ |
Miscelleanous methods | |
| double | _rmax_ |
| learnerSize | |
| double | _modaMax_ |
| learnerSize | |
| Size | size () |
| learnerSize | |
| const IVisitableGraphLearner * | varLearner (Idx actionId, const DiscreteVariable *var) const |
| extractCount | |
| virtual double | rMax () const |
| learnerSize | |
| virtual double | modaMax () const |
| learnerSize | |
Definition at line 76 of file fmdpLearner.h.
|
private |
Definition at line 82 of file fmdpLearner.h.
|
private |
Definition at line 77 of file fmdpLearner.h.
|
private |
Definition at line 86 of file fmdpLearner.h.
| gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::FMDPLearner | ( | double | learningThreshold, |
| bool | actionReward, | ||
| double | similarityThreshold = 0.05 ) |
Default constructor.
Definition at line 67 of file fmdpLearner_tpl.h.
References FMDPLearner(), _actionReward_, _learningThreshold_, _rewardLearner_, and _similarityThreshold_.
Referenced by FMDPLearner(), and ~FMDPLearner().
| gum::FMDPLearner< VariableAttributeSelection, RewardAttributeSelection, LearnerSelection >::~FMDPLearner | ( | ) |
Default destructor.
Definition at line 80 of file fmdpLearner_tpl.h.
References FMDPLearner(), _actionLearners_, _actionRewardLearners_, and _rewardLearner_.
|
inline |
Initializes the learner.
Definition at line 120 of file fmdpLearner.h.
References _instantiateFunctionGraph_().
Referenced by _instantiateFunctionGraph_(), and initialize().
|
inline |
|
inline |
Initializes the learner.
Definition at line 129 of file fmdpLearner.h.
References gum::MultiDimFunctionGraph< GUM_SCALAR, TerminalNodePolicy >::getTreeInstance().
|
inline |
Initializes the learner.
Definition at line 166 of file fmdpLearner.h.
References _instantiateRewardLearner_().
Referenced by _instantiateRewardLearner_(), and initialize().
|
inline |
Initializes the learner.
Definition at line 171 of file fmdpLearner.h.
References _learningThreshold_, and _similarityThreshold_.
|
inline |
Initializes the learner.
Definition at line 180 of file fmdpLearner.h.
References _learningThreshold_.
|
inline |
Initializes the learner.
Definition at line 136 of file fmdpLearner.h.
References _instantiateVarLearner_().
Referenced by _instantiateVarLearner_(), and initialize().
|
inline |
Initializes the learner.
Definition at line 145 of file fmdpLearner.h.
References _learningThreshold_, and _similarityThreshold_.
|
inline |
Initializes the learner.
Definition at line 156 of file fmdpLearner.h.
References _learningThreshold_.
|
virtual |
Gives to the learner a new transition.
| actionId | : the action on which the transition was made |
| obs | : the observed transition |
Implements gum::ILearningStrategy.
Definition at line 160 of file fmdpLearner_tpl.h.
References _actionLearners_, _actionReward_, _actionRewardLearners_, _fmdp_, _rewardLearner_, _rmax_, and gum::Observation::reward().
|
virtual |
Initializes the learner.
Implements gum::ILearningStrategy.
Definition at line 108 of file fmdpLearner_tpl.h.
References _actionLearners_, _actionReward_, _actionRewardLearners_, _fmdp_, _instantiateFunctionGraph_(), _instantiateRewardLearner_(), _instantiateVarLearner_(), _modaMax_, _rewardLearner_, _rmax_, gum::Set< Key >::insert(), and gum::MultiDimFunctionGraph< GUM_SCALAR, TerminalNodePolicy >::setTableName().
|
inlinevirtual |
learnerSize
Implements gum::ILearningStrategy.
Definition at line 244 of file fmdpLearner.h.
References _modaMax_.
|
inlinevirtual |
learnerSize
Implements gum::ILearningStrategy.
Definition at line 238 of file fmdpLearner.h.
References _rmax_.
|
virtual |
learnerSize
Implements gum::ILearningStrategy.
Definition at line 188 of file fmdpLearner_tpl.h.
References _actionLearners_, _actionReward_, _actionRewardLearners_, _fmdp_, and _rewardLearner_.
|
virtual |
Starts an update of datastructure in the associated FMDP.
Implements gum::ILearningStrategy.
Definition at line 212 of file fmdpLearner_tpl.h.
References _actionLearners_, _actionReward_, _actionRewardLearners_, _fmdp_, and _rewardLearner_.
|
inlinevirtual |
extractCount
Implements gum::ILearningStrategy.
Definition at line 234 of file fmdpLearner.h.
References _actionLearners_.
|
private |
Definition at line 256 of file fmdpLearner.h.
Referenced by ~FMDPLearner(), addObservation(), initialize(), size(), updateFMDP(), and varLearner().
|
private |
Definition at line 258 of file fmdpLearner.h.
Referenced by FMDPLearner(), addObservation(), initialize(), size(), and updateFMDP().
|
private |
Definition at line 259 of file fmdpLearner.h.
Referenced by ~FMDPLearner(), addObservation(), initialize(), size(), and updateFMDP().
|
private |
The FMDP to store the learned model.
Definition at line 254 of file fmdpLearner.h.
Referenced by addObservation(), initialize(), size(), and updateFMDP().
|
private |
Definition at line 262 of file fmdpLearner.h.
Referenced by FMDPLearner(), _instantiateRewardLearner_(), _instantiateRewardLearner_(), _instantiateVarLearner_(), and _instantiateVarLearner_().
|
private |
learnerSize
Definition at line 247 of file fmdpLearner.h.
Referenced by initialize(), and modaMax().
|
private |
Definition at line 260 of file fmdpLearner.h.
Referenced by FMDPLearner(), ~FMDPLearner(), addObservation(), initialize(), size(), and updateFMDP().
|
private |
learnerSize
Definition at line 241 of file fmdpLearner.h.
Referenced by addObservation(), initialize(), and rMax().
|
private |
Definition at line 263 of file fmdpLearner.h.
Referenced by FMDPLearner(), _instantiateRewardLearner_(), and _instantiateVarLearner_().