CVPolicyLearner Class Reference
#include <ctdpolicylearner.h>
Inheritance diagram for CVPolicyLearner:
List of all
members.
|
Public Member Functions
|
|
|
CVPolicyLearner
(CStateReward
*rewardFunction,
CDynamicModel *dynModel,
CDynamicModelInputDerivationCalculator *dynModeldInput,
CGradientVFunction
*vFunction,
CVFunctionInputDerivationCalculator
*vFunctionInputDerivation,
CContinuousActionGradientPolicy
*gradientPolicy,
CCAGradientPolicyInputDerivationCalculator
*policydInput, std::list<
CStateModifier *
> *stateModifiers, int
nForwardView)
|
|
virtual
|
~CVPolicyLearner
()
|
|
virtual void
|
nextStep (CStateCollection *oldState,
CAction *action, double
reward, CStateCollection
*nextState)
|
| |
virtual function, to be implemented by
subclass
|
|
virtual void
|
newEpisode ()
|
| |
tells the Listener that a new Episode has
started.
|
|
|
CVPolicyLearner
(CStateReward
*rewardFunction,
CTransitionFunction
*dynModel,
CTransitionFunctionInputDerivationCalculator
*dynModeldInput,
CAbstractVFunction
*vFunction,
CVFunctionInputDerivationCalculator
*vFunctionInputDerivation,
CContinuousActionGradientPolicy
*gradientPolicy,
CCAGradientPolicyInputDerivationCalculator
*policydInput, std::list<
CStateModifier *
> *stateModifiers, int
nForwardView)
|
|
virtual
|
~CVPolicyLearner
()
|
|
virtual void
|
nextStep (CStateCollection *oldState,
CAction *action, double
reward, CStateCollection
*nextState)
|
| |
virtual function, to be implemented by
subclass
|
|
virtual void
|
newEpisode ()
|
| |
tells the Listener that a new Episode has
started.
|
|
void
|
calculateGradient
(std::list< CStateCollectionImpl *
> *states, std::list< ColumnVector * > *Drewards,
std::list< CContinuousActionData *
> *actionDatas, CFeatureList *policyGradient)
|
Protected Types
|
|
typedef std::list< CFeatureList * >
|
CStateGradient |
|
typedef std::list< CFeatureList * >
|
CStateGradient |
Protected Member Functions
|
|
void
|
getDNextState
(CStateGradient
*stateGradient1,
CStateGradient
*stateGradient2,
CStateCollection
*currentState, CContinuousActionData
*data)
|
|
void
|
multMatrixFeatureList
(Matrix *matrix, CFeatureList *features, int
index, std::list< CFeatureList * >
*newFeatures)
|
|
void
|
getDNextState
(CStateGradient
*stateGradient1,
CStateGradient
*stateGradient2,
CStateCollection
*currentState, CContinuousActionData
*data)
|
|
void
|
multMatrixFeatureList
(Matrix *matrix, CFeatureList *features, int
index, std::list< CFeatureList * >
*newFeatures)
|
Protected Attributes
|
|
CGradientVFunction
*
|
vFunction |
| |
learned VFunction
|
|
CVFunctionInputDerivationCalculator
*
|
vFunctionInputDerivation |
|
CContinuousActionGradientPolicy
*
|
gradientPolicy |
|
CCAGradientPolicyInputDerivationCalculator
*
|
policydInput |
|
ColumnVector *
|
dReward |
|
ColumnVector *
|
dVFunction |
|
Matrix *
|
dPolicy |
|
Matrix *
|
dModelInput |
|
CContinuousActionData
*
|
data |
|
std::list< CStateGradient * >
*
|
stateGradients |
|
CStateGradient *
|
stateGradient1 |
|
CStateGradient *
|
stateGradient2 |
|
CStateGradient *
|
dModelGradient |
|
CStateReward
*
|
rewardFunction |
|
CDynamicModel *
|
dynModel |
|
CDynamicModelInputDerivationCalculator *
|
dynModeldInput |
|
CStateCollectionImpl
*
|
tempStateCol |
|
CFeatureList
*
|
policyGradient |
|
int
|
nForwardView |
|
CAbstractVFunction
*
|
vFunction |
|
CVFunctionInputDerivationCalculator
*
|
vFunctionInputDerivation |
|
CContinuousActionGradientPolicy
*
|
gradientPolicy |
|
CCAGradientPolicyInputDerivationCalculator
*
|
policydInput |
|
ColumnVector *
|
dReward |
|
ColumnVector *
|
dVFunction |
|
Matrix *
|
dPolicy |
|
Matrix *
|
dModelInput |
|
CContinuousActionData
*
|
data |
|
std::list< CStateGradient * >
*
|
stateGradients |
|
CStateGradient *
|
stateGradient1 |
|
CStateGradient *
|
stateGradient2 |
|
CStateGradient *
|
dModelGradient |
|
CStateReward
*
|
rewardFunction |
|
CTransitionFunction
*
|
dynModel |
|
CTransitionFunctionInputDerivationCalculator
*
|
dynModeldInput |
|
CStateCollectionImpl
*
|
tempStateCol |
|
CFeatureList
*
|
policyGradient |
|
std::list< CStateCollectionImpl *
> *
|
pastStates |
|
std::list< ColumnVector * > *
|
pastDRewards |
|
std::list< CContinuousActionData *
> *
|
pastActions |
|
std::list< CStateCollectionImpl *
> *
|
statesResource |
|
std::list< ColumnVector * > *
|
rewardsResource |
|
std::list< CContinuousActionData *
> *
|
actionsResource |
|
std::list< CStateModifier * >
*
|
stateModifiers |
Member Typedef Documentation
Constructor & Destructor Documentation
| virtual
CVPolicyLearner::~CVPolicyLearner
|
( |
|
) |
[virtual] |
|
| virtual
CVPolicyLearner::~CVPolicyLearner
|
( |
|
) |
[virtual] |
|
Member Function Documentation
| void
CVPolicyLearner::multMatrixFeatureList
|
( |
Matrix * |
matrix,
|
|
|
CFeatureList *
|
features,
|
|
|
int |
index,
|
|
|
std::list< CFeatureList * > *
|
newFeatures |
|
) |
[protected] |
|
| void
CVPolicyLearner::multMatrixFeatureList
|
( |
Matrix * |
matrix,
|
|
|
CFeatureList *
|
features,
|
|
|
int |
index,
|
|
|
std::list< CFeatureList * > *
|
newFeatures |
|
) |
[protected] |
|
| virtual void
CVPolicyLearner::newEpisode
|
( |
|
) |
[virtual] |
|
| |
tells the Listener that a new Episode has started.
Reimplemented from CSemiMDPListener.
|
| virtual void
CVPolicyLearner::newEpisode
|
( |
|
) |
[virtual] |
|
| |
tells the Listener that a new Episode has started.
Reimplemented from CSemiMDPListener.
|
Member Data Documentation
The documentation for this class was generated from the following
files:
|