CPEGASUSAnalyticalPolicyGradientCalculator Class Reference
#include <cpegasus.h>
Inheritance diagram for
CPEGASUSAnalyticalPolicyGradientCalculator:
List of all members.
|
Public Member Functions
|
|
|
CPEGASUSAnalyticalPolicyGradientCalculator
(CAgent *agent,
CContinuousActionGradientPolicy
*policy,
CCAGradientPolicyInputDerivationCalculator
*policyInputDerivation, CTransitionFunctionEnvironment
*dynModel,
CTransitionFunctionInputDerivationCalculator
*dynModeldInput,
CStateReward
*reward, int numStartStates, int horizon, double gamma)
|
|
|
~CPEGASUSAnalyticalPolicyGradientCalculator
()
|
|
virtual void
|
getPEGASUSGradient
(CFeatureList
*gradientFeatures, CStateList *startStates)
|
|
virtual void
|
nextStep
(CStateCollection *oldState,
CAction *action,
CStateCollection
*newState)
|
| |
Sends the listener the state-action-state (S-A-S) tuple from a
new step.
|
|
virtual void
|
newEpisode
()
|
| |
Tells the listener that a new episode has
started.
|
Protected Member Functions
|
|
void
|
multMatrixFeatureList
(Matrix *matrix, CFeatureList *features, int
index, std::list< CFeatureList * >
*newFeatures)
|
Protected Attributes
|
|
ColumnVector *
|
dReward |
|
Matrix *
|
dPolicy |
|
Matrix *
|
dModelInput |
|
std::list< CFeatureList * > *
|
stateGradient1 |
|
std::list< CFeatureList * > *
|
stateGradient2 |
|
std::list< CFeatureList * > *
|
dModelGradient |
|
CFeatureList
*
|
episodeGradient |
|
CStateReward
*
|
rewardFunction |
|
CTransitionFunctionInputDerivationCalculator
*
|
dynModeldInput |
|
CCAGradientPolicyInputDerivationCalculator
*
|
policydInput |
|
int
|
steps |
|
CAgent *
|
agent |
Constructor & Destructor Documentation
|
CPEGASUSAnalyticalPolicyGradientCalculator::~CPEGASUSAnalyticalPolicyGradientCalculator
|
( |
|
) |
|
|
Member Function Documentation
| virtual void
CPEGASUSAnalyticalPolicyGradientCalculator::getPEGASUSGradient
|
( |
CFeatureList *
|
gradientFeatures,
|
|
|
CStateList *
|
startStates |
|
) |
[virtual] |
|
| void
CPEGASUSAnalyticalPolicyGradientCalculator::multMatrixFeatureList
|
( |
Matrix * |
matrix,
|
|
|
CFeatureList *
|
features,
|
|
|
int |
index,
|
|
|
std::list< CFeatureList * > *
|
newFeatures |
|
) |
[protected] |
|
| virtual void
CPEGASUSAnalyticalPolicyGradientCalculator::newEpisode
|
( |
|
) |
[virtual] |
|
| |
Tells the listener that a new episode has started.
Reimplemented from CSemiMDPListener.
|
| |
nextStep(): sends the listener the state-action-state (S-A-S) tuple from a new step.
Reimplemented from CSemiMDPListener.
|
Member Data Documentation
The documentation for this class was generated from the following
file:
|