00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032 #ifndef CSEMIMDPLISTENER_H
00033 #define CSEMIMDPLISTENER_H
00034
00035 #include "cparameters.h"
00036
00037 class CAction; // forward declaration: used below only as a CAction * parameter
00038 class CState; // forward declaration: not referenced in the visible part of this header
00039 class CStateCollection; // forward declaration: used below only as a CStateCollection * parameter
00040 class CRewardFunction; // forward declaration: used below only through CRewardFunction * (member, parameter, return type)
00041
00043
00059 class CSemiMDPListener : virtual public CParameterObject
00060 {
      // Listener interface with three overridable hooks: nextStep(),
      // intermediateStep() and newEpisode(). Every hook has an empty inline
      // default, so a subclass only has to override the ones it needs.
      // NOTE(review): the component that invokes these hooks is not visible in
      // this header; when each hook fires must be confirmed against the caller.
00061 public:
      // Flag initialised to true by the constructor. Nothing in this header reads
      // it; presumably the notifying side skips listeners whose flag is false -
      // TODO confirm.
00062 bool enabled;
00063
      // Creates a listener with enabled == true.
00064 CSemiMDPListener() : enabled(true) {}
00065
      // Step hook, no-op by default. The commented parameter names follow the
      // names used by CSemiMDPRewardListener::nextStep() in this header.
00067 virtual void nextStep(CStateCollection * /*oldState*/, CAction * /*action*/, CStateCollection * /*nextState*/) {}
      // Intermediate-step hook, no-op by default; same parameter list as nextStep().
00069 virtual void intermediateStep(CStateCollection * /*oldState*/, CAction * /*action*/, CStateCollection * /*nextState*/) {}
      // Episode hook, no-op by default. Presumably signalled when a new episode
      // starts (name-based assumption - confirm against the caller).
00071 virtual void newEpisode() {}
00072 };
00073
00074
00076
00080 class CSemiMDPRewardListener : public CSemiMDPListener
00081 {
      // Listener variant that carries a CRewardFunction pointer and adds, for each
      // of the two step hooks, a second overload with an extra double argument
      // (named "reward" in the override declared by
      // CAdaptiveParameterFromAverageRewardCalculator in this header).
      // NOTE(review): the three-argument overloads are only declared here;
      // presumably their out-of-line definitions evaluate the reward function and
      // forward to the four-argument overloads - confirm in the implementation file.
00082 protected:
      // Reward function pointer; presumably set from the constructor argument and
      // setRewardFunction(). Ownership is not expressed in this header.
00084 CRewardFunction *semiMDPRewardFunction;
00085
00086 public:
      // Takes the reward function to work with; defined out of line.
00088 CSemiMDPRewardListener(CRewardFunction *semiMDPRewardFunction);
00089
      // Overrides the base-class step hook; defined out of line.
00091 virtual void nextStep(CStateCollection *oldState, CAction *action, CStateCollection *nextState);
      // Step hook with the additional double argument; no-op by default.
00093 virtual void nextStep(CStateCollection * /*oldState*/, CAction * /*action*/, double /*reward*/, CStateCollection * /*nextState*/) {}
00094
      // Overrides the base-class intermediate-step hook; defined out of line.
00096 virtual void intermediateStep(CStateCollection *oldState, CAction *action, CStateCollection *nextState);
      // Intermediate-step hook with the additional double argument; no-op by default.
00098 virtual void intermediateStep(CStateCollection * /*oldState*/, CAction * /*action*/, double /*reward*/, CStateCollection * /*nextState*/) {}
00099
      // Setter and getter for the reward function pointer; both defined out of line.
00100 void setRewardFunction(CRewardFunction *semiMDPRewardFunction);
00101 CRewardFunction *getRewardFunction();
00102 };
00103
00105
00112 class CAdaptiveParameterFromNStepsCalculator : public CAdaptiveParameterUnBoundedValuesCalculator, public CSemiMDPListener
00113 {
      // Adaptive-parameter calculator that is also a CSemiMDPListener and overrides
      // the nextStep() hook.
      // NOTE(review): judging by the class name and the nStepsPerUpdate argument it
      // presumably derives the target parameter from a step counter and refreshes it
      // every nStepsPerUpdate steps - confirm in the implementation file.
00114 protected:
      // NOTE(review): presumably the step counter fed into the calculator - confirm.
00115 int targetValue;
      // Presumably the number of steps between two parameter updates (name-based).
00116 int nStepsPerUpdate;
00117 public:
      // Defined out of line. NOTE(review): apart from nStepsPerUpdate the arguments
      // are presumably passed on to the CAdaptiveParameterUnBoundedValuesCalculator
      // base - confirm.
00118 CAdaptiveParameterFromNStepsCalculator(CParameters *targetObject, string targetParameter, int nStepsPerUpdate, int functionKind, double param0, double paramScale, double targetOffset, double targetScale);
00119 virtual ~CAdaptiveParameterFromNStepsCalculator();
00120
      // Step hook override; defined out of line.
00121 virtual void nextStep(CStateCollection *, CAction *, CStateCollection *);
      // Forwards to the calculator base class and does nothing else.
      // NOTE(review): presumably declared here because onParametersChanged() is
      // reachable through both base classes - confirm.
00122 virtual void onParametersChanged() { CAdaptiveParameterUnBoundedValuesCalculator::onParametersChanged(); }
00123
      // Defined out of line.
00124 virtual void resetCalculator();
00125 };
00126
00128
00135 class CAdaptiveParameterFromNEpisodesCalculator : public CAdaptiveParameterUnBoundedValuesCalculator, public CSemiMDPListener
00136 {
      // Adaptive-parameter calculator that is also a CSemiMDPListener and overrides
      // the newEpisode() hook.
      // NOTE(review): judging by the class name it presumably derives the target
      // parameter from an episode counter - confirm in the implementation file.
00137 protected:
      // NOTE(review): presumably the episode counter fed into the calculator - confirm.
00138 int targetValue;
00139 public:
      // Defined out of line. NOTE(review): the arguments are presumably passed on to
      // the CAdaptiveParameterUnBoundedValuesCalculator base - confirm.
00140 CAdaptiveParameterFromNEpisodesCalculator(CParameters *targetObject, string targetParameter, int functionKind, double param0, double paramScale, double targetOffset, double targetScale);
00141 virtual ~CAdaptiveParameterFromNEpisodesCalculator();
00142
      // Episode hook override; defined out of line.
00143 virtual void newEpisode();
      // Forwards to the calculator base class and does nothing else.
      // NOTE(review): presumably declared here because onParametersChanged() is
      // reachable through both base classes - confirm.
00144 virtual void onParametersChanged() { CAdaptiveParameterUnBoundedValuesCalculator::onParametersChanged(); }
00145
      // Defined out of line.
00146 virtual void resetCalculator();
00147 };
00148
00149
00151
00159 class CAdaptiveParameterFromAverageRewardCalculator : public CAdaptiveParameterBoundedValuesCalculator, public CSemiMDPRewardListener
00160 {
      // Adaptive-parameter calculator that is also a CSemiMDPRewardListener and
      // overrides the four-argument nextStep() hook, i.e. the one that receives a
      // reward value.
      // NOTE(review): judging by the class name and the alpha argument it presumably
      // keeps a smoothed average of the reward and maps it onto the target parameter
      // every nStepsPerUpdate steps - confirm in the implementation file.
00161 protected:
      // NOTE(review): presumably the smoothing factor of the reward average - confirm.
00162 double alpha;
      // NOTE(review): presumably the current averaged reward fed into the calculator - confirm.
00163 double targetValue;
      // NOTE(review): presumably counts steps since the last parameter update - confirm.
00164 int nSteps;
      // Presumably the number of steps between two parameter updates (name-based).
00165 int nStepsPerUpdate;
00166 public:
      // Defined out of line. NOTE(review): reward is presumably handed to the
      // CSemiMDPRewardListener base and the min/max arguments to the
      // CAdaptiveParameterBoundedValuesCalculator base - confirm.
00167 CAdaptiveParameterFromAverageRewardCalculator(CParameters *targetObject, string targetParameter, CRewardFunction *reward, int nStepsPerUpdate, int functionKind, double paramMin, double paramMax, double targetMin, double targetMax, double alpha);
      // Declared virtual explicitly, like the destructors of the NSteps and NEpisodes
      // calculators in this header, so that virtual destruction does not depend on
      // what the base classes (not visible here) declare.
00168 virtual ~CAdaptiveParameterFromAverageRewardCalculator();
00169
      // Reward-carrying step hook override; defined out of line. Declaring only this
      // overload hides the inherited three-argument nextStep() for calls made through
      // this class type; calls through a base-class pointer are unaffected.
00170 virtual void nextStep(CStateCollection *oldState, CAction *action, double reward, CStateCollection *newState);
      // Defined out of line.
00171 virtual void onParametersChanged();
00172
      // Defined out of line.
00173 virtual void resetCalculator();
00174 };
00175
00176 #endif // CSEMIMDPLISTENER_H
00177