Qualia  0.2
QLearningSoftmaxPolicy.h
Go to the documentation of this file.
1 /*
2  * QLearningSoftmaxPolicy.h
3  *
4  * (c) 2011 Sofian Audry -- info(@)sofianaudry(.)com
5  *
6  * This program is free software: you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License as published by
8  * the Free Software Foundation, either version 3 of the License, or
9  * (at your option) any later version.
10  *
11  * This program is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14  * GNU General Public License for more details.
15  *
16  * You should have received a copy of the GNU General Public License
17  * along with this program. If not, see <http://www.gnu.org/licenses/>.
18  */
19 
20 #ifndef QLEARNINGSOFTMAXPOLICY_H_
21 #define QLEARNINGSOFTMAXPOLICY_H_
22 
23 #include "Policy.h"
24 #include "QLearningAgent.h"
25 #include <math.h>
26 
34 public:
37  float temperature; ///< Temperature setting of this policy; the constructor's same-named parameter defaults to 1.0.
                       ///< NOTE(review): presumably the softmax temperature applied to the action values
                       ///< (higher = closer to uniform choice) -- confirm against the implementation file.
38 
41  float epsilon; ///< Epsilon setting of this policy; the constructor's same-named parameter defaults to 0.0.
                   ///< NOTE(review): presumably the probability of picking an action uniformly at random
                   ///< instead of using the softmax distribution -- confirm against the implementation file.
42 
/**
 * Constructs the policy. Both arguments are optional, so this also serves as
 * the default constructor.
 *
 * @param temperature  defaults to 1.0. NOTE(review): presumably stored in the
 *                     public member of the same name -- the definition is not
 *                     in this header, confirm there.
 * @param epsilon      defaults to 0.0. NOTE(review): presumably stored in the
 *                     public member of the same name -- confirm likewise.
 */
43  QLearningSoftmaxPolicy(float temperature = 1.0, float epsilon = 0.0);
/**
 * Virtual destructor: lets an instance be destroyed correctly through a
 * pointer to a base class. Defined outside this header.
 */
44  virtual ~QLearningSoftmaxPolicy();
45 
/**
 * Chooses an action given an observation. Only declared here; the selection
 * logic lives in the implementation file.
 * NOTE(review): presumably overrides the action-selection hook declared in
 * Policy.h and samples according to the temperature/epsilon members -- confirm.
 *
 * @param action       non-const pointer. NOTE(review): presumably an output
 *                     that receives the chosen action -- confirm.
 * @param observation  pointer to a const Observation; it cannot be modified
 *                     through this parameter.
 */
46  virtual void chooseAction(Action* action, const Observation* observation);
47 };
48 
49 #endif /* QLEARNINGSOFTMAXPOLICY_H_ */