-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathControl.h
More file actions
102 lines (92 loc) · 2.69 KB
/
Control.h
File metadata and controls
102 lines (92 loc) · 2.69 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
/*
* Copyright 2014 Saminda Abeyruwan (saminda@cs.miami.edu)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* Control.h
*
* Created on: Aug 19, 2012
* Author: sam
*/
#ifndef CONTROL_H_
#define CONTROL_H_
#include "Action.h"
#include "Vector.h"
#include "Function.h"
#include "Policy.h"
#include "Predictor.h"
namespace RLLib
{
template<class T>
class Control: public ParameterizedFunction<T>
{
public:
virtual ~Control()
{
}
virtual const Action<T>* initialize(const Vector<T>* x) =0;
virtual void reset() =0;
virtual const Action<T>* proposeAction(const Vector<T>* x) =0;
virtual const Action<T>* step(const Vector<T>* x_t, const Action<T>* a_t,
const Vector<T>* x_tp1, const T& r_tp1, const T& z_tp1) =0;
virtual T computeValueFunction(const Vector<T>* x) const =0;
virtual const Predictor<T>* predictor() const =0;
};
template<class T>
class OnPolicyControlLearner: public Control<T>
{
public:
virtual ~OnPolicyControlLearner()
{
}
};
template<class T>
class OffPolicyControlLearner: public Control<T>
{
public:
virtual ~OffPolicyControlLearner()
{
}
virtual void learn(const Vector<T>* x_t, const Action<T>* a_t, const Vector<T>* x_tp1,
const T& r_tp1, const T& z_tp1) = 0;
};
template<class T>
class ActorOffPolicy: public ParameterizedFunction<T>
{
public:
virtual ~ActorOffPolicy()
{
}
virtual void initialize() =0;
virtual void reset() =0;
virtual void update(const Representations<T>* phi_t, const Action<T>* a_t, T const& rho_t,
const T& delta_t) =0;
virtual PolicyDistribution<T>* policy() const =0;
virtual const Action<T>* proposeAction(const Representations<T>* phi) =0;
virtual T pi(const Action<T>* a) const =0;
};
template<class T>
class ActorOnPolicy: public ParameterizedFunction<T>
{
public:
virtual ~ActorOnPolicy()
{
}
virtual void initialize() =0;
virtual void reset() =0;
virtual void update(const Representations<T>* phi_t, const Action<T>* a_t, T delta) =0;
virtual PolicyDistribution<T>* policy() const =0;
virtual const Action<T>* proposeAction(const Representations<T>* phi) =0;
};
} // namespace RLLib
#endif /* CONTROL_H_ */