OptImpSampling.jl/src/control.jl at main · axsk/OptImpSampling.jl · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
using FLoops: @floop
using StaticArrays

"""
    controlled_drift(D, xx, p, t, ::Val{n}, f, g, u)

In-place drift `b + σu` of the controlled system with one extra coordinate.

The first `n` entries of `xx` are read as the state `x`. `D[1:end-1]` is set to
`f(x, p, t)` plus the noise coefficient `g(x, p, t)` applied to the control `u(x, t)`:
a matrix-vector product when `g` returns any `AbstractMatrix`, an elementwise product
otherwise. `D[end]` is set to `|u(x, t)|² / 2`.
"""
function controlled_drift(D, xx, p, t, ::Val{n}, f::F, g::G, u::U) where {n,F,G,U}
    x = SVector{n}(@view xx[1:n])
    ux = u(x, t)
    gx = g(x, p, t)
    # Test against `AbstractMatrix` (as `controlled_noise` does) so that static,
    # diagonal or otherwise wrapped matrices also take the matrix-vector branch.
    if gx isa AbstractMatrix
        D[1:end-1] .= f(x, p, t) .+ gx * ux
    else
        D[1:end-1] .= f(x, p, t) .+ gx .* ux
    end
    D[end] = sum(abs2, ux) / 2
end

"""
    controlled_noise(D, xx, p, t, ::Val{n}, g, u)

In-place noise matrix of the controlled system with one extra coordinate.

`D` is zeroed, then its upper-left `n × n` block receives `g(x, p, t)`: copied as is
for a matrix, placed on the diagonal entry by entry for a vector, and repeated on the
diagonal otherwise. The last row (columns `1:end-1`) is set to the control `u(x, t)`.
"""
function controlled_noise(D, xx, p, t, ::Val{n}, g::G, u::U) where {n,G,U}
    state = SVector{n}(@view xx[1:n])
    sigma = g(state, p, t)
    D .= 0
    if sigma isa AbstractMatrix
        D[1:n, 1:n] .= sigma
    else
        # vector noise contributes one entry per coordinate,
        # anything else is used as a constant on the diagonal
        pervariable = sigma isa AbstractVector
        for k in 1:n
            D[k, k] = pervariable ? sigma[k] : sigma
        end
    end
    D[end, 1:end-1] .= u(state, t)
end

# Lift the problem dimension `length(sde.u0)` into a `Val` so that the method
# below can specialize on it (the drift and noise build `SVector`s of that length).
function GirsanovSDE(sde, u::F) where F
    dim = length(sde.u0)
    return GirsanovSDE(sde, u, Val(dim))
end

"""
    GirsanovSDE(sde, u, ::Val{n})

Construct the SDE problem for Girsanov with control `u`.

The initial state `sde.u0` is extended by one extra coordinate starting at 0. Drift
and noise are given by `controlled_drift` and `controlled_noise`, built from `sde.f`,
`sde.g` and `u`. `sde.tspan`, `sde.p`, `sde.noise` and `sde.kwargs` are forwarded to
the new `SDEProblem`, whose noise rate prototype is a square `(n+1) × (n+1)` matrix.

Throws an `ErrorException` if `u` cannot be evaluated as `u(x, t)`; the message
includes the underlying error.
"""
function GirsanovSDE(sde, u::U, ::Val{n}) where {n, U}
    nrp = zeros(n+1, n+1)  # we could do with (n+1,n) but SROCK2 only takes square noise
    u0 = vcat(sde.u0, 0)   # append the girsanov dimension

    # Probe the control with the same kind of arguments the drift and noise pass
    # to it (an `SVector{n}` state and a time taken from `tspan`), and report the
    # underlying failure instead of swallowing it.
    xprobe = SVector{n}(sde.u0)
    tprobe = first(sde.tspan)
    try
        u(xprobe, tprobe)
    catch err
        error("control `u` has wrong signature: $(sprint(showerror, err))")
    end

    drift(D,x,p,t) = controlled_drift(D,x,p,t, Val(n), sde.f, sde.g, u)
    noise(D,x,p,t) = controlled_noise(D,x,p,t, Val(n), sde.g, u)

    return StochasticDiffEq.SDEProblem(drift, noise, u0, sde.tspan, sde.p; noise=sde.noise,
        noise_rate_prototype = nrp, sde.kwargs...)
end

## TODO: where do we use this?
"""
    CompoundSDE(sde, u, v::Val{n} = Val(length(sde.u0)))

Construct an SDE problem on the state of `sde` extended by one coordinate `w`
that starts at 1.

With `x` the first `n` coordinates, `ux = u(x, t)` and `gx = sde.g(x, p, t)`:

- drift of `x`: `sde.f(x, p, t)` plus `gx` applied to `ux`
  (matrix-vector product for a matrix `gx`, elementwise otherwise),
- drift of `w`: `-w * |ux|² / 2`,
- noise: `gx` in the upper-left `n × n` block (matrix as is, vector or scalar on the
  diagonal) and `-w * ux` in the last row.

`sde.tspan`, `sde.p`, `sde.noise` and `sde.kwargs` are forwarded to the new problem.
"""
function CompoundSDE(sde, u::U, v::Val{n} = Val(length(sde.u0))) where {n, U}
    nrp = zeros(n+1, n+1)
    u0 = vcat(sde.u0, 1.)

    f = sde.f
    g = sde.g

    function drift(D, xx, p, t)
        x = SVector{n}(@view xx[1:n])
        ux = u(x, t)
        gx = g(x, p, t)
        # same noise-coefficient handling as `controlled_drift`
        if gx isa AbstractMatrix
            D[1:end-1] .= f(x, p, t) .+ gx * ux
        else
            D[1:end-1] .= f(x, p, t) .+ gx .* ux
        end
        D[end] = -xx[end] * sum(abs2, ux) / 2
        return nothing
    end

    function noise(D, xx, p, t)
        x = SVector{n}(@view xx[1:n])
        ux = u(x, t)
        gx = g(x, p, t)
        D .= 0
        # same noise-coefficient handling as `controlled_noise`
        if gx isa AbstractMatrix
            D[1:n, 1:n] .= gx
        elseif gx isa AbstractVector
            for i in 1:n
                D[i, i] = gx[i]
            end
        else
            for i in 1:n
                D[i, i] = gx
            end
        end
        D[end, 1:end-1] .= (-xx[end]) .* ux
        return nothing
    end

    return StochasticDiffEq.SDEProblem(drift, noise, u0, sde.tspan, sde.p;
        noise=sde.noise, noise_rate_prototype = nrp, sde.kwargs...)
end

"""
    nocontrol(x, t)

The zero control: return `zero(x)`, ignoring the time `t`.
"""
function nocontrol(x, t)
    return zero(x)
end

"""
    girsanovsample(cde, x0)

Convenience wrapper for obtaining `X[end]` and the Girsanov weight.

Solves `cde` started from `x0` extended by a zero extra coordinate and returns
`(x, w)`: `x` is the final state without the extra coordinate and `w = exp(-z)`,
where `z` is the final value of the extra coordinate.
"""
function girsanovsample(cde, x0)
    u0 = vcat(x0, 0)
    sol = solve(cde; u0=u0)
    # Read the stored final state through `sol.u` rather than through integer
    # indexing of the solution object, and index it only once.
    final = sol.u[end]
    x = final[1:end-1]
    w = exp(-final[end])
    return x::Vector{Float64}, w::Float64
end

# TODO: maybe use DiffEq MC interface
"""
    girsanovbatch(cde, xs, n)

Draw `n` Girsanov samples for every column of `xs` (one start point per column).

Returns `(ys, ws)`: `ys[:, i, j]` is the final state and `ws[i, j]` the weight of the
`j`-th sample started at `xs[:, i]`, each obtained from `girsanovsample`.
"""
function girsanovbatch(cde, xs, n)
    dim, nx = size(xs)
    ys = zeros(Float64, dim, nx, n)
    ws = zeros(Float64, nx, n)
    @floop for i in 1:nx, j in 1:n  # using @floop allows threaded iteration over i AND j
        endpoint, weight = girsanovsample(cde, xs[:, i])
        ys[:, i, j] = endpoint
        ws[i, j] = weight
    end
    return ys, ws
end

"""
    optcontrol(chis, Q, T, sigma, i)

Optimal control `u(x, t) = σᵀ ∇log(Z)`
for `Z = (Kχ)ᵢ` if `Kχ = exp(Q (T - t)) χ`,
given in terms of the known generator `Q`.

Returns the closure `u(x, t)`.
"""
function optcontrol(chis, Q, T, sigma, i)
    function u(x, t)
        # `Zygote.gradient` returns a tuple with one entry per differentiated
        # argument, so the single gradient has to be unpacked before use.
        grads = Zygote.gradient(x) do y  # this should prob. be ForwardDiff
            Z = exp(Q * (T - t)) * chis(y)
            log(Z[i])
        end
        dlogz = first(grads)
        return sigma' * dlogz
    end
    return u
end

"""
    Shiftscale(a, q)

K on {v₁, v₂} acts like a shift-scale, represented by `Shiftscale`.

The two fields parametrize the map `data -> λ * data + a * (1 - λ)` with
`λ = exp(q * T)` for a time `T`.
"""
struct Shiftscale
    a::Float64  # shift parameter
    q::Float64  # rate: the scale factor over time T is exp(q * T)
end

"""
    Shiftscale(data::AbstractArray, T=1)

Estimate a `Shiftscale` from the extrema of `data`.

The scale `λ` is taken as `maximum(data) - minimum(data)`, the shift as
`minimum(data) / (1 - λ)` and the rate as `log(λ) / T`.
"""
function Shiftscale(data::AbstractArray, T=1)
    lo, hi = extrema(data)
    lambda = hi - lo
    shift = lo / (1 - lambda)
    rate = log(lambda) / T
    return Shiftscale(shift, rate)
end

# Apply the shift-scale over time `T`: with λ = exp(T * s.q) every entry of
# `data` is mapped to `λ * data + s.a * (1 - λ)`.
function (s::Shiftscale)(data, T=1)
    lambda = exp(T * s.q)
    shift = s.a * (1 - lambda)
    return @. data * lambda + shift
end

"""
    invert(s, data, T=1)

Undo the shift-scale `s` over time `T`: with `λ = exp(T * s.q)` return
`(data - s.a * (1 - λ)) / λ`, applied elementwise.
"""
function invert(s, data, T=1)
    lambda = exp(T * s.q)
    shift = s.a * (1 - lambda)
    return @. (data - shift) / lambda
end

# TODO: check if this gives the same results as ociso
"""
    optcontrol(chi, S::Shiftscale, T, sigma)

Assume χ = a1 + bϕ with Kᵀϕ = λϕ and λ = exp(qT).
Then Kᵀχ = λχ + a(1-λ)1.
Given minima and maxima of Kᵀχ we can estimate λ and a (stored in `S`)
and therefore compute the optimal control for Kχ = E[χ]:
u* = -σᵀ∇Φ = σᵀ∇log(Kχ).

Returns the closure `u(x, t)`. Where the estimated `Kχ` is negative, a warning is
logged and the gradient is taken of the constant zero instead of the logarithm.
"""
function optcontrol(chi::F, S::Shiftscale, T, sigma) where F
    function u(x, t)
        dlogz = ForwardDiff.gradient(x) do x
            lambda = exp(S.q*(T-t))
            Z = lambda * first(chi(x)) + S.a*(1-lambda)
            if Z < 0
                @warn("negative log in control encountered")
                # same number type as `log(Z)`, keeping the closure type stable
                return zero(Z)
            end
            log(Z)
        end  # TODO: the gradient type should be inferred!
        return sigma' * dlogz
    end
    return u
end

# Convenience wrapper: take the final time from `sde.tspan` and the noise
# coefficient from `sde.g` (evaluated with `nothing` for all arguments), then
# forward to the four-argument method.
function optcontrol(model, S::Shiftscale, sde)
    noisecoeff = sde.g(nothing, nothing, nothing)
    horizon = sde.tspan[end]
    return optcontrol(model, S, horizon, noisecoeff)
end

### Tests

# Smoke test: build the uncontrolled Girsanov problem for the `Doublewell` model
# and draw 3 samples for each of 2 random one-dimensional start points.
function test_GirsanovSDE()
    problem = GirsanovSDE(SDEProblem(Doublewell()), nocontrol)
    starts = rand(1, 2)
    return girsanovbatch(problem, starts, 3)
end

# Smoke test: build a control from a `fluxnet` model and a fixed `Shiftscale`,
# then draw 3 samples for each of 2 random one-dimensional start points.
function test_optcontrol()
    base = SDEProblem(Doublewell())
    chi = fluxnet([1, 3, 3, 1])
    ctrl = optcontrol(chi, Shiftscale(1, 0), 1, 1)
    problem = GirsanovSDE(base, ctrl)
    return girsanovbatch(problem, rand(1, 2), 3)
end

# Check that the closure returned by `optcontrol` and `control` on an
# `OptChiControl` give the same value at the same point.
function test_compare_controls()
    chi = fluxnet()
    S = Shiftscale(0, 0)

    c1 = optcontrol(chi, S, 1., 1.)([1.], 1)
    c2 = control(OptChiControl(chi, S), [1.], 1.)

    @assert c1 == c2
end