85 lines
2.0 KiB
Julia
85 lines
2.0 KiB
Julia
# Split the forward-pass function `ex` into its argument list and its body.
#
# `ex` is first normalised with `shortdef` and must then have the shape
# `(args...) -> body`. The body is passed through `graphm` and `il` (both
# defined outside this file; presumably they build and inline a dataflow
# graph -- TODO confirm), and every element that names one of `params` is
# replaced by the field access `self.<name>`.
#
# Returns the tuple `(args, body)`.
# Throws an `ArgumentError` when `ex` does not have the expected shape.
function process_func(ex, params)
  # `@capture` returns `false` on a mismatch and leaves `args`/`body` unset;
  # fail here with a clear message instead of deep inside `graphm`.
  @capture(shortdef(ex), (args__,) -> body_) ||
    throw(ArgumentError("expected a function of the form `(args...) -> body`, got: $ex"))
  body = il(graphm(body))
  # Parameters live on the layer instance, so refer to them through `self`.
  body = map(x -> x in params ? :(self.$x) : x, body)
  return args, body
end
|
||
|
||
# Generate the definition of the layer type `T`.
#
# The type gets one field per entry of `params`, followed by one field named
# `Δ<param>` per entry. An extra constructor taking only the parameters is
# emitted as well; it fills each `Δ` field with `zeros(<param>)`.
#
# Returns the quoted block containing both definitions.
function build_type(T, params)
  Δfields = [symbol("Δ", p) for p in params]
  Δinits = [:(zeros($p)) for p in params]
  quote
    type $T
      $(params...)
      $(Δfields...)
    end
    $T($(params...)) = $T($(params...), $(Δinits...))
  end
end
|
||
|
||
# Build the forward-pass graph: `body` is passed through `cut_forward` together
# with `args`, and the result through `cse`. Both helpers are defined outside
# this file (`cse` is presumably common-subexpression elimination -- TODO confirm).
build_forward(body, args) = cse(cut_forward(body, args))
|
||
|
||
# Fold into `ex`, via `addΔ`, the entry stored under `key` in each element of
# `Δloops`; an element without `key` contributes `vertex(0)`.
function _addloopΔs(ex, Δloops, key)
  for Δloop in Δloops
    ex = addΔ(ex, get(Δloop, key, vertex(0)))
  end
  return ex
end

# Build the backward-pass graph for `body` with respect to the input `x`.
#
# `cut_backward` (defined outside this file) yields `Δs` and `Δloops`. For each
# parameter that has an entry `self.<param>` in `Δs`, a `setfield!` step is
# threaded onto the graph that adds the accumulated value to the `Δ<param>`
# field of `self`. The final step is a one-element tuple holding the
# accumulated value for `x`. The finished graph is passed through `cse`.
function build_backward(body, x, params)
  Δs, Δloops = cut_backward(body, [x])
  back = IVertex{Any}(Flow.Do())
  for param in params
    field = :(self.$param)
    # Parameters without an entry in `Δs` get no update step.
    haskey(Δs, field) || continue
    k = symbol("Δ", param)
    ksym = Expr(:quote, k)
    ex = _addloopΔs(Δs[field], Δloops, field)
    thread!(back, @v(setfield!(:self, ksym, :(self.$k) + ex)))
  end
  ex = _addloopΔs(Δs[x], Δloops, x)
  thread!(back, @flow(tuple($ex)))
  return cse(back)
end
|
||
|
||
# Generate the `update!(self::T)` method.
#
# For every parameter `p` the method body adds `self.Δp` to `self.p` and then
# resets `self.Δp` with `fill!(…, 0)`.
#
# Returns the quoted short-form method definition.
function build_update(T, params)
  # Expression that applies and then clears one parameter's accumulator.
  applyΔ(p, Δp) = :(self.$p += self.$Δp; fill!(self.$Δp, 0))
  updates = [applyΔ(p, symbol("Δ", p)) for p in params]
  return :(update!(self::$T) = $(updates...))
end
|
||
|
||
# Expand a layer definition of the form
#
#     type Name
#       param1; param2; ...
#       <one function of a single argument>
#     end
#
# into generated code: the type itself (`build_type`), a call overload running
# the forward pass, a `back!` method, and an `update!` method. The result is
# passed through `longdef` before being returned.
#
# Throws an `ArgumentError` when `ex` is not a `type ... end` expression, and
# an `AssertionError` when the definition does not contain exactly one
# function or that function does not take exactly one argument.
function process_type(ex)
  # `@capture` returns `false` on a mismatch and leaves `T`/`fs` unset;
  # report that here rather than failing obscurely in `groupby`.
  @capture(ex, type T_ fs__ end) ||
    throw(ArgumentError("expected a `type ... end` definition, got: $ex"))
  # Bare symbols are the parameters; everything else is treated as a function.
  # Either group defaults to `[]` when absent.
  @destruct [params = true || [],
             funcs  = false || []] = groupby(x->isa(x, Symbol), fs)
  @assert length(funcs) == 1 "a layer definition must contain exactly one function, found $(length(funcs))"
  args, body = process_func(funcs[1], params)
  @assert length(args) == 1 "the layer function must take exactly one argument, found $(length(args))"
  generated = quote
    $(build_type(T, params))
    (self::$T)($(args...),) = $(syntax(build_forward(body, args)))
    back!(self::$T, Δ, $(args...)) = $(syntax(build_backward(body, args[1], params)))
    $(build_update(T, params))
  end
  return longdef(generated)
end
|
||
|
||
# Example (disabled): expanding a simple feed-forward layer definition.
# process_type(:(type Sigmoid
#   W
#   b
#   bp
#   x -> σ(W*x+b)
# end)) |> prettify
|
||
|
||
# Demo: expand a recurrent layer definition and tidy the generated code with
# `prettify` for inspection.
prettify(process_type(:(type Recurrent
  Wxh; Whh; Bh
  Why; By

  function (x)
    hidden = σ( Wxh*x + Whh*Delay(hidden) + Bh )
    y = σ( Why*hidden + By )
  end
end)))
|