Flux.jl/src/backend/tensorflow/model.jl

type Model
  model::Any
  session::Session
  params::Dict{Flux.Param,Tensor}
  inputs::Vector{Tensor}
  output::Any
end

function makesession(model, inputs; session = Session(Graph()))
  params, output = tograph(model, inputs...)
  run(session, initialize_all_variables())
  Model(model, session, params, inputs, output)
end

function makesession(model, n::Integer; session = Session(Graph()))
  makesession(model, [placeholder(Float32) for _ = 1:n], session = session)
end

tf(model) = makesession(model, 1)

function storeparams!(sess, params)
  for (p, t) in params
    p.x = run(sess, t)
  end
end

storeparams!(m::Model) = storeparams!(m.session, m.params)

ismultioutput(m::Model) = !isa(m.output, Tensor)

function batch(xs)
  dims = ndims(xs)-1
  T = Array{eltype(xs),dims}
  B = Array{eltype(xs),dims+1}
  Batch{T,B}(xs)
end

function runmodel(m, args...)
  @assert length(args) == length(m.inputs)
  output = run(m.session, m.output, Dict(zip(m.inputs, args)))
  ismultioutput(m) ? (batch.(output)...,) : batch(output)
end

function (m::Model)(args::Batch...)
  runmodel(m, args...)
end

function (m::Model)(args...)
  output = m(map(batchone, args)...)
  ismultioutput(m) ? map(first, output) : first(output)
end

for f in :[back!, update!].args
  @eval function Flux.$f(m::Model, args...)
    error($(string(f)) * " is not yet supported on TensorFlow models")
  end
end

import Juno: info

function Flux.train!(m::Model, train, test=[]; epoch = 1, η = 0.1,
                     loss = (y, y′) -> reduce_sum((y - y′).^2)/2,
                     opt = TensorFlow.train.GradientDescentOptimizer(η))
  i = 0
  Y = placeholder(Float32)
  Loss = loss(m.output, Y)
  minimize_op = TensorFlow.train.minimize(opt, Loss)
  for e in 1:epoch
    info("Epoch $e\n")
    @progress for (x, y) in train
      y, cur_loss, _ = run(m.session, vcat(m.output, Loss, minimize_op),
                           Dict(m.inputs[1]=>batchone(x), Y=>batchone(y)))
      if i % 5000 == 0
        @show y
        @show accuracy(m, test)
      end
      i += 1
    end
  end
end
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								type Model
-												handle state on julia side

											
										
										
											2016-10-28 20:17:48 +00:00
+								  model::Any
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								  session::Session
-												better handling for reused params

											
										
										
											2016-10-28 15:06:56 +00:00
+								  params::Dict{Flux.Param,Tensor}
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								  inputs::Vector{Tensor}
-												handle state on julia side

											
										
										
											2016-10-28 20:17:48 +00:00
+								  output::Any
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								end
-												makesession refactor

											
										
										
											2016-12-20 17:18:40 +00:00
+								function makesession(model, inputs; session = Session(Graph()))
 								  params, output = tograph(model, inputs...)
 								  run(session, initialize_all_variables())
 								  Model(model, session, params, inputs, output)
 								end
 								function makesession(model, n::Integer; session = Session(Graph()))
 								  makesession(model, [placeholder(Float32) for _ = 1:n], session = session)
 								end
-												handling of multiple outputs

											
										
										
											2016-10-28 19:50:27 +00:00
-												makesession refactor

											
										
										
											2016-12-20 17:18:40 +00:00
+								tf(model) = makesession(model, 1)
 								function storeparams!(sess, params)
 								  for (p, t) in params
 								    p.x = run(sess, t)
 								  end
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								end
-												makesession refactor

											
										
										
											2016-12-20 17:18:40 +00:00
+								storeparams!(m::Model) = storeparams!(m.session, m.params)
 								ismultioutput(m::Model) = !isa(m.output, Tensor)
-												use batching api

											
										
										
											2016-10-28 16:00:31 +00:00
+								function batch(xs)
 								  dims = ndims(xs)-1
 								  T = Array{eltype(xs),dims}
 								  B = Array{eltype(xs),dims+1}
 								  Batch{T,B}(xs)
 								end
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
-												explicit hidden state batching

											
										
										
											2016-11-15 23:44:11 +00:00
+								function runmodel(m, args...)
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								  @assert length(args) == length(m.inputs)
-												handling of multiple outputs

											
										
										
											2016-10-28 19:50:27 +00:00
+								  output = run(m.session, m.output, Dict(zip(m.inputs, args)))
 								  ismultioutput(m) ? (batch.(output)...,) : batch(output)
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								end
-												explicit hidden state batching

											
										
										
											2016-11-15 23:44:11 +00:00
+								function (m::Model)(args::Batch...)
 								  runmodel(m, args...)
 								end
-												handling of multiple outputs

											
										
										
											2016-10-28 19:50:27 +00:00
+								function (m::Model)(args...)
 								  output = m(map(batchone, args)...)
 								  ismultioutput(m) ? map(first, output) : first(output)
 								end
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
-												remove gradient support for now

											
										
										
											2016-12-20 16:37:43 +00:00
+								for f in :[back!, update!].args
 								  @eval function Flux.$f(m::Model, args...)
 								    error($(string(f)) * " is not yet supported on TensorFlow models")
 								  end
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								end
 								import Juno: info
 								function Flux.train!(m::Model, train, test=[]; epoch = 1, η = 0.1,
 								                     loss = (y, y′) -> reduce_sum((y - y′).^2)/2,
 								                     opt = TensorFlow.train.GradientDescentOptimizer(η))
 								  i = 0
 								  Y = placeholder(Float32)
-												split out makesession logic

											
										
										
											2016-10-30 12:10:44 +00:00
+								  Loss = loss(m.output, Y)
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								  minimize_op = TensorFlow.train.minimize(opt, Loss)
 								  for e in 1:epoch
 								    info("Epoch $e\n")
 								    @progress for (x, y) in train
-												split out makesession logic

											
										
										
											2016-10-30 12:10:44 +00:00
+								      y, cur_loss, _ = run(m.session, vcat(m.output, Loss, minimize_op),
-												use batching api

											
										
										
											2016-10-28 16:00:31 +00:00
+								                           Dict(m.inputs[1]=>batchone(x), Y=>batchone(y)))
-												tf reorg

											
										
										
											2016-10-26 13:25:10 +00:00
+								      if i % 5000 == 0
 								        @show y
 								        @show accuracy(m, test)
 								      end
 								      i += 1
 								    end
 								  end
 								end