# Flux.jl/test/optimise.jl

using Flux.Optimise
using Flux.Optimise: runall
using Flux.Tracker
using Test
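
# Each optimiser testset trains a tracked copy w′ towards a fixed random
# target w by minimising Flux.mse(w*x, w′*x) on random inputs, then checks
# that w′ has converged to w.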
@testset "Optimise" begin
  w = randn(10, 10)
  @testset for opt in [ADAMW(), ADAGrad(0.1), AdaMax(), ADADelta(0.9), AMSGrad(),
                       NADAM(), Descent(0.1), ADAM(), Nesterov(), RMSProp(),
                       Momentum()]
    w′ = param(randn(10, 10))
    loss(x) = Flux.mse(w*x, w′*x)
    for t = 1:10^5
      # Take the gradient of the loss w.r.t. w′ and apply one optimiser step.
      θ = Params([w′])
      θ̄ = gradient(() -> loss(rand(10)), θ)
      Optimise.update!(opt, θ, θ̄)
    end
    @test Flux.mse(w, w′) < 0.01
  end
end
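
# `Optimiser` composes several optimisers, applying each update rule in turn;
# here each decay transform is chained with ADAM.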
@testset "Optimiser" begin
  w = randn(10, 10)
  @testset for Opt in [InvDecay, WeightDecay, ExpDecay]
    w′ = param(randn(10, 10))
    loss(x) = Flux.mse(w*x, w′*x)
    opt = Optimiser(Opt(), ADAM(0.001))
    for t = 1:10^5
      l = loss(rand(10))
      back!(l)
      # apply! returns the step to take; apply it to the parameters by hand.
      delta = Optimise.apply!(opt, w′.data, w′.grad)
      w′.data .-= delta
    end
    @test Flux.mse(w, w′) < 0.01
  end
end
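
# `train!` evaluates the loss over the data iterator; the throttled callback
# calls Flux.stop() once a few steps have run, ending training early.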
@testset "Training Loop" begin
  i = 0
  l = param(1)

  Flux.train!(() -> (sleep(0.1); i += 1; l),
              (),
              Iterators.repeated((), 100),
              Descent(),
              cb = Flux.throttle(() -> (i > 3 && Flux.stop()), 1))

  @test 3 < i < 50

  # Test multiple callbacks
  x = 0
  fs = [() -> (), () -> x = 1]
  cbs = runall(fs)
  cbs()
  @test x == 1
end