# Flux.jl/test/layers/normalisation.jl

using Flux, Test, Statistics
using Zygote: pullback
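# Run f's forward pass inside Zygote's pullback so that layers follow their
# training-time code path (e.g. Dropout actually drops) without an explicit
# trainmode! call; only the primal value is returned.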
evalwgrad(f, x...) = pullback(f, x...)[1]
@testset "Dropout" begin
x = [1.,2.,3.]
@test x == Dropout(0.1)(x)
@test x == evalwgrad(Dropout(0), x)
@test zero(x) == evalwgrad(Dropout(1), x)
x = rand(100)
m = Dropout(0.9)
y = evalwgrad(m, x)
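# With p = 0.9 about 90 of the 100 entries are zeroed on average; > 50 keeps
# the check loose enough not to be flaky.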
@test count(a->a==0, y) > 50
testmode!(m, true)
y = evalwgrad(m, x) # should override istraining
@test count(a->a==0, y) == 0
testmode!(m, false)
y = evalwgrad(m, x)
@test count(a->a==0, y) > 50
x = rand(Float32, 100)
m = Chain(Dense(100,100),
          Dropout(0.9))
y = evalwgrad(m, x)
@test count(a->a == 0, y) > 50
testmode!(m, true)
y = evalwgrad(m, x) # should override istraining
@test count(a->a == 0, y) == 0
x = rand(100, 50)
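# With dims = 2 the dropout mask is drawn per column and broadcast along
# dimension 1, so whole columns are kept or dropped together and every row
# ends up with the same number of zeros (and vice versa for dims = 1).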
m = Dropout(0.5, dims = 2)
y = m(x)
c = map(i->count(a->a==0, @view y[i, :]), 1:100)
@test minimum(c) == maximum(c)
m = Dropout(0.5, dims = 1)
y = m(x)
c = map(i->count(a->a==0, @view y[:, i]), 1:50)
@test minimum(c) == maximum(c)
end
@testset "BatchNorm" begin
let m = BatchNorm(2), x = [1.0 3.0 5.0;
                           2.0 4.0 6.0]
@test length(params(m)) == 2
@test m.β == [0, 0] # initβ(2)
@test m.γ == [1, 1] # initγ(2)
# initial m.σ is 1
# initial m.μ is 0
y = evalwgrad(m, x)
@test isapprox(y, [-1.22474 0 1.22474; -1.22474 0 1.22474], atol = 1.0e-5)
# julia> x
# 2×3 Array{Float64,2}:
# 1.0 3.0 5.0
# 2.0 4.0 6.0
#
# μ of batch will be
# (1. + 3. + 5.) / 3 = 3
# (2. + 4. + 6.) / 3 = 4
#
# ∴ update rule with momentum:
# .1 * 3 + 0 = .3
# .1 * 4 + 0 = .4
@test m.μ ≈ reshape([0.3, 0.4], 2, 1)
# julia> .1 .* var(x, dims = 2, corrected=false) .* (3 / 2).+ .9 .* [1., 1.]
# 2×1 Array{Float64,2}:
# 1.3
# 1.3
@test m.σ² ≈ .1 .* var(x, dims = 2, corrected=false) .* (3 / 2).+ .9 .* [1., 1.]
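# Outside of a gradient context BatchNorm falls back to the accumulated
# running statistics, so x[1] = 1 is normalised with μ = 0.3 and σ² = 1.3.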
x = m(x)
@test isapprox(x[1], (1 .- 0.3) / sqrt(1.3), atol = 1.0e-5)
end
# with activation function
let m = BatchNorm(2, sigmoid), x = [1.0 3.0 5.0;
                                    2.0 4.0 6.0]
y = m(x)
@test isapprox(y, sigmoid.((x .- m.μ) ./ sqrt.(m.σ² .+ m.ϵ)), atol = 1.0e-7)
end
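# For 3-D, 4-D and 5-D inputs, applying BatchNorm directly should match
# flattening the data to (channels, everything else) and normalising there.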
let m = trainmode!(BatchNorm(2)), x = reshape(Float32.(1:6), 3, 2, 1)
y = reshape(permutedims(x, [2, 1, 3]), 2, :)
y = permutedims(reshape(m(y), 2, 3, 1), [2, 1, 3])
@test m(x) == y
end
let m = trainmode!(BatchNorm(2)), x = reshape(Float32.(1:12), 2, 3, 2, 1)
y = reshape(permutedims(x, [3, 1, 2, 4]), 2, :)
y = permutedims(reshape(m(y), 2, 2, 3, 1), [2, 3, 1, 4])
@test m(x) == y
end
let m = trainmode!(BatchNorm(2)), x = reshape(Float32.(1:24), 2, 2, 3, 2, 1)
y = reshape(permutedims(x, [4, 1, 2, 3, 5]), 2, :)
y = permutedims(reshape(m(y), 2, 2, 2, 3, 1), [2, 3, 4, 1, 5])
@test m(x) == y
end
let m = BatchNorm(32), x = randn(Float32, 416, 416, 32, 1);
m(x)
@test (@allocated m(x)) < 100_000_000
end
end
@testset "InstanceNorm" begin
# helper functions
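# expand_inst tiles per-channel statistics (length C) into an array of shape
# `as` (here (1, C, N)) so they broadcast element-wise against the input.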
expand_inst = (x, as) -> reshape(repeat(x, outer=[1, as[length(as)]]), as...)
# begin tests
let m = InstanceNorm(2), sizes = (3, 2, 2),
x = reshape(collect(1:prod(sizes)), sizes)
@test length(params(m)) == 2
x = Float64.(x)
@test m.β == [0, 0] # initβ(2)
@test m.γ == [1, 1] # initγ(2)
y = evalwgrad(m, x)
#julia> x
#[:, :, 1] =
# 1.0 4.0
# 2.0 5.0
# 3.0 6.0
#
#[:, :, 2] =
# 7.0 10.0
# 8.0 11.0
# 9.0 12.0
#
# μ will be
# (1. + 2. + 3.) / 3 = 2.
# (4. + 5. + 6.) / 3 = 5.
#
# (7. + 8. + 9.) / 3 = 8.
# (10. + 11. + 12.) / 3 = 11.
#
# ∴ update rule with momentum:
# (1. - .1) * 0 + .1 * (2. + 8.) / 2 = .5
# (1. - .1) * 0 + .1 * (5. + 11.) / 2 = .8
@test m.μ ≈ [0.5, 0.8]
# momentum * var * num_items / (num_items - 1) + (1 - momentum) * sigma_sq
# julia> reshape(mean(.1 .* var(x, dims = 1, corrected=false) .* (3 / 2), dims=3), :) .+ .9 .* 1.
# 2-element Array{Float64,1}:
# 1.
# 1.
@test m.σ² ≈ reshape(mean(.1 .* var(x, dims = 1, corrected=false) .* (3 / 2), dims=3), :) .+ .9 .* 1.
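# As with BatchNorm, a plain forward call uses the running statistics.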
x = m(x)
@test isapprox(x[1], (1 - 0.5) / sqrt(1. + 1f-5), atol = 1.0e-5)
end
# with activation function
let m = InstanceNorm(2, sigmoid), sizes = (3, 2, 2),
x = reshape(collect(1:prod(sizes)), sizes)
x = Float64.(x)
affine_shape = collect(sizes)
affine_shape[1] = 1
y = m(x)
@test isapprox(y, sigmoid.((x .- expand_inst(m.μ, affine_shape)) ./ sqrt.(expand_inst(m.σ², affine_shape) .+ m.ϵ)), atol = 1.0e-7)
end
let m = trainmode!(InstanceNorm(2)), sizes = (2, 4, 1, 2, 3),
x = Float32.(reshape(collect(1:prod(sizes)), sizes))
y = reshape(permutedims(x, [3, 1, 2, 4, 5]), :, 2, 3)
y = reshape(m(y), sizes...)
@test m(x) == y
end
# check that μ, σ², and the output are the correct size for higher rank tensors
let m = InstanceNorm(2), sizes = (5, 5, 3, 4, 2, 6),
x = reshape(Float32.(collect(1:prod(sizes))), sizes)
y = evalwgrad(m, x)
@test size(m.μ) == (sizes[end - 1], )
@test size(m.σ²) == (sizes[end - 1], )
@test size(y) == sizes
end
# show that instance norm is equal to batch norm when channel and batch dims are squashed
let m_inorm = trainmode!(InstanceNorm(2)), m_bnorm = trainmode!(BatchNorm(12)), sizes = (5, 5, 3, 4, 2, 6),
x = reshape(Float32.(collect(1:prod(sizes))), sizes)
@test m_inorm(x) == reshape(m_bnorm(reshape(x, (sizes[1:end - 2]..., :, 1))), sizes)
end
let m = InstanceNorm(32), x = randn(Float32, 416, 416, 32, 1);
m(x)
@test (@allocated m(x)) < 100_000_000
end
end
if VERSION >= v"1.1"
@testset "GroupNorm" begin
# begin tests
squeeze(x) = dropdims(x, dims = tuple(findall(size(x) .== 1)...)) # To remove all singular dimensions
let m = GroupNorm(4,2), sizes = (3,4,2),
x = reshape(collect(1:prod(sizes)), sizes)
@test length(params(m)) == 2
x = Float64.(x)
@test m.β == [0, 0, 0, 0] # initβ(4)
@test m.γ == [1, 1, 1, 1] # initγ(4)
y = evalwgrad(m, x)
#julia> x
#[:, :, 1] =
# 1.0 4.0 7.0 10.0
# 2.0 5.0 8.0 11.0
# 3.0 6.0 9.0 12.0
#
#[:, :, 2] =
# 13.0 16.0 19.0 22.0
# 14.0 17.0 20.0 23.0
# 15.0 18.0 21.0 24.0
#
# μ will be
# (1. + 2. + 3. + 4. + 5. + 6.) / 6 = 3.5
# (7. + 8. + 9. + 10. + 11. + 12.) / 6 = 9.5
#
# (13. + 14. + 15. + 16. + 17. + 18.) / 6 = 15.5
# (19. + 20. + 21. + 22. + 23. + 24.) / 6 = 21.5
#
# μ =
# 3.5 15.5
# 9.5 21.5
#
# ∴ update rule with momentum:
# (1. - .1) * 0 + .1 * (3.5 + 15.5) / 2 = 0.95
# (1. - .1) * 0 + .1 * (9.5 + 21.5) / 2 = 1.55
@test m.μ ≈ [0.95, 1.55]
# julia> mean(var(reshape(x,3,2,2,2),dims=(1,2)).* .1,dims=2) .+ .9*1.
# 2-element Array{Float64,1}:
# 1.25
# 1.25
@test m.σ² ≈ mean(squeeze(var(reshape(x,3,2,2,2),dims=(1,2))).*.1,dims=2) .+ .9*1.
x = m(x)
@test isapprox(x[1], (1 - 0.95) / sqrt(1.25 + 1f-5), atol = 1.0e-5)
end
# with activation function
let m = GroupNorm(4,2, sigmoid), sizes = (3, 4, 2),
x = reshape(collect(1:prod(sizes)), sizes)
x = Float64.(x)
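# Reshape x to (width, channels per group, groups, batch) so the per-group
# statistics stored in m.μ and m.σ² can be broadcast over it below.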
μ_affine_shape = ones(Int,length(sizes) + 1)
μ_affine_shape[end-1] = 2 # Number of groups
affine_shape = ones(Int,length(sizes) + 1)
affine_shape[end-2] = 2 # Channels per group
affine_shape[end-1] = 2 # Number of groups
affine_shape[1] = sizes[1]
affine_shape[end] = sizes[end]
og_shape = size(x)
y = m(x)
x_ = reshape(x,affine_shape...)
out = reshape(sigmoid.((x_ .- reshape(m.μ,μ_affine_shape...)) ./ sqrt.(reshape(m.σ²,μ_affine_shape...) .+ m.ϵ)),og_shape)
@test isapprox(y, out, atol = 1.0e-7)
end
let m = trainmode!(GroupNorm(2,2)), sizes = (2, 4, 1, 2, 3),
x = Float32.(reshape(collect(1:prod(sizes)), sizes))
y = reshape(permutedims(x, [3, 1, 2, 4, 5]), :, 2, 3)
y = reshape(m(y), sizes...)
@test m(x) == y
end
# check that μ, σ², and the output are the correct size for higher rank tensors
let m = GroupNorm(4,2), sizes = (5, 5, 3, 4, 4, 6),
x = Float32.(reshape(collect(1:prod(sizes)), sizes))
y = evalwgrad(m, x)
@test size(m.μ) == (m.G,1)
@test size(m.σ²) == (m.G,1)
@test size(y) == sizes
end
# show that group norm is the same as instance norm when the group size is the same as the number of channels
let IN = trainmode!(InstanceNorm(4)), GN = trainmode!(GroupNorm(4,4)), sizes = (2,2,3,4,5),
x = Float32.(reshape(collect(1:prod(sizes)), sizes))
@test IN(x) ≈ GN(x)
end
# show that group norm is the same as batch norm for a group of size 1 and batch of size 1
let BN = trainmode!(BatchNorm(4)), GN = trainmode!(GroupNorm(4,4)), sizes = (2,2,3,4,1),
x = Float32.(reshape(collect(1:prod(sizes)), sizes))
@test BN(x) ≈ GN(x)
end
end
end