# Flux.jl/test/cuda/layers.jl

# Test layers and data/model movements on and off the GPU,
# and check that taking gradients on the GPU does not throw.
# Most of the forward passes should be fine when applied to
# bitstype objects, but this gives higher coverage for our use-cases.

# generic movement tests
@testset "Basic GPU Movement" begin
  @test gradient(x -> sum(gpu(x)), rand(3,3)) isa Tuple
  @test gradient(x -> sum(cpu(x)), gpu(rand(3,3))) isa Tuple
end
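
# A minimal round-trip sketch (an addition, not part of the original suite):
# moving an array onto the GPU and back should reproduce it exactly, since
# `gpu`/`cpu` only transfer the data for a Float32 input.
@testset "CPU/GPU round trip (sketch)" begin
  x = rand(Float32, 3, 3)
  @test cpu(gpu(x)) == x
end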
# TODO: These layers are currently broken on the GPU:
# `AlphaDropout` throws a compilation error, while the
# rest hit scalar-indexing issues.
const BROKEN_LAYERS = [DepthwiseConv,
                       AlphaDropout,
                       InstanceNorm,
                       GroupNorm]
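
# A hedged sketch (an addition, not part of the original suite) of what
# "scalar indexing" means here: with scalar indexing disallowed, element-wise
# `getindex` on a `CuArray` throws instead of silently falling back to a slow
# CPU loop, which is how the layers above fail. This assumes
# `CuArrays.allowscalar` is available and that the disallowed path raises an
# `ErrorException`, as in the CuArrays versions these tests target.
@testset "Scalar indexing sketch" begin
  CuArrays.allowscalar(false)
  @test_throws ErrorException gpu(rand(3,3))[1, 1]
  CuArrays.allowscalar(true)  # restore the default for the rest of the suite
end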
function gradtest(name::String, layers::Vector, xs = nothing, args...)
  isnothing(xs) && error("Missing input to test the layers against.")
  @testset "$name GPU grad tests" begin
    for layer in layers
      @testset "$layer GPU grad test" begin
        l = gpu(layer(args...))
        xs = gpu(xs)
        ps = Flux.params(l)
        if any(x -> isa(l, x), BROKEN_LAYERS)
          @test_broken gradient(() -> sum(l(xs)), ps) isa Flux.Zygote.Grads
        else
          # Compute the gradients once and reuse them for both checks
          gs = gradient(() -> sum(l(xs)), ps)
          @test gs isa Flux.Zygote.Grads
          # Pooling layers have no trainable parameters, so only check
          # the parameter gradients when `ps` is non-empty
          if !isempty(ps)
            @test gs[first(ps)] isa Flux.CuArrays.CuArray
          end
        end
      end
    end
  end
end
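
# Usage note (added): `gradtest` is invoked below as
# gradtest(name, layers, input, layer_args...), and each constructor in
# `layers` is called as `layer(layer_args...)` before being moved to the GPU.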
# Shared input; the sizes repeat those used in the Conv and CrossCor tests
r = rand(Float32, 28, 28, 1, 1)

conv_layers = [Conv, ConvTranspose, CrossCor, DepthwiseConv]
gradtest("Conv", conv_layers, r, (2,2), 1=>3)

pooling_layers = [MaxPool, MeanPool]
gradtest("Pooling", pooling_layers, r, (2,2))

dropout_layers = [Dropout, AlphaDropout]
gradtest("Dropout", dropout_layers, r, 0.5f0)

norm_layers = [LayerNorm, BatchNorm]
gradtest("Normalising", norm_layers, rand(Float32, 28,28,3,1), 1)

instancenorm = [InstanceNorm]
gradtest("InstanceNorm", instancenorm, r, 1)

groupnorm = [GroupNorm]
gradtest("GroupNorm", groupnorm, rand(Float32, 28,28,3,1), 3, 1)
const stateless_layers = [Flux.mse,
                          Flux.crossentropy,
                          Flux.logitcrossentropy,
                          Flux.normalise]

const stateless_layers_broadcasted = [Flux.binarycrossentropy,
                                      Flux.logitbinarycrossentropy]

function stateless_gradtest(f, args...)
  @test gradient((args...) -> sum(f(args...)), args...)[1] isa CuArray
end

function stateless_gradtest_broadcasted(f, args...)
  @test gradient((args...) -> sum(f.(args...)), args...)[1] isa CuArray
end
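
# Usage note (added): `stateless_gradtest` suits functions like `Flux.mse`
# that accept whole arrays, while `stateless_gradtest_broadcasted` covers
# scalar functions such as `Flux.binarycrossentropy`, which must be broadcast
# over arrays, e.g.:
#
#   stateless_gradtest(Flux.mse, x, y)
#   stateless_gradtest_broadcasted(Flux.binarycrossentropy, x, y)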
@testset "Stateless GPU grad tests" begin
2019-12-05 12:44:04 +00:00
x = gpu(rand(3,3))
y = gpu(rand(3,3))
for layer in stateless_layers
if layer == Flux.normalise
stateless_gradtest(layer, x)
else
stateless_gradtest(layer, x, y)
end
end
for layer in stateless_layers_broadcasted
stateless_gradtest_broadcasted(layer, x, y)
end
2019-12-05 12:42:23 +00:00
end