From a43127f8811836a12ef82a72f767d6a71a7b8412 Mon Sep 17 00:00:00 2001
From: Simon
Date: Wed, 15 Aug 2018 12:16:12 +0200
Subject: [PATCH] fix copy_transpose!

---
 src/cuda/cudnn.jl | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/src/cuda/cudnn.jl b/src/cuda/cudnn.jl
index 585b948d..01a368c7 100644
--- a/src/cuda/cudnn.jl
+++ b/src/cuda/cudnn.jl
@@ -1,6 +1,8 @@
 using CuArrays.CUDNN: @check, libcudnn, cudnnStatus_t, libcudnn_handle,
   cudnnDataType, TensorDesc, FilterDesc
 
+using LinearAlgebra
+
 mutable struct DropoutDesc
   ptr::Ptr{Nothing}
   states::CuVector{UInt8}
@@ -244,14 +246,14 @@ import ..Tracker: TrackedArray
 using CUDAnative
 using CuArrays: @cuindex, cudims
 
-function copy_transpose!(dst::CuArray, src::CuArray)
+function LinearAlgebra.copy_transpose!(dst::CuArray, src::CuArray)
   function kernel(dst, src)
     I = @cuindex dst
     dst[I...] = src[reverse(I)...]
     return
   end
   blk, thr = cudims(dst)
-  @cuda (blk, thr) kernel(dst, src)
+  @cuda blocks=blk threads=thr kernel(dst, src)
   return dst
 end
 