Merge pull request #45 from tejank10/dilation

MikeInnes · web-flow · commit 1ed81ee256e9 · 2018-05-31T13:58:47.000+01:00
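Fixed NaN error in dilation: the im2col buffer and kernel extents are now taken from size(w) instead of dilation_dims(w, dilation), the dil_w/dil_h parameter order of col2im_2d! is swapped, and repeated-call NaN tests are added for the dilated forward and backward passes.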
diff --git a/src/impl/conv.jl b/src/impl/conv.jl
@@ -44,7 +44,7 @@ end
 
 function col2im_2d!{T}(col::AbstractArray{T,2}, img::AbstractArray{T,3}, width::Int, height::Int,
   channels::Int, kernel_w::Int, kernel_h::Int, pad_w::Int, pad_h::Int, stride_w::Int,
-  stride_h::Int, dil_h::Int, dil_w::Int, mode::Int)
+  stride_h::Int, dil_w::Int, dil_h::Int, mode::Int)
 
   height_col = div(height + 2pad_h - (kernel_h - 1) * dil_h - 1, stride_h) + 1
   width_col = div(width + 2pad_w - (kernel_w - 1) * dil_w - 1, stride_w) + 1
@@ -159,26 +159,25 @@ function dilation_dims(w, dilation = 1)
   end
 end
 
-function im2col_dims(w,y,dilation=1)
+function im2col_dims(w,y)
     N = ndims(y)
-    dil = dilation_dims(w, dilation)
     r,c = 1,1
     for i=1:N-2
         r *= size(y,i)
-        c *= dil[i]
+        c *= size(w,i)
     end
-    c *= dil[N-1]
+    c *= size(w,N-1)
     return (r, c)
 end
 
 function conv2d!{T}(y::AbstractArray{T,4}, x::AbstractArray{T,4}, w::AbstractArray{T,4};
                   padding=0, stride=1, dilation=1, mode=0, alpha=T(1))
     if mode != 0 && mode != 1; throw(ArgumentError("conv2d only supports mode=0 or 1.")); end
     Wx,Hx,Cx,Nx = size(x)
-    Ww,Hw,C1,C2 = dilation_dims(w, dilation)
+    Ww,Hw,C1,C2 = size(w)
     if Cx!=C1; throw(DimensionMismatch()); end
     Wy,Hy,Cy,Ny = size(y)
-    x2dims = im2col_dims(w,y,dilation)
+    x2dims = im2col_dims(w,y)
     x2 = similar(x, x2dims)
     (p1,p2) = psize(padding,x)
     (s1,s2) = psize(stride,x)
@@ -197,11 +196,11 @@ function conv2d_grad_w!{T}(dw::AbstractArray{T,4}, x::AbstractArray{T,4}, w::Abs
                    padding=0, stride=1, dilation=1, mode=0, alpha=1)
     # dw = x'*dy
     Wx,Hx,Cx,Nx = size(x)
-    Ww,Hw,C1,C2 = dilation_dims(w, dilation)
+    Ww,Hw,C1,C2 = size(w)
     Wy,Hy,Cy,Ny = size(dy)
     # if mode != 0 && mode != 1; throw(ArgumentError("conv2d only supports mode=0 or 1.")); end
     # @assert Cx==C1 && Cy==C2 && Ny==Nx
-    x2dims = im2col_dims(w,dy,dilation)
+    x2dims = im2col_dims(w,dy)
     x2 = similar(x, x2dims)
     # op(A) is an m-by-k matrix, op(B) is a k-by-n matrix, C is an m-by-n matrix.
     Y,M,N,K = Wy*Hy*Cy,Ww*Hw*Cx,Cy,Wy*Hy
@@ -222,11 +221,11 @@ function conv2d_grad_x!{T}(dx::AbstractArray{T,4}, x::AbstractArray{T,4}, w::Abs
                    padding=0, stride=1, dilation=1, mode=0, alpha=1)
     # dx = dy*w'
     Wx,Hx,Cx,Nx = size(x)
-    Ww,Hw,C1,C2 = dilation_dims(w, dilation)
+    Ww,Hw,C1,C2 = size(w)
     Wy,Hy,Cy,Ny = size(dy)
     # if mode != 0 && mode != 1; throw(ArgumentError("conv2d only supports mode=0 or 1.")); end
     @assert Cx==C1 && Cy==C2 && Ny==Nx
-    x2dims = im2col_dims(w,dy,dilation)
+    x2dims = im2col_dims(w,dy)
     x2 = similar(x, x2dims)
     # op(A) is an m-by-k matrix, op(B) is a k-by-n matrix, C is an m-by-n matrix.
     Y,M,N,K = Wy*Hy*Cy,Wy*Hy,Ww*Hw*Cx,Cy
@@ -266,11 +265,11 @@ function conv3d!{T}(y::AbstractArray{T,5}, x::AbstractArray{T,5}, w::AbstractArr
                   padding=0, stride=1, dilation = 1, mode=0, alpha=T(1))
     if mode != 0 && mode != 1; throw(ArgumentError("conv3d only supports mode=0 or 1.")); end
     Wx,Hx,Dx,Cx,Nx = size(x)
-    Ww,Hw,Dw,C1,C2 = dilation_dims(w, dilation)
+    Ww,Hw,Dw,C1,C2 = size(w)
     if Cx!=C1; throw(DimensionMismatch()); end
     Wy,Hy,Dy,Cy,Ny = size(y)
     # @assert Cy==C2 && Ny==Nx
-    x2dims = im2col_dims(w,y,dilation)
+    x2dims = im2col_dims(w,y)
     x2 = similar(x, x2dims)
     (p1,p2,p3) = psize(padding,x)
     (s1,s2,s3) = psize(stride,x)
@@ -290,11 +289,11 @@ function conv3d_grad_w!{T}(dw::AbstractArray{T,5}, x::AbstractArray{T,5}, w::Abs
                    padding=0, stride=1, dilation = 1, mode=0, alpha=1)
     # dw = x'*dy
     Wx,Hx,Dx,Cx,Nx = size(x)
-    Ww,Hw,Dw,C1,C2 = dilation_dims(w, dilation)
+    Ww,Hw,Dw,C1,C2 = size(w)
     Wy,Hy,Dy,Cy,Ny = size(dy)
     # if mode != 0 && mode != 1; throw(ArgumentError("conv2d only supports mode=0 or 1.")); end
     # @assert Cx==C1 && Cy==C2 && Ny==Nx
-    x2dims = im2col_dims(w,dy,dilation)
+    x2dims = im2col_dims(w,dy)
     x2 = similar(x, x2dims)
     # op(A) is an m-by-k matrix, op(B) is a k-by-n matrix, C is an m-by-n matrix.
     Y,M,N,K = Wy*Hy*Dy*Cy,Ww*Hw*Dw*Cx,Cy,Wy*Hy*Dy
@@ -315,11 +314,11 @@ function conv3d_grad_x!{T}(dx::AbstractArray{T,5}, x::AbstractArray{T,5}, w::Abs
                    padding=0, stride=1, dilation = 1, mode=0, alpha=1)
     # dx = dy*w'
     Wx,Hx,Dx,Cx,Nx = size(x)
-    Ww,Hw,Dw,C1,C2 = dilation_dims(w, dilation)
+    Ww,Hw,Dw,C1,C2 = size(w)
     Wy,Hy,Dy,Cy,Ny = size(dy)
     # if mode != 0 && mode != 1; throw(ArgumentError("conv2d only supports mode=0 or 1.")); end
     @assert Cx==C1 && Cy==C2 && Ny==Nx
-    x2dims = im2col_dims(w,dy,dilation)
+    x2dims = im2col_dims(w,dy)
     x2 = similar(x, x2dims)
     # op(A) is an m-by-k matrix, op(B) is a k-by-n matrix, C is an m-by-n matrix.
     Y,M,N,K = Wy*Hy*Dy*Cy,Wy*Hy*Dy,Ww*Hw*Dw*Cx,Cy
diff --git a/test/conv.jl b/test/conv.jl
@@ -27,6 +27,15 @@ using NNlib: conv, ∇conv_filter, ∇conv_data, ∇maxpool, maxpool
         48 98;
         58 108;
         68 118.]
+
+	# NaN tests for dilation forward pass
+
+	ys = []
+	for idx in 1:1000 		
+    	push!(ys, conv(x, w; dilation=2))
+	end
+	@test !any([any(isnan.(ys[idx])) for idx in 1:1000])
+
     # for gradients, check only size
     # correctness of gradients is cross-checked with CUDNN.jl
     # (it's assumed convolution code won't change often)
@@ -39,6 +48,23 @@ using NNlib: conv, ∇conv_filter, ∇conv_data, ∇maxpool, maxpool
     @test size(y) == (3, 2, 1, 1)
     @test size(∇conv_filter(y, x, w; stride=2, pad=1, dilation=2)) == size(w)
     @test size(∇conv_data(y, x, w; stride=2, pad=1, dilation=2)) == size(x)
+
+	# NaN tests for dilation backward pass: filters
+	dy = randn(size(ys[1]))
+	dws = []
+	for idx in 1:1000
+	    push!(dws, ∇conv_filter(dy, x, w; dilation=2))
+	end
+
+	# NaN tests for dilation backward pass: input
+	dxs = []
+	for idx in 1:1000
+	    push!(dxs, ∇conv_data(dy, x, w; dilation=2))
+	end
+
+	@test !any([any(isnan.(dws[idx])) for idx in 1:1000])
+	@test !any([any(isnan.(dxs[idx])) for idx in 1:1000])
+
 end
 
 
@@ -123,13 +149,37 @@ end
         680 860.
     ]
 
+	# NaN tests for dilation forward pass
+
+	ys = []
+	for idx in 1:1000 		
+    	push!(ys, conv(x, w; dilation=2))
+	end
+	@test !any([any(isnan.(ys[idx])) for idx in 1:1000])
+
     # for gradients, check only size
     # correctness of gradients is cross-checked with CUDNN.jl
     # (it's assumed convolution code won't change often)
 
     @test size(∇conv_filter(reshape(rand(4,3,2), 4, 3, 2, 1, 1), x, w)) == size(w)
     @test size(∇conv_data(reshape(rand(4,3,2), 4, 3, 2, 1, 1), x, w)) == size(x)
 
+	# NaN tests for dilation backward pass: filters
+	dy = randn(size(ys[1]))
+	dws = []
+	for idx in 1:1000
+	    push!(dws, ∇conv_filter(dy, x, w; dilation=2))
+	end
+
+	# NaN tests for dilation backward pass: input
+	dxs = []
+	for idx in 1:1000
+	    push!(dxs, ∇conv_data(dy, x, w; dilation=2))
+	end
+
+	@test !any([any(isnan.(dws[idx])) for idx in 1:1000])
+	@test !any([any(isnan.(dxs[idx])) for idx in 1:1000])
+
 end