Fix numerical errors in the tests

Avik Pal · Avik Pal · commit ee86fbb63168 · 2019-05-01T00:36:39.000+05:30
diff --git a/src/nnpack/NNPACK.jl b/src/nnpack/NNPACK.jl
@@ -35,7 +35,11 @@ Allows NNPACK to intelligently choose which threadpool to use for getting the be
 performance.
 """
 function allocate_threadpool()
-    for i in 1:Int(floor(log2(NNPACK_CPU_THREADS)))
+    # Cap the thread count at 8 and round it down to a power of two, so the stored value is
+    # itself one of the keys inserted below (`select_threadpool` indexes the dict with it).
+    global NNPACK_CPU_THREADS = NNPACK_CPU_THREADS > 8 ? UInt64(8) : UInt64(exp2(floor(log2(NNPACK_CPU_THREADS))))
+    # One pool per power of two, starting at 2^0 so a single-thread setup still gets key 1.
+    for i in 0:Int(log2(NNPACK_CPU_THREADS))
         threads = UInt64(2^i)
         push!(shared_threadpool_dict, threads => Ref(pthreadpool_create(threads)))
     end
diff --git a/src/nnpack/performance.jl b/src/nnpack/performance.jl
@@ -1,31 +1,31 @@
 function select_threadpool(cdims::DenseConvDims, batch_size::Int)
     inp_size = input_size(cdims)[1] 
     if batch_size >= 32
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # batch >= 32; NOTE(review): assumes this key was inserted by allocate_threadpool — confirm
     elseif batch_size >= 16 && inp_size >= 64
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # batch >= 16 and inp_size >= 64
     elseif inp_size <= 32
         return C_NULL
     elseif inp_size >= 128
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # inp_size >= 128 (inp_size <= 32 already returned C_NULL)
     elseif inp_size * batch_size >= 256
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # inp_size * batch_size >= 256; anything else falls through to C_NULL
     end    
     return C_NULL
 end
 
 function select_threadpool(pdims::PoolDims, batch_size::Int)
     inp_size = input_size(pdims)[1] 
     if batch_size >= 32
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # batch >= 32; NOTE(review): assumes this key was inserted by allocate_threadpool — confirm
     elseif batch_size >= 16 && inp_size >= 64
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # batch >= 16 and inp_size >= 64
     elseif inp_size <= 32
         return C_NULL
     elseif inp_size >= 128
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # inp_size >= 128 (inp_size <= 32 already returned C_NULL)
     elseif inp_size * batch_size >= 256
-        return shared_threadpool_dict[4][]
+        return shared_threadpool_dict[Int(NNPACK_CPU_THREADS)][]  # inp_size * batch_size >= 256; anything else falls through to C_NULL
     end    
     return C_NULL
 end
diff --git a/test/conv.jl b/test/conv.jl
@@ -278,27 +278,27 @@ conv_answer_dict = Dict(
                 @testset "$(conv)" begin
                     # First, your basic convolution with no parameters
                     cdims = DenseConvDims(x, w)
-                    @test ddims(conv(x, w, cdims)) == y_plain
+                    @test isapprox(ddims(conv(x, w, cdims)), y_plain, rtol = 1.0e-7)  # relative-tolerance comparison replaces exact ==
 
                     # Next, test convolution on views and alternate datatypes:
-                    @test ddims(conv(view(x, repeat([:], ndims(x))...), w, cdims)) == y_plain
-                    @test ddims(conv(Float32.(x), Float32.(w), cdims)) == Float32.(y_plain)
+                    @test isapprox(ddims(conv(view(x, repeat([:], ndims(x))...), w, cdims)), y_plain, rtol = 1.0e-7)
+                    @test isapprox(ddims(conv(Float32.(x), Float32.(w), cdims)), Float32.(y_plain), rtol = 1.0e-7)  # NOTE(review): rtol is below eps(Float32) ≈ 1.19e-7 — confirm this tolerance is intended
 
                     # Next, introduce stride:
                     cdims = DenseConvDims(x, w; stride=2)
-                    @test ddims(conv(x, w, cdims)) == y_stride
+                    @test isapprox(ddims(conv(x, w, cdims)), y_stride, rtol = 1.0e-7)
 
                     # Next, introduce dilation:
                     cdims = DenseConvDims(x, w; dilation=2)
-                    @test ddims(conv(x, w, cdims)) == y_dil
+                    @test isapprox(ddims(conv(x, w, cdims)), y_dil, rtol = 1.0e-7)
 
                     # Next, introduce padding:
                     cdims = DenseConvDims(x, w; padding=1)
-                    @test ddims(conv(x, w, cdims)) == y_pad
+                    @test isapprox(ddims(conv(x, w, cdims)), y_pad, rtol = 1.0e-7)
 
                     # Next, test crosscor/conv with a flipped kernel
                     cdims = DenseConvDims(x, w; flipkernel=true)
-                    @test ddims(conv(x, w, cdims)) == y_flip
+                    @test isapprox(ddims(conv(x, w, cdims)), y_flip, rtol = 1.0e-7)
                 end
             end
 
@@ -312,39 +312,39 @@ conv_answer_dict = Dict(
                     # First, your basic convolution with no parameters
                     cdims = DenseConvDims(x, w)
                     dy = NNlib.conv(x, w, cdims)
-                    @test ddims(∇conv_filter(x, dy, cdims)) == dw
-                    @test ddims(∇conv_data(dy, w,  cdims)) == dx
+                    @test isapprox(ddims(∇conv_filter(x, dy, cdims)), dw, rtol = 1.0e-7)  # relative-tolerance comparison replaces exact ==
+                    @test isapprox(ddims(∇conv_data(dy, w,  cdims)), dx, rtol = 1.0e-7)
 
                     # Next, test convolution on views and alternate datatypes:
-                    @test ddims(∇conv_filter(x, view(dy, repeat([:], ndims(dy))...), cdims)) == dw
-                    @test ddims(∇conv_data(view(dy, repeat([:], ndims(dy))...), w,   cdims)) == dx
+                    @test isapprox(ddims(∇conv_filter(x, view(dy, repeat([:], ndims(dy))...), cdims)), dw, rtol = 1.0e-7)
+                    @test isapprox(ddims(∇conv_data(view(dy, repeat([:], ndims(dy))...), w,   cdims)), dx, rtol = 1.0e-7)
 
-                    @test ddims(∇conv_filter(Float32.(x), Float32.(dy), cdims)) == dw
-                    @test ddims(∇conv_data(Float32.(dy),  Float32.(w),  cdims)) == dx
+                    @test isapprox(ddims(∇conv_filter(Float32.(x), Float32.(dy), cdims)), dw, rtol = 1.0e-7)  # NOTE(review): Float32 inputs; rtol is below eps(Float32) ≈ 1.19e-7 — confirm this tolerance is intended
+                    @test isapprox(ddims(∇conv_data(Float32.(dy),  Float32.(w),  cdims)), dx, rtol = 1.0e-7)  # NOTE(review): same Float32 tolerance concern as the line above
 
                     # Next, introduce stride:
                     cdims = DenseConvDims(x, w; stride=2)
                     dy = NNlib.conv(x, w, cdims)
-                    @test ddims(∇conv_filter(x, dy, cdims)) == dw_stride
-                    @test ddims(∇conv_data(dy, w,  cdims)) == dx_stride
+                    @test isapprox(ddims(∇conv_filter(x, dy, cdims)), dw_stride, rtol = 1.0e-7)
+                    @test isapprox(ddims(∇conv_data(dy, w,  cdims)), dx_stride, rtol = 1.0e-7)
 
                     # Next, introduce dilation:
                     cdims = DenseConvDims(x, w; dilation=2)
                     dy = NNlib.conv(x, w, cdims)
-                    @test ddims(∇conv_filter(x, dy, cdims)) == dw_dil
-                    @test ddims(∇conv_data(dy, w,  cdims)) == dx_dil
+                    @test isapprox(ddims(∇conv_filter(x, dy, cdims)), dw_dil, rtol = 1.0e-7)
+                    @test isapprox(ddims(∇conv_data(dy, w,  cdims)), dx_dil, rtol = 1.0e-7)
 
                     # Next, introduce padding:
                     cdims = DenseConvDims(x, w; padding=1)
                     dy = NNlib.conv(x, w, cdims)
-                    @test ddims(∇conv_filter(x, dy, cdims)) == dw_pad
-                    @test ddims(∇conv_data(dy, w,  cdims)) == dx_pad
+                    @test isapprox(ddims(∇conv_filter(x, dy, cdims)), dw_pad, rtol = 1.0e-7)
+                    @test isapprox(ddims(∇conv_data(dy, w,  cdims)), dx_pad, rtol = 1.0e-7)
 
                     # Next, test crosscor/conv with a flipped kernel
                     cdims = DenseConvDims(x, w; flipkernel=true)
                     dy = NNlib.conv(x, w, cdims)
-                    @test ddims(∇conv_filter(x, dy, cdims)) == dw_flip
-                    @test ddims(∇conv_data(dy, w,  cdims)) == dx_flip
+                    @test isapprox(ddims(∇conv_filter(x, dy, cdims)), dw_flip, rtol = 1.0e-7)
+                    @test isapprox(ddims(∇conv_data(dy, w,  cdims)), dx_flip, rtol = 1.0e-7)
                 end
             end
         end
@@ -481,24 +481,24 @@ end
                     @test ddims(conv(x, w, cdims)) == y_plain
 
                     # Next, test convolution on views and alternate datatypes:
-                    @test ddims(conv(view(x, repeat([:], ndims(x))...), w, cdims)) == y_plain
-                    @test ddims(conv(Float32.(x), Float32.(w), cdims)) == Float32.(y_plain)
+                    @test isapprox(ddims(conv(view(x, repeat([:], ndims(x))...), w, cdims)), y_plain, rtol = 1.0e-7)  # NOTE(review): the plain check a few lines up still uses exact == — confirm that is intended
+                    @test isapprox(ddims(conv(Float32.(x), Float32.(w), cdims)), Float32.(y_plain), rtol = 1.0e-7)  # NOTE(review): rtol is below eps(Float32) ≈ 1.19e-7 — confirm this tolerance is intended
 
                     # Next, introduce stride:
                     cdims = DepthwiseConvDims(x, w; stride=2)
-                    @test ddims(conv(x, w, cdims)) == y_stride
+                    @test isapprox(ddims(conv(x, w, cdims)), y_stride, rtol = 1.0e-7)
 
                     # Next, introduce dilation:
                     cdims = DepthwiseConvDims(x, w; dilation=2)
-                    @test ddims(conv(x, w, cdims)) == y_dil
+                    @test isapprox(ddims(conv(x, w, cdims)), y_dil, rtol = 1.0e-7)
 
                     # Next, introduce padding:
                     cdims = DepthwiseConvDims(x, w; padding=1)
-                    @test ddims(conv(x, w, cdims)) == y_pad
+                    @test isapprox(ddims(conv(x, w, cdims)), y_pad, rtol = 1.0e-7)
 
                     # Next, test crosscor/conv with a flipped kernel
                     cdims = DepthwiseConvDims(x, w; flipkernel=true)
-                    @test ddims(conv(x, w, cdims)) == y_flip
+                    @test isapprox(ddims(conv(x, w, cdims)), y_flip, rtol = 1.0e-7)
                 end
             end