JuliaGPU
diff --git a/src/GPUArrays.jl b/src/GPUArrays.jl
Lines changed: 4 additions & 8 deletions
diff --git a/src/abstractarray.jl b/src/abstractarray.jl
Lines changed: 17 additions & 8 deletions
diff --git a/src/array.jl b/src/array.jl
Lines changed: 15 additions & 33 deletions
diff --git a/src/base.jl b/src/base.jl
Lines changed: 14 additions & 17 deletions
diff --git a/src/construction.jl b/src/construction.jl
Lines changed: 14 additions & 17 deletions
diff --git a/src/linalg.jl b/src/linalg.jl
Lines changed: 2 additions & 2 deletions
diff --git a/src/random.jl b/src/random.jl
Lines changed: 8 additions & 8 deletions
@@ -1,18 +1,18 @@
 module GPUArrays
 
+export GPUArray, gpu_call, thread_blocks_heuristic, global_size, synchronize_threads
+export linear_index, @linearidx, @cartesianidx, convolution!, device, synchronize
+export JLArray
+
 using Serialization
 using Random
 using LinearAlgebra
 using Printf
 
-import Random: rand, rand!
 using LinearAlgebra.BLAS
-import Base: pointer, similar, size, convert
-using Base: @propagate_inbounds, @pure, RefValue
 using Base.Cartesian
 
 using FFTW
-import FFTW: *, plan_ifft!, plan_fft!, plan_fft, plan_ifft, size, plan_bfft, plan_bfft!
 
 include("abstractarray.jl")
 include("abstract_gpu_interface.jl")
@@ -34,8 +34,4 @@ include("array.jl")
 
 include("testsuite.jl")
 
-export GPUArray, gpu_call, thread_blocks_heuristic, global_size, synchronize_threads
-export linear_index, @linearidx, @cartesianidx, convolution!, device, synchronize
-export JLArray
-
 end # module
@@ -1,5 +1,3 @@
-import Base: similar, convert, _reshape, map!, copyto!, map, copy, deepcopy
-
 # Dense GPU Array
 abstract type GPUArray{T, N} <: DenseArray{T, N} end
 
@@ -16,8 +14,11 @@ struct LocalMemory{T} <: GPUArray{T, 1}
     LocalMemory{T}(x::Integer) where T = new{T}(x)
 end
 
-############################################
-# serialization
+
+# input/output
+
+## serialization
+
 import Serialization: AbstractSerializer, serialize, deserialize, serialize_type
 
 function serialize(s::AbstractSerializer, t::T) where T <: GPUArray
@@ -53,6 +54,14 @@ function to_cartesian(A, indices::Tuple)
     CartesianIndices(start, stop)
 end
 
+## showing
+
+Base.print_array(io::IO, x::GPUArray) = Base.print_array(io, collect(x))
+Base.print_array(io::IO, x::LinearAlgebra.Adjoint{<:Any,<:GPUArray}) = Base.print_array(io, LinearAlgebra.adjoint(collect(x.parent)))
+Base.print_array(io::IO, x::LinearAlgebra.Transpose{<:Any,<:GPUArray}) = Base.print_array(io, LinearAlgebra.transpose(collect(x.parent)))
+
+
+# memory operations
 
 ## basic copy methods that dispatch to unsafe_copyto! for linear copies
 
@@ -161,8 +170,8 @@ function Base.copyto!(
     dest
 end
 
-copy(x::GPUArray) = identity.(x)
-deepcopy(x::GPUArray) = copy(x)
+Base.copy(x::GPUArray) = identity.(x)
+Base.deepcopy(x::GPUArray) = copy(x)
 
 #=
 reinterpret taken from julia base/array.jl
@@ -211,13 +220,13 @@ function reinterpret(::Type{T}, a::GPUArray{S}, dims::NTuple{N, Integer}) where
     unsafe_reinterpret(T, a, dims)
 end
 
-function _reshape(A::GPUArray{T}, dims::Dims) where T
+function Base._reshape(A::GPUArray{T}, dims::Dims) where T
     n = length(A)
     prod(dims) == n || throw(DimensionMismatch("parent has $n elements, which is incompatible with size $dims"))
     return unsafe_reinterpret(T, A, dims)
 end
 # ambiguity fix: presumably a more specific method for vectors reshaped with a 1-tuple of dims
-function _reshape(A::GPUArray{T, 1}, dims::Tuple{Integer}) where T
+function Base._reshape(A::GPUArray{T, 1}, dims::Tuple{Integer}) where T
     n = Base._length(A)
     prod(dims) == n || throw(DimensionMismatch("parent has $n elements, which is incompatible with size $dims"))
     return unsafe_reinterpret(T, A, dims)
 
@@ -24,16 +24,11 @@ end
 
 ## getters
 
-size(x::JLArray) = x.size
+Base.size(x::JLArray) = x.size
 
-pointer(x::JLArray) = pointer(x.data)
+Base.pointer(x::JLArray) = pointer(x.data)
 
 
-## I/O
-Base.print_array(io::IO, x::GPUArray) = Base.print_array(io, collect(x))B
-Base.print_array(io::IO, x::LinearAlgebra.Adjoint{<:Any,<:GPUArray}) = Base.print_array(io, LinearAlgebra.adjoint(collect(x.parent)))
-Base.print_array(io::IO, x::LinearAlgebra.Transpose{<:Any,<:GPUArray}) = Base.print_array(io, LinearAlgebra.transpose(collect(x.parent)))
-
 ## other
 
 """
@@ -45,7 +40,7 @@ end
 
 to_device(state, x::JLArray) = x.data
 to_device(state, x::Tuple) = to_device.(Ref(state), x)
-to_device(state, x::RefValue{<: JLArray}) = RefValue(to_device(state, x[]))
+to_device(state, x::Base.RefValue{<: JLArray}) = Base.RefValue(to_device(state, x[]))
 to_device(state, x) = x
 # creates a `local` vector for each thread group
 to_device(state, x::LocalMemory{T}) where T = LocalMem(ntuple(i-> Vector{T}(x.size), blockdim_x(state)))
@@ -54,11 +49,10 @@ to_blocks(state, x) = x
 # unpacks local memory for each block
 to_blocks(state, x::LocalMem) = x.x[blockidx_x(state)]
 
-similar(::Type{<: JLArray}, ::Type{T}, size::Base.Dims{N}) where {T, N} = JLArray{T, N}(size)
+Base.similar(::Type{<: JLArray}, ::Type{T}, size::Base.Dims{N}) where {T, N} = JLArray{T, N}(size)
 
-function unsafe_reinterpret(::Type{T}, A::JLArray{ET}, size::NTuple{N, Integer}) where {T, ET, N}
-    JLArray(Array(reshape(reinterpret(T, A.data), size)), size)
-end
+unsafe_reinterpret(::Type{T}, A::JLArray, size::Tuple) where T =
+    reshape(reinterpret(T, A.data), size)
 
 function Base.unsafe_copyto!(dest::Array{T}, d_offset::Integer,
                              source::JLArray{T}, s_offset::Integer,
@@ -126,7 +120,6 @@ function AbstractDeviceArray(ptr::Array, shape::Vararg{Integer, N}) where N
     reshape(ptr, shape)
 end
 
-
 function _gpu_call(f, A::JLArray, args::Tuple, blocks_threads::Tuple{T, T}) where T <: NTuple{N, Integer} where N
     blocks, threads = blocks_threads
     idx = ntuple(i-> 1, length(blocks))
@@ -176,32 +169,21 @@ end
 blas_module(::JLArray) = LinearAlgebra.BLAS
 blasbuffer(A::JLArray) = A.data
 
-# defining our own plan type is the easiest way to pass around the plans in Base interface
+# defining our own plan type is the easiest way to pass around the plans in the FFTW interface
 # without ambiguities
 
 struct FFTPlan{T}
     p::T
 end
-function plan_fft(A::JLArray; kw_args...)
-    FFTPlan(plan_fft(A.data; kw_args...))
-end
-function plan_fft!(A::JLArray; kw_args...)
-    FFTPlan(plan_fft!(A.data; kw_args...))
-end
-function plan_bfft!(A::JLArray; kw_args...)
-    FFTPlan(plan_bfft!(A.data; kw_args...))
-end
-function plan_bfft(A::JLArray; kw_args...)
-    FFTPlan(plan_bfft(A.data; kw_args...))
-end
-function plan_ifft!(A::JLArray; kw_args...)
-    FFTPlan(plan_ifft!(A.data; kw_args...))
-end
-function plan_ifft(A::JLArray; kw_args...)
-    FFTPlan(plan_ifft(A.data; kw_args...))
-end
 
-function *(plan::FFTPlan, A::JLArray)
+FFTW.plan_fft(A::JLArray; kw_args...) = FFTPlan(plan_fft(A.data; kw_args...))
+FFTW.plan_fft!(A::JLArray; kw_args...) = FFTPlan(plan_fft!(A.data; kw_args...))
+FFTW.plan_bfft!(A::JLArray; kw_args...) = FFTPlan(plan_bfft!(A.data; kw_args...))
+FFTW.plan_bfft(A::JLArray; kw_args...) = FFTPlan(plan_bfft(A.data; kw_args...))
+FFTW.plan_ifft!(A::JLArray; kw_args...) = FFTPlan(plan_ifft!(A.data; kw_args...))
+FFTW.plan_ifft(A::JLArray; kw_args...) = FFTPlan(plan_ifft(A.data; kw_args...))
+
+function Base.:(*)(plan::FFTPlan, A::JLArray)
     x = plan.p * A.data
     JLArray(x)
 end
@@ -1,23 +1,20 @@
-import Base: count, map!, permutedims!, cat_t, vcat, hcat
-using Base: @pure
-
 allequal(x) = true
 allequal(x, y, z...) = x == y && allequal(y, z...)
-function map!(f, y::GPUArray, xs::GPUArray...)
+function Base.map!(f, y::GPUArray, xs::GPUArray...)
     @assert allequal(size.((y, xs...))...)
     return y .= f.(xs...)
 end
-function map(f, y::GPUArray, xs::GPUArray...)
+function Base.map(f, y::GPUArray, xs::GPUArray...)
     @assert allequal(size.((y, xs...))...)
     return f.(y, xs...)
 end
 
 # Break ambiguities with base
-map!(f, y::GPUArray) =
+Base.map!(f, y::GPUArray) =
     invoke(map!, Tuple{Any,GPUArray,Vararg{GPUArray}}, f, y)
-map!(f, y::GPUArray, x::GPUArray) =
+Base.map!(f, y::GPUArray, x::GPUArray) =
     invoke(map!, Tuple{Any,GPUArray, Vararg{GPUArray}}, f, y, x)
-map!(f, y::GPUArray, x1::GPUArray, x2::GPUArray) =
+Base.map!(f, y::GPUArray, x1::GPUArray, x2::GPUArray) =
     invoke(map!, Tuple{Any,GPUArray, Vararg{GPUArray}}, f, y, x1, x2)
 
 
@@ -49,36 +46,36 @@ map!(f, y::GPUArray, x1::GPUArray, x2::GPUArray) =
 #     return dest
 # end
 #
-# function cat_t(dims::Integer, T::Type, x::GPUArray, xs::GPUArray...)
+# function Base.cat_t(dims::Integer, T::Type, x::GPUArray, xs::GPUArray...)
 #     catdims = Base.dims2cat(dims)
 #     shape = Base.cat_shape(catdims, (), size.((x, xs...))...)
 #     dest = Base.cat_similar(x, T, shape)
 #     _cat(dims, dest, x, xs...)
 # end
 #
-# vcat(xs::GPUArray...) = cat(1, xs...)
-# hcat(xs::GPUArray...) = cat(2, xs...)
+# Base.vcat(xs::GPUArray...) = cat(1, xs...)
+# Base.hcat(xs::GPUArray...) = cat(2, xs...)
 
 
 # Base functions that are sadly not fit for the GPU yet (they only work for Int64)
-@pure @inline function gpu_ind2sub(A::AbstractArray, ind::T) where T
+Base.@pure @inline function gpu_ind2sub(A::AbstractArray, ind::T) where T
     _ind2sub(size(A), ind - T(1))
 end
-@pure @inline function gpu_ind2sub(dims::NTuple{N}, ind::T) where {N, T}
+Base.@pure @inline function gpu_ind2sub(dims::NTuple{N}, ind::T) where {N, T}
     _ind2sub(NTuple{N, T}(dims), ind - T(1))
 end
-@pure @inline _ind2sub(::Tuple{}, ind::T) where {T} = (ind + T(1),)
-@pure @inline function _ind2sub(indslast::NTuple{1}, ind::T) where T
+Base.@pure @inline _ind2sub(::Tuple{}, ind::T) where {T} = (ind + T(1),)
+Base.@pure @inline function _ind2sub(indslast::NTuple{1}, ind::T) where T
     ((ind + T(1)),)
 end
-@pure @inline function _ind2sub(inds, ind::T) where T
+Base.@pure @inline function _ind2sub(inds, ind::T) where T
     r1 = inds[1]
     indnext = div(ind, r1)
     f = T(1); l = r1
     (ind-l*indnext+f, _ind2sub(Base.tail(inds), indnext)...)
 end
 
-@pure function gpu_sub2ind(dims::NTuple{N}, I::NTuple{N2, T}) where {N, N2, T}
+Base.@pure function gpu_sub2ind(dims::NTuple{N}, I::NTuple{N2, T}) where {N, N2, T}
     Base.@_inline_meta
     _sub2ind(NTuple{N, T}(dims), T(1), T(1), I...)
 end
 
@@ -1,16 +1,12 @@
-import Base: fill!, similar, zeros, ones, fill
-
-
-
-function fill(X::Type{<: GPUArray}, val::T, dims::NTuple{N, Integer}) where {T, N}
+function Base.fill(X::Type{<: GPUArray}, val::T, dims::NTuple{N, Integer}) where {T, N}
     res = similar(X, T, dims)
     fill!(res, val)
 end
-function fill(X::Type{<: GPUArray{T}}, val, dims::NTuple{N, Integer}) where {T, N}
+function Base.fill(X::Type{<: GPUArray{T}}, val, dims::NTuple{N, Integer}) where {T, N}
     res = similar(X, T, dims)
     fill!(res, convert(T, val))
 end
-function fill!(A::GPUArray{T}, x) where T
+function Base.fill!(A::GPUArray{T}, x) where T
     gpu_call(A, (A, convert(T, x))) do state, a, val
         idx = @linearidx(a, state)
         @inbounds a[idx] = val
@@ -19,8 +15,8 @@ function fill!(A::GPUArray{T}, x) where T
     A
 end
 
-zeros(T::Type{<: GPUArray}, dims::NTuple{N, Integer}) where N = fill(T, zero(eltype(T)), dims)
-ones(T::Type{<: GPUArray}, dims::NTuple{N, Integer}) where N = fill(T, one(eltype(T)), dims)
+Base.zeros(T::Type{<: GPUArray}, dims::NTuple{N, Integer}) where N = fill(T, zero(eltype(T)), dims)
+Base.ones(T::Type{<: GPUArray}, dims::NTuple{N, Integer}) where N = fill(T, one(eltype(T)), dims)
 
 function uniformscaling_kernel(state, res::AbstractArray{T}, stride, s::UniformScaling) where T
     i = linear_index(state)
@@ -43,10 +39,10 @@ end
 (T::Type{<: GPUArray{X} where X})(dims::NTuple{N, Integer}) where N = similar(T, eltype(T), dims)
 (T::Type{<: GPUArray{X} where X})(::UndefInitializer, dims::NTuple{N, Integer}) where N = similar(T, eltype(T), dims)
 
-similar(x::X, ::Type{T}, size::Base.Dims{N}) where {X <: GPUArray, T, N} = similar(X, T, size)
-similar(::Type{X}, ::Type{T}, size::NTuple{N, Base.OneTo{Int}}) where {X <: GPUArray, T, N} = similar(X, T, length.(size))
+Base.similar(x::X, ::Type{T}, size::Base.Dims{N}) where {X <: GPUArray, T, N} = similar(X, T, size)
+Base.similar(::Type{X}, ::Type{T}, size::NTuple{N, Base.OneTo{Int}}) where {X <: GPUArray, T, N} = similar(X, T, length.(size))
 
-convert(AT::Type{<: GPUArray{T, N}}, A::GPUArray{T, N}) where {T, N} = A
+Base.convert(AT::Type{<: GPUArray{T, N}}, A::GPUArray{T, N}) where {T, N} = A
 
 function indexstyle(x::T) where T
     style = try
@@ -73,7 +69,7 @@ eltype_or(::Type{<: GPUArray}, or) = or
 eltype_or(::Type{<: GPUArray{T}}, or) where T = T
 eltype_or(::Type{<: GPUArray{T, N}}, or) where {T, N} = T
 
-function convert(AT::Type{<: GPUArray}, iter)
+function Base.convert(AT::Type{<: GPUArray}, iter)
     isize = Base.IteratorSize(iter)
     style = indexstyle(iter)
     ettrait = Base.IteratorEltype(iter)
@@ -87,17 +83,18 @@ function convert(AT::Type{<: GPUArray}, iter)
     end
 end
 
-function convert(AT::Type{<: GPUArray{T, N}}, A::DenseArray{T, N}) where {T, N}
+function Base.convert(AT::Type{<: GPUArray{T, N}}, A::DenseArray{T, N}) where {T, N}
     copyto!(AT(Base.size(A)), A)
 end
 
-function convert(AT::Type{<: GPUArray{T1}}, A::DenseArray{T2, N}) where {T1, T2, N}
+function Base.convert(AT::Type{<: GPUArray{T1}}, A::DenseArray{T2, N}) where {T1, T2, N}
     copyto!(similar(AT, T1, size(A)), convert(Array{T1, N}, A))
 end
-function convert(AT::Type{<: GPUArray}, A::DenseArray{T2, N}) where {T2, N}
+
+function Base.convert(AT::Type{<: GPUArray}, A::DenseArray{T2, N}) where {T2, N}
     copyto!(similar(AT, T2, size(A)), A)
 end
 
-function convert(AT::Type{Array{T, N}}, A::GPUArray{CT, CN}) where {T, N, CT, CN}
+function Base.convert(AT::Type{Array{T, N}}, A::GPUArray{CT, CN}) where {T, N, CT, CN}
     convert(AT, copyto!(Array{CT, CN}(undef, size(A)), A))
 end
@@ -90,9 +90,9 @@ function LinearAlgebra.permutedims!(dest::GPUArray, src::GPUArray, perm::NTuple{
 end
 
 
-function copyto!(A::AbstractArray, B::Adjoint{T, <: GPUArray}) where T
+function Base.copyto!(A::AbstractArray, B::Adjoint{T, <: GPUArray}) where T
     copyto!(A, Adjoint(Array(B.parent)))
 end
-function copyto!(A::GPUArray, B::Adjoint{T, <: GPUArray}) where T
+function Base.copyto!(A::GPUArray, B::Adjoint{T, <: GPUArray}) where T
     transpose!(A, B.parent)
 end
@@ -55,7 +55,7 @@ let rand_state_dict = Dict()
         end
     end
 end
-function rand!(A::GPUArray{T}) where T <: Number
+function Random.rand!(A::GPUArray{T}) where T <: Number
     rstates = cached_state(A)
     gpu_call(A, (rstates, A,)) do state, randstates, a
         idx = linear_index(state)
@@ -66,14 +66,14 @@ function rand!(A::GPUArray{T}) where T <: Number
     A
 end
 
-rand(X::Type{<: GPUArray}, i::Integer...) = rand(X, Float32, i...)
-rand(X::Type{<: GPUArray}, size::NTuple{N, Int}) where N = rand(X, Float32, size...)
-rand(X::Type{<: GPUArray{T}}, i::Integer...) where T = rand(X, T, i...)
-rand(X::Type{<: GPUArray{T}}, size::NTuple{N, Int}) where {T, N} = rand(X, T, size...)
-rand(X::Type{<: GPUArray{T, N}}, size::NTuple{N, Integer}) where {T, N} = rand(X, T, size...)
-rand(X::Type{<: GPUArray{T, N}}, size::NTuple{N, Int}) where {T, N} = rand(X, T, size...)
+Random.rand(X::Type{<: GPUArray}, i::Integer...) = rand(X, Float32, i...)
+Random.rand(X::Type{<: GPUArray}, size::NTuple{N, Int}) where N = rand(X, Float32, size...)
+Random.rand(X::Type{<: GPUArray{T}}, i::Integer...) where T = rand(X, T, i...)
+Random.rand(X::Type{<: GPUArray{T}}, size::NTuple{N, Int}) where {T, N} = rand(X, T, size...)
+Random.rand(X::Type{<: GPUArray{T, N}}, size::NTuple{N, Integer}) where {T, N} = rand(X, T, size...)
+Random.rand(X::Type{<: GPUArray{T, N}}, size::NTuple{N, Int}) where {T, N} = rand(X, T, size...)
 
-function rand(X::Type{<: GPUArray}, ::Type{ET}, size::Integer...) where ET
+function Random.rand(X::Type{<: GPUArray}, ::Type{ET}, size::Integer...) where ET
     A = similar(X, ET, size)
     rand!(A)
 end