Skip to content

Commit a8e33c5

Browse files
committed
Testing block_size=16 for AMDGPU
1 parent 3c19fd5 commit a8e33c5

File tree

3 files changed

+2
-4
lines changed

3 files changed

+2
-4
lines changed

README.md

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -139,8 +139,6 @@ Julia v1.11
139 139

140 140
[Metal](https://github.com/JuliaGPU/Metal.jl)
141 141

142 -
[Known Issue with `accumulate` Only](https://github.com/JuliaGPU/AcceleratedKernels.jl/issues/10)
143 -
144 142
</td>
145 143
<td>
146 144

prototype/accumulate_benchmark.jl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@ Random.seed!(0)
7 7

8 8

9 9
function akacc(v)
10 -
va = AK.accumulate(+, v, init=zero(eltype(v)), block_size=512)
10 +
va = AK.accumulate(+, v, init=zero(eltype(v)), block_size=1024)
11 11
Metal.synchronize()
12 12
va
13 13
end

test/runtests.jl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1064,7 +1064,7 @@ end
1064 1064
num_elems = rand(1:100_000)
1065 1065
x = array_from_host(rand(1:1000, num_elems), Int32)
1066 1066
y = copy(x)
1067 -
AK.accumulate!(+, y; init=0, block_size=8)
1067 +
AK.accumulate!(+, y; init=0, block_size=16)
1068 1068
@test all(Array(y) .== accumulate(+, Array(x)))
1069 1069
end
1070 1070

0 commit comments

Comments
 (0)