Skip to content

Commit a86a55d

Browse files
committed
All operations using Float32
1 parent a4e8216 commit a86a55d

File tree

1 file changed

+10
-4
lines changed

1 file changed

+10
-4
lines changed

lib/mpsgraphs/matmul.jl

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -10,9 +10,9 @@ function _matmul!(c::MtlArray{Tc}, a::MtlArray{Tab}, b::MtlArray{Tab}, alpha::Nu
1010
placeB => MPSGraphTensorData(b)
1111
)
1212

13-
castA, castB = if Tc != Tab
14-
castTensor(graph, placeA, Tc, "castA"),
15-
castTensor(graph, placeB, Tc, "castB")
13+
castA, castB = if Tab != Float32
14+
castTensor(graph, placeA, Float32, "castA"),
15+
castTensor(graph, placeB, Float32, "castB")
1616
else
1717
placeA, placeB
1818
end
@@ -48,8 +48,14 @@ function _matmul!(c::MtlArray{Tc}, a::MtlArray{Tab}, b::MtlArray{Tab}, alpha::Nu
4848
additionWithPrimaryTensor(graph, afteralpha, betaC)
4949
end
5050

51+
castC = if Tc != Float32
52+
castTensor(graph, afterbeta, Tc, "castC")
53+
else
54+
afterbeta
55+
end
56+
5157
resultdict = Dict{MPSGraphTensor, MPSGraphTensorData}(
52-
afterbeta => outputTensorData
58+
castC => outputTensorData
5359
)
5460

5561
cmdbuf = MPSCommandBuffer(Metal.global_queue(device()))

0 commit comments

Comments
 (0)