We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ec6b435 commit 7cd4e29 - Copy full SHA for 7cd4e29
third_party/amd/lib/TritonAMDGPUToLLVM/ElementwiseOpToLLVM.cpp
@@ -1904,7 +1904,8 @@ struct FpToFpOpConversion
1904
(llvm::isa<Float16Type>(srcElementType)) ||
1905
(llvm::isa<BFloat16Type>(srcElementType))) &&
1906
((llvm::isa<Float8E4M3FNType>(dstElementType)) ||
1907
- (llvm::isa<Float8E5M2Type>(dstElementType)))) {
+ (llvm::isa<Float8E5M2Type>(dstElementType))) &&
1908
+ ((roundingMode.has_value()) && (*roundingMode != RoundingMode::RTZ))) {
1909
numElements = 8;
1910
useFP16IntermediateSrc = false;
1911
}
0 commit comments