-
Notifications
You must be signed in to change notification settings - Fork 15.2k
[Flang] Add -ffast-real-mod and direct code for MOD on REAL types #160660
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 12 commits
8f9868d
ecae88c
85b14eb
d32863a
d06a1ad
313abd0
2572cc0
7cc56df
ed68857
afc2063
3b392c8
6d5836c
5c8304d
52c48db
d7beb16
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -7009,8 +7009,31 @@ mlir::Value IntrinsicLibrary::genMergeBits(mlir::Type resultType, | |
| } | ||
|
|
||
| // MOD | ||
| // Emits inline code for MOD(a, p) on REAL operands, computed as | ||
| // a - convert(convert(a / p)) * p: the quotient is converted to a signed | ||
| // integer type with the same bit width as `a` and then back to the type of | ||
| // `a`. The divide, multiply and subtract all carry the `contract` fast-math | ||
| // flag. Returns the value produced by the final subtraction. | ||
| static mlir::Value genFastMod(fir::FirOpBuilder &builder, mlir::Location loc, | ||
| mlir::Value a, mlir::Value p) { | ||
| mlir::Type realTy = a.getType(); | ||
| mlir::Type signedIntTy = builder.getIntegerType( | ||
| realTy.getIntOrFloatBitWidth(), /*isSigned=*/true); | ||
| auto contractAttr = mlir::arith::FastMathFlagsAttr::get( | ||
| builder.getContext(), mlir::arith::FastMathFlags::contract); | ||
| // quotient = a / p | ||
| mlir::Value quotient = | ||
| mlir::arith::DivFOp::create(builder, loc, a, p, contractAttr); | ||
| // Round-trip the quotient through the signed integer type. | ||
| mlir::Value quotientAsInt = | ||
| builder.createConvert(loc, signedIntTy, quotient); | ||
| mlir::Value wholeQuotient = | ||
| builder.createConvert(loc, realTy, quotientAsInt); | ||
| // result = a - wholeQuotient * p | ||
| mlir::Value product = | ||
| mlir::arith::MulFOp::create(builder, loc, wholeQuotient, p, contractAttr); | ||
| return mlir::arith::SubFOp::create(builder, loc, a, product, contractAttr); | ||
| } | ||
|
|
||
| mlir::Value IntrinsicLibrary::genMod(mlir::Type resultType, | ||
| llvm::ArrayRef<mlir::Value> args) { | ||
| auto mod = builder.getModule(); | ||
| bool useFastRealMod = false; | ||
| if (auto attr = mod->getAttrOfType<mlir::BoolAttr>("fir.fast_real_mod")) | ||
| useFastRealMod = attr.getValue(); | ||
|
|
||
| assert(args.size() == 2); | ||
| if (resultType.isUnsignedInteger()) { | ||
| mlir::Type signlessType = mlir::IntegerType::get( | ||
|
|
@@ -7022,9 +7045,16 @@ mlir::Value IntrinsicLibrary::genMod(mlir::Type resultType, | |
| if (mlir::isa<mlir::IntegerType>(resultType)) | ||
| return mlir::arith::RemSIOp::create(builder, loc, args[0], args[1]); | ||
|
|
||
| // Use runtime. | ||
| return builder.createConvert( | ||
| loc, resultType, fir::runtime::genMod(builder, loc, args[0], args[1])); | ||
| if (useFastRealMod && resultType.isFloat()) { | ||
|
||
| // If fast MOD for REAL has been requested, generate less precise, | ||
| // but faster code directly. | ||
| return builder.createConvert(loc, resultType, | ||
| genFastMod(builder, loc, args[0], args[1])); | ||
| } else { | ||
| // Use runtime. | ||
| return builder.createConvert( | ||
| loc, resultType, fir::runtime::genMod(builder, loc, args[0], args[1])); | ||
| } | ||
| } | ||
|
|
||
| // MODULO | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,77 @@ | ||
| ! RUN: %flang_fc1 -ffast-real-mod -emit-mlir -o - %s | FileCheck %s --check-prefixes=CHECK%if target=x86_64{{.*}} %{,CHECK-KIND10%}%if flang-supports-f128-math %{,CHECK-KIND16%} | ||
|
||
|
|
||
| ! CHECK: module attributes {{{.*}}fir.fast_real_mod = true{{.*}}} | ||
|
|
||
| ! CHECK-LABEL: @_QPmod_real4 | ||
| ! Test case: MOD on real(kind=4) operands, r = mod(a, p). | ||
| ! The FileCheck directives in the body expect the loads of a and p followed by | ||
| ! divf, convert to si32, convert back to f32, mulf and subf (all arith ops | ||
| ! tagged fastmath<contract>), with the result stored to r. | ||
| subroutine mod_real4(r, a, p) | ||
| implicit none | ||
| real(kind=4) :: r, a, p | ||
| ! CHECK: %[[A:.*]] = fir.declare{{.*}}a" | ||
| ! CHECK: %[[P:.*]] = fir.declare{{.*}}p" | ||
| ! CHECK: %[[R:.*]] = fir.declare{{.*}}r" | ||
| ! CHECK: %[[A_LOAD:.*]] = fir.load %[[A]] | ||
| ! CHECK: %[[P_LOAD:.*]] = fir.load %[[P]] | ||
| ! CHECK: %[[DIV:.*]] = arith.divf %[[A_LOAD]], %[[P_LOAD]] fastmath<contract> : f32 | ||
| ! CHECK: %[[CV1:.*]] = fir.convert %[[DIV]] : (f32) -> si32 | ||
| ! CHECK: %[[CV2:.*]] = fir.convert %[[CV1]] : (si32) -> f32 | ||
| ! CHECK: %[[MUL:.*]] = arith.mulf %[[CV2]], %[[P_LOAD]] fastmath<contract> : f32 | ||
| ! CHECK: %[[SUB:.*]] = arith.subf %[[A_LOAD]], %[[MUL]] fastmath<contract> : f32 | ||
| ! CHECK: fir.store %[[SUB]] to %[[R]] : !fir.ref<f32> | ||
| r = mod(a, p) | ||
| end subroutine mod_real4 | ||
|
|
||
| ! CHECK-LABEL: @_QPmod_real8 | ||
| ! Test case: MOD on real(kind=8) operands, r = mod(a, p). | ||
| ! The FileCheck directives in the body expect the loads of a and p followed by | ||
| ! divf, convert to si64, convert back to f64, mulf and subf (all arith ops | ||
| ! tagged fastmath<contract>), with the result stored to r. | ||
| subroutine mod_real8(r, a, p) | ||
| implicit none | ||
| real(kind=8) :: r, a, p | ||
| ! CHECK: %[[A:.*]] = fir.declare{{.*}}a" | ||
| ! CHECK: %[[P:.*]] = fir.declare{{.*}}p" | ||
| ! CHECK: %[[R:.*]] = fir.declare{{.*}}r" | ||
| ! CHECK: %[[A_LOAD:.*]] = fir.load %[[A]] | ||
| ! CHECK: %[[P_LOAD:.*]] = fir.load %[[P]] | ||
| ! CHECK: %[[DIV:.*]] = arith.divf %[[A_LOAD]], %[[P_LOAD]] fastmath<contract> : f64 | ||
| ! CHECK: %[[CV1:.*]] = fir.convert %[[DIV]] : (f64) -> si64 | ||
| ! CHECK: %[[CV2:.*]] = fir.convert %[[CV1]] : (si64) -> f64 | ||
| ! CHECK: %[[MUL:.*]] = arith.mulf %[[CV2]], %[[P_LOAD]] fastmath<contract> : f64 | ||
| ! CHECK: %[[SUB:.*]] = arith.subf %[[A_LOAD]], %[[MUL]] fastmath<contract> : f64 | ||
| ! CHECK: fir.store %[[SUB]] to %[[R]] : !fir.ref<f64> | ||
| r = mod(a, p) | ||
| end subroutine mod_real8 | ||
|
|
||
| ! CHECK-LABEL: @_QPmod_real10 | ||
| ! Test case: MOD on real(kind=10) operands, r = mod(a, p). | ||
| ! kind10 is 10 when selected_real_kind(p=18) equals 10 and falls back to 4 | ||
| ! otherwise. The KIND10 directives in the body expect divf, convert to si80, | ||
| ! convert back to f80, mulf and subf (arith ops tagged fastmath<contract>); | ||
| ! the RUN line only enables that prefix when the target matches x86_64. | ||
| subroutine mod_real10(r, a, p) | ||
| implicit none | ||
| integer, parameter :: kind10 = merge(10, 4, selected_real_kind(p=18).eq.10) | ||
| real(kind=kind10) :: r, a, p | ||
| ! CHECK-KIND10: %[[A:.*]] = fir.declare{{.*}}a" | ||
| ! CHECK-KIND10: %[[P:.*]] = fir.declare{{.*}}p" | ||
| ! CHECK-KIND10: %[[R:.*]] = fir.declare{{.*}}r" | ||
| ! CHECK-KIND10: %[[A_LOAD:.*]] = fir.load %[[A]] | ||
| ! CHECK-KIND10: %[[P_LOAD:.*]] = fir.load %[[P]] | ||
| ! CHECK-KIND10: %[[DIV:.*]] = arith.divf %[[A_LOAD]], %[[P_LOAD]] fastmath<contract> : f80 | ||
| ! CHECK-KIND10: %[[CV1:.*]] = fir.convert %[[DIV]] : (f80) -> si80 | ||
| ! CHECK-KIND10: %[[CV2:.*]] = fir.convert %[[CV1]] : (si80) -> f80 | ||
| ! CHECK-KIND10: %[[MUL:.*]] = arith.mulf %[[CV2]], %[[P_LOAD]] fastmath<contract> : f80 | ||
| ! CHECK-KIND10: %[[SUB:.*]] = arith.subf %[[A_LOAD]], %[[MUL]] fastmath<contract> : f80 | ||
| ! CHECK-KIND10: fir.store %[[SUB]] to %[[R]] : !fir.ref<f80> | ||
| r = mod(a, p) | ||
| end subroutine mod_real10 | ||
|
|
||
| ! CHECK-LABEL: @_QPmod_real16 | ||
| ! Test case: MOD on real(kind=16) operands, r = mod(a, p). | ||
| ! kind16 is 16 when selected_real_kind(p=33) equals 16 and falls back to 4 | ||
| ! otherwise. The KIND16 directives in the body expect divf, convert to si128, | ||
| ! convert back to f128, mulf and subf (arith ops tagged fastmath<contract>); | ||
| ! the RUN line only enables that prefix under flang-supports-f128-math. | ||
| subroutine mod_real16(r, a, p) | ||
| implicit none | ||
| integer, parameter :: kind16 = merge(16, 4, selected_real_kind(p=33).eq.16) | ||
| real(kind=kind16) :: r, a, p | ||
| ! CHECK-KIND16: %[[A:.*]] = fir.declare{{.*}}a" | ||
| ! CHECK-KIND16: %[[P:.*]] = fir.declare{{.*}}p" | ||
| ! CHECK-KIND16: %[[R:.*]] = fir.declare{{.*}}r" | ||
| ! CHECK-KIND16: %[[A_LOAD:.*]] = fir.load %[[A]] | ||
| ! CHECK-KIND16: %[[P_LOAD:.*]] = fir.load %[[P]] | ||
| ! CHECK-KIND16: %[[DIV:.*]] = arith.divf %[[A_LOAD]], %[[P_LOAD]] fastmath<contract> : f128 | ||
| ! CHECK-KIND16: %[[CV1:.*]] = fir.convert %[[DIV]] : (f128) -> si128 | ||
| ! CHECK-KIND16: %[[CV2:.*]] = fir.convert %[[CV1]] : (si128) -> f128 | ||
| ! CHECK-KIND16: %[[MUL:.*]] = arith.mulf %[[CV2]], %[[P_LOAD]] fastmath<contract> : f128 | ||
| ! CHECK-KIND16: %[[SUB:.*]] = arith.subf %[[A_LOAD]], %[[MUL]] fastmath<contract> : f128 | ||
| ! CHECK-KIND16: fir.store %[[SUB]] to %[[R]] : !fir.ref<f128> | ||
| r = mod(a, p) | ||
| end subroutine mod_real16 | ||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Can you please also add `-fno-fast-real-mod`?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I have added it to my local copy for now and will push it with my next update.