Skip to content

Commit aa3dcae

Browse files
SaieieiSairudra More
authored andcommitted
[OpenMP] Fix defaultmap(firstprivate:pointer) handling (llvm#169622)
This fixes a bug where pointers from defaultmap(firstprivate:pointer) were incorrectly treated as firstprivate literals, causing OMP_MAP_LITERAL to be set. This prevented the runtime from performing device address lookup. Realted PR llvm#167879 Co-authored-by: Sairudra More <[email protected]>
1 parent c1459c9 commit aa3dcae

File tree

4 files changed

+237
-15
lines changed

4 files changed

+237
-15
lines changed

clang/lib/CodeGen/CGOpenMPRuntime.cpp

Lines changed: 65 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,7 @@
2828
#include "clang/Basic/SourceManager.h"
2929
#include "clang/CodeGen/ConstantInitBuilder.h"
3030
#include "llvm/ADT/ArrayRef.h"
31+
#include "llvm/ADT/SmallSet.h"
3132
#include "llvm/ADT/SmallVector.h"
3233
#include "llvm/ADT/StringExtras.h"
3334
#include "llvm/Bitcode/BitcodeReader.h"
@@ -7211,6 +7212,9 @@ class MappableExprsHandler {
72117212
/// firstprivate, false otherwise.
72127213
llvm::DenseMap<CanonicalDeclPtr<const VarDecl>, bool> FirstPrivateDecls;
72137214

7215+
/// Set of defaultmap clause kinds that use firstprivate behavior.
7216+
llvm::SmallSet<OpenMPDefaultmapClauseKind, 4> DefaultmapFirstprivateKinds;
7217+
72147218
/// Map between device pointer declarations and their expression components.
72157219
/// The key value for declarations in 'this' is null.
72167220
llvm::DenseMap<
@@ -9007,6 +9011,10 @@ class MappableExprsHandler {
90079011
FirstPrivateDecls.try_emplace(VD, /*Implicit=*/true);
90089012
}
90099013
}
9014+
// Extract defaultmap clause information.
9015+
for (const auto *C : Dir.getClausesOfKind<OMPDefaultmapClause>())
9016+
if (C->getDefaultmapModifier() == OMPC_DEFAULTMAP_MODIFIER_firstprivate)
9017+
DefaultmapFirstprivateKinds.insert(C->getDefaultmapKind());
90109018
// Extract device pointer clause information.
90119019
for (const auto *C : Dir.getClausesOfKind<OMPIsDevicePtrClause>())
90129020
for (auto L : C->component_lists())
@@ -9584,6 +9592,36 @@ class MappableExprsHandler {
95849592
}
95859593
}
95869594

9595+
/// Check if a variable should be treated as firstprivate due to explicit
9596+
/// firstprivate clause or defaultmap(firstprivate:...).
9597+
bool isEffectivelyFirstprivate(const VarDecl *VD, QualType Type) const {
9598+
// Check explicit firstprivate clauses (not implicit from defaultmap)
9599+
auto I = FirstPrivateDecls.find(VD);
9600+
if (I != FirstPrivateDecls.end() && !I->getSecond())
9601+
return true; // Explicit firstprivate only
9602+
9603+
// Check defaultmap(firstprivate:scalar) for scalar types
9604+
if (DefaultmapFirstprivateKinds.count(OMPC_DEFAULTMAP_scalar)) {
9605+
if (Type->isScalarType())
9606+
return true;
9607+
}
9608+
9609+
// Check defaultmap(firstprivate:pointer) for pointer types
9610+
if (DefaultmapFirstprivateKinds.count(OMPC_DEFAULTMAP_pointer)) {
9611+
if (Type->isAnyPointerType())
9612+
return true;
9613+
}
9614+
9615+
// Check defaultmap(firstprivate:aggregate) for aggregate types
9616+
if (DefaultmapFirstprivateKinds.count(OMPC_DEFAULTMAP_aggregate)) {
9617+
if (Type->isAggregateType())
9618+
return true;
9619+
}
9620+
9621+
// Check defaultmap(firstprivate:all) for all types
9622+
return DefaultmapFirstprivateKinds.count(OMPC_DEFAULTMAP_all);
9623+
}
9624+
95879625
/// Generate the default map information for a given capture \a CI,
95889626
/// record field declaration \a RI and captured value \a CV.
95899627
void generateDefaultMapInfo(const CapturedStmt::Capture &CI,
@@ -9611,13 +9649,23 @@ class MappableExprsHandler {
96119649
CombinedInfo.DevicePtrDecls.push_back(nullptr);
96129650
CombinedInfo.DevicePointers.push_back(DeviceInfoTy::None);
96139651
CombinedInfo.Pointers.push_back(CV);
9652+
bool IsFirstprivate =
9653+
isEffectivelyFirstprivate(VD, RI.getType().getNonReferenceType());
9654+
96149655
if (!RI.getType()->isAnyPointerType()) {
96159656
// We have to signal to the runtime captures passed by value that are
96169657
// not pointers.
96179658
CombinedInfo.Types.push_back(
96189659
OpenMPOffloadMappingFlags::OMP_MAP_LITERAL);
96199660
CombinedInfo.Sizes.push_back(CGF.Builder.CreateIntCast(
96209661
CGF.getTypeSize(RI.getType()), CGF.Int64Ty, /*isSigned=*/true));
9662+
} else if (IsFirstprivate) {
9663+
// Firstprivate pointers should be passed by value (as literals)
9664+
// without performing a present table lookup at runtime.
9665+
CombinedInfo.Types.push_back(
9666+
OpenMPOffloadMappingFlags::OMP_MAP_LITERAL);
9667+
// Use zero size for pointer literals (just passing the pointer value)
9668+
CombinedInfo.Sizes.push_back(llvm::Constant::getNullValue(CGF.Int64Ty));
96219669
} else {
96229670
// Pointers are implicitly mapped with a zero size and no flags
96239671
// (other than first map that is added for all implicit maps).
@@ -9631,26 +9679,31 @@ class MappableExprsHandler {
96319679
assert(CI.capturesVariable() && "Expected captured reference.");
96329680
const auto *PtrTy = cast<ReferenceType>(RI.getType().getTypePtr());
96339681
QualType ElementType = PtrTy->getPointeeType();
9634-
CombinedInfo.Sizes.push_back(CGF.Builder.CreateIntCast(
9635-
CGF.getTypeSize(ElementType), CGF.Int64Ty, /*isSigned=*/true));
9636-
// The default map type for a scalar/complex type is 'to' because by
9637-
// default the value doesn't have to be retrieved. For an aggregate
9638-
// type, the default is 'tofrom'.
9639-
CombinedInfo.Types.push_back(getMapModifiersForPrivateClauses(CI));
96409682
const VarDecl *VD = CI.getCapturedVar();
9641-
auto I = FirstPrivateDecls.find(VD);
9683+
bool IsFirstprivate = isEffectivelyFirstprivate(VD, ElementType);
96429684
CombinedInfo.Exprs.push_back(VD->getCanonicalDecl());
96439685
CombinedInfo.BasePointers.push_back(CV);
96449686
CombinedInfo.DevicePtrDecls.push_back(nullptr);
96459687
CombinedInfo.DevicePointers.push_back(DeviceInfoTy::None);
9646-
if (I != FirstPrivateDecls.end() && ElementType->isAnyPointerType()) {
9647-
Address PtrAddr = CGF.EmitLoadOfReference(CGF.MakeAddrLValue(
9648-
CV, ElementType, CGF.getContext().getDeclAlign(VD),
9649-
AlignmentSource::Decl));
9650-
CombinedInfo.Pointers.push_back(PtrAddr.emitRawPointer(CGF));
9688+
9689+
// For firstprivate pointers, pass by value instead of dereferencing
9690+
if (IsFirstprivate && ElementType->isAnyPointerType()) {
9691+
// Treat as a literal value (pass the pointer value itself)
9692+
CombinedInfo.Pointers.push_back(CV);
9693+
// Use zero size for pointer literals
9694+
CombinedInfo.Sizes.push_back(llvm::Constant::getNullValue(CGF.Int64Ty));
9695+
CombinedInfo.Types.push_back(
9696+
OpenMPOffloadMappingFlags::OMP_MAP_LITERAL);
96519697
} else {
9698+
CombinedInfo.Sizes.push_back(CGF.Builder.CreateIntCast(
9699+
CGF.getTypeSize(ElementType), CGF.Int64Ty, /*isSigned=*/true));
9700+
// The default map type for a scalar/complex type is 'to' because by
9701+
// default the value doesn't have to be retrieved. For an aggregate
9702+
// type, the default is 'tofrom'.
9703+
CombinedInfo.Types.push_back(getMapModifiersForPrivateClauses(CI));
96529704
CombinedInfo.Pointers.push_back(CV);
96539705
}
9706+
auto I = FirstPrivateDecls.find(VD);
96549707
if (I != FirstPrivateDecls.end())
96559708
IsImplicit = I->getSecond();
96569709
}

clang/test/OpenMP/target_defaultmap_codegen_01.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -734,8 +734,8 @@ void explicit_maps_single (){
734734
// CK14-LABEL: @.__omp_offloading_{{.*}}explicit_maps_single{{.*}}_l{{[0-9]+}}.region_id = weak{{.*}} constant i8 0
735735

736736
// CK14: [[SIZE09:@.+]] = private {{.*}}constant [1 x i64] zeroinitializer
737-
// Map types: OMP_MAP_TARGET_PARAM | OMP_MAP_IMPLICIT = 544
738-
// CK14: [[MTYPE09:@.+]] = private {{.*}}constant [1 x i64] [i64 544]
737+
// Map types: OMP_MAP_TARGET_PARAM | OMP_MAP_LITERAL | OMP_MAP_IMPLICIT = 800
738+
// CK14: [[MTYPE09:@.+]] = private {{.*}}constant [1 x i64] [i64 800]
739739

740740
// CK14-LABEL: explicit_maps_single{{.*}}(
741741
void explicit_maps_single (){
Lines changed: 169 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,169 @@
1+
// RUN: %clang_cc1 -verify -fopenmp -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-unknown-unknown -emit-llvm %s -o - | FileCheck %s
2+
// RUN: %clang_cc1 -fopenmp -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -emit-pch -o %t %s
3+
// RUN: %clang_cc1 -fopenmp -fopenmp-targets=powerpc64le-ibm-linux-gnu -x c++ -triple powerpc64le-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
4+
// expected-no-diagnostics
5+
6+
#ifndef HEADER
7+
#define HEADER
8+
9+
/// ========================================================================
10+
/// Test: Firstprivate pointer handling in OpenMP target regions
11+
/// ========================================================================
12+
///
13+
/// This test verifies that pointers with firstprivate semantics get the
14+
/// OMP_MAP_LITERAL flag, enabling the runtime to pass pointer values directly
15+
/// without performing present table lookups.
16+
///
17+
/// Map type values:
18+
/// 288 = OMP_MAP_TARGET_PARAM (32) + OMP_MAP_LITERAL (256)
19+
/// Used for explicit firstprivate(ptr)
20+
///
21+
/// 800 = OMP_MAP_TARGET_PARAM (32) + OMP_MAP_LITERAL (256) + OMP_MAP_IS_PTR (512)
22+
/// Used for implicit firstprivate pointers (e.g., from defaultmap clauses)
23+
/// Note: 512 is OMP_MAP_IS_PTR, not IMPLICIT. Implicitness is tracked separately.
24+
///
25+
/// 544 = OMP_MAP_TARGET_PARAM (32) + OMP_MAP_IS_PTR (512)
26+
/// Incorrect behavior - missing LITERAL flag, causes runtime present table lookup
27+
///
28+
29+
///==========================================================================
30+
/// Test 1: Explicit firstprivate(pointer) → map type 288
31+
///==========================================================================
32+
33+
// CHECK-DAG: @.offload_maptypes{{[^.]*}} = private unnamed_addr constant [1 x i64] [i64 288]
34+
// CHECK-DAG: @.offload_sizes{{[^.]*}} = private unnamed_addr constant [1 x i64] zeroinitializer
35+
36+
void test1_explicit_firstprivate() {
37+
double *ptr = nullptr;
38+
39+
// Explicit firstprivate should generate map type 288
40+
// (TARGET_PARAM | LITERAL, no IS_PTR flag for explicit clauses)
41+
#pragma omp target firstprivate(ptr)
42+
{
43+
if (ptr) ptr[0] = 1.0;
44+
}
45+
}
46+
47+
///==========================================================================
48+
/// Test 2: defaultmap(firstprivate:pointer) → map type 800
49+
///==========================================================================
50+
51+
// CHECK-DAG: @.offload_maptypes{{.*}} = private unnamed_addr constant [1 x i64] [i64 800]
52+
// CHECK-DAG: @.offload_sizes{{.*}} = private unnamed_addr constant [1 x i64] zeroinitializer
53+
54+
void test2_defaultmap_firstprivate_pointer() {
55+
double *ptr = nullptr;
56+
57+
// defaultmap(firstprivate:pointer) creates implicit firstprivate
58+
// Should generate map type 800 (TARGET_PARAM | LITERAL | IS_PTR)
59+
#pragma omp target defaultmap(firstprivate:pointer)
60+
{
61+
if (ptr) ptr[0] = 2.0;
62+
}
63+
}
64+
65+
///==========================================================================
66+
/// Test 3: defaultmap(firstprivate:scalar) with double → map type 800
67+
///==========================================================================
68+
69+
// CHECK-DAG: @.offload_maptypes{{.*}} = private unnamed_addr constant [1 x i64] [i64 800]
70+
71+
void test3_defaultmap_scalar_double() {
72+
double d = 3.0;
73+
74+
// OpenMP's "scalar" category excludes pointers but includes arithmetic types
75+
// Double gets implicit firstprivate → map type 800
76+
#pragma omp target defaultmap(firstprivate:scalar)
77+
{
78+
d += 1.0;
79+
}
80+
}
81+
82+
///==========================================================================
83+
/// Test 4: Pointer with defaultmap(firstprivate:scalar) → map type 800
84+
///==========================================================================
85+
86+
// CHECK-DAG: @.offload_maptypes{{.*}} = private unnamed_addr constant [1 x i64] [i64 800]
87+
// CHECK-DAG: @.offload_sizes{{.*}} = private unnamed_addr constant [1 x i64] zeroinitializer
88+
89+
void test4_pointer_with_scalar_defaultmap() {
90+
double *ptr = nullptr;
91+
92+
// Note: defaultmap(firstprivate:scalar) does NOT apply to pointers (scalar excludes pointers).
93+
// However, the pointer still gets 800 because in OpenMP 5.0+, pointers without explicit
94+
// data-sharing attributes are implicitly firstprivate and lowered as IS_PTR|LITERAL|TARGET_PARAM.
95+
// This is the default pointer behavior, NOT due to the scalar defaultmap.
96+
#pragma omp target defaultmap(firstprivate:scalar)
97+
{
98+
if (ptr) ptr[0] = 4.0;
99+
}
100+
}
101+
102+
///==========================================================================
103+
/// Test 5: Multiple pointers with explicit firstprivate → all get 288
104+
///==========================================================================
105+
106+
// CHECK-DAG: @.offload_maptypes{{.*}} = private unnamed_addr constant [3 x i64] [i64 288, i64 288, i64 288]
107+
// CHECK-DAG: @.offload_sizes{{.*}} = private unnamed_addr constant [3 x i64] zeroinitializer
108+
109+
void test5_multiple_firstprivate() {
110+
int *a = nullptr;
111+
float *b = nullptr;
112+
double *c = nullptr;
113+
114+
// All explicit firstprivate pointers get map type 288
115+
#pragma omp target firstprivate(a, b, c)
116+
{
117+
if (a) a[0] = 6;
118+
if (b) b[0] = 7.0f;
119+
if (c) c[0] = 8.0;
120+
}
121+
}
122+
123+
///==========================================================================
124+
/// Test 6: Pointer to const with firstprivate → map type 288
125+
///==========================================================================
126+
127+
// CHECK-DAG: @.offload_maptypes{{.*}} = private unnamed_addr constant [1 x i64] [i64 288]
128+
// CHECK-DAG: @.offload_sizes{{.*}} = private unnamed_addr constant [1 x i64] zeroinitializer
129+
130+
void test6_const_pointer() {
131+
const double *const_ptr = nullptr;
132+
133+
// Const pointer with explicit firstprivate → 288
134+
#pragma omp target firstprivate(const_ptr)
135+
{
136+
if (const_ptr) {
137+
double val = const_ptr[0];
138+
(void)val;
139+
}
140+
}
141+
}
142+
143+
///==========================================================================
144+
/// Test 7: Pointer-to-pointer with firstprivate → map type 288
145+
///==========================================================================
146+
147+
// CHECK-DAG: @.offload_maptypes{{.*}} = private unnamed_addr constant [1 x i64] [i64 288]
148+
// CHECK-DAG: @.offload_sizes{{.*}} = private unnamed_addr constant [1 x i64] zeroinitializer
149+
150+
void test7_pointer_to_pointer() {
151+
int **pp = nullptr;
152+
153+
// Pointer-to-pointer with explicit firstprivate → 288
154+
#pragma omp target firstprivate(pp)
155+
{
156+
if (pp && *pp) (*pp)[0] = 9;
157+
}
158+
}
159+
160+
///==========================================================================
161+
/// Verification: The key fix is that firstprivate pointers now include
162+
/// the LITERAL flag (256), which tells the runtime to pass the pointer
163+
/// value directly instead of performing a present table lookup.
164+
///
165+
/// Before fix: Pointers got 544 (TARGET_PARAM | IS_PTR) → runtime lookup
166+
/// After fix: Pointers get 288 or 800 (includes LITERAL) → direct pass
167+
///==========================================================================
168+
169+
#endif // HEADER

clang/test/OpenMP/target_map_codegen_26.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -52,7 +52,7 @@
5252
// CK27-LABEL: @.__omp_offloading_{{.*}}zero_size_section_and_private_maps{{.*}}_l{{[0-9]+}}.region_id = weak constant i8 0
5353
// CK27-LABEL: @.__omp_offloading_{{.*}}zero_size_section_and_private_maps{{.*}}_l{{[0-9]+}}.region_id = weak constant i8 0
5454
// CK27: [[SIZE05:@.+]] = private {{.*}}constant [1 x i64] zeroinitializer
55-
// CK27: [[MTYPE05:@.+]] = private {{.*}}constant [1 x i64] [i64 32]
55+
// CK27: [[MTYPE05:@.+]] = private {{.*}}constant [1 x i64] [i64 288]
5656

5757
// CK27-LABEL: @.__omp_offloading_{{.*}}zero_size_section_and_private_maps{{.*}}_l{{[0-9]+}}.region_id = weak constant i8 0
5858
// CK27-LABEL: @.__omp_offloading_{{.*}}zero_size_section_and_private_maps{{.*}}_l{{[0-9]+}}.region_id = weak constant i8 0

0 commit comments

Comments
 (0)