Skip to content

Commit a091a82

Browse files
author
Marcos Maronas
authored
[Backport to 15] [DebugInfo] Round up #elts of TypeVector when calculating memory size (#2648)
* [DebugInfo] Round up #elts of TypeVector when calculating memory size (#2504) Round up number of elements in a Vector to a power of 2 when calculating memory size. Memory size will be calculated as BaseType * bit_ceil(ComponentCount). The previous calculation already rounded 3 elements to 4 elements. Signed-off-by: Lu, John <john.lu@intel.com> * Avoid requiring C++20 (#2600) bit_ceil requires C++20. Use llvm::bit_ceil to avoid this requirement. Signed-off-by: Lu, John <john.lu@intel.com> * Remove unecessary include that require c++20 (#2628) * Add own bit_ceil implementation. Signed-off-by: Marcos Maronas <marcos.maronas@intel.com> Signed-off-by: Lu, John <john.lu@intel.com>
1 parent 0303992 commit a091a82

File tree

4 files changed

+71
-9
lines changed

4 files changed

+71
-9
lines changed

lib/SPIRV/SPIRVInternal.h

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1098,6 +1098,15 @@ bool postProcessBuiltinsWithArrayArguments(Module *M, bool IsCpp = false);
10981098

10991099
template <typename T>
11001100
MetadataAsValue *map2MDString(LLVMContext &C, SPIRVValue *V);
1101+
1102+
/// Returns the smallest integral power of two no smaller than Value if Value is
1103+
/// nonzero. Returns 1 otherwise.
1104+
///
1105+
/// Ex. bitCeil(5) == 8.
1106+
///
1107+
/// The return value is undefined if the input is larger than the largest power
1108+
/// of two representable in SPIRVWord.
1109+
[[nodiscard]] SPIRVWord bitCeil(SPIRVWord Value);
11011110
} // namespace SPIRV
11021111

11031112
#endif // SPIRV_SPIRVINTERNAL_H

lib/SPIRV/SPIRVToLLVMDbgTran.cpp

Lines changed: 7 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -495,15 +495,13 @@ SPIRVToLLVMDbgTran::transTypeVector(const SPIRVExtInst *DebugInst) {
495495
transNonNullDebugType(BM->get<SPIRVExtInst>(Ops[BaseTypeIdx]));
496496
SPIRVWord Count = getConstantValueOrLiteral(Ops, ComponentCountIdx,
497497
DebugInst->getExtSetKind());
498-
// FIXME: The current design of SPIR-V Debug Info doesn't provide a field
499-
// for the derived memory size. Meanwhile, OpenCL/SYCL 3-element vectors
500-
// occupy the same amount of memory as 4-element vectors, hence the simple
501-
// elem_count * elem_size formula fails in this edge case.
502-
// Once the specification is updated to reflect the whole memory block's
503-
// size in SPIR-V, the calculations below must be replaced with a simple
504-
// translation of the known size.
505-
SPIRVWord SizeCount = (Count == 3) ? 4 : Count;
506-
uint64_t Size = getDerivedSizeInBits(BaseTy) * SizeCount;
498+
// Round up to a power of two.
499+
// OpenCL/SYCL 3-element vectors
500+
// occupy the same amount of memory as 4-element vectors
501+
// Clang rounds up the memory size of vectors to a power of 2.
502+
// Vulkan allows vec3 to have a memory size of 12, but in RenderDoc memory
503+
// size is not derived from debug info.
504+
const uint64_t Size = getDerivedSizeInBits(BaseTy) * bitCeil(Count);
507505

508506
SmallVector<llvm::Metadata *, 8> Subscripts;
509507
Subscripts.push_back(getDIBuilder(DebugInst).getOrCreateSubrange(0, Count));

lib/SPIRV/SPIRVUtil.cpp

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2492,4 +2492,20 @@ template MetadataAsValue *
24922492
map2MDString<internal::InternalJointMatrixLayout>(LLVMContext &, SPIRVValue *);
24932493
template MetadataAsValue *map2MDString<spv::Scope>(LLVMContext &, SPIRVValue *);
24942494

2495+
[[nodiscard]] SPIRVWord bitCeil(SPIRVWord Value) {
2496+
if (Value < 2)
2497+
return 1;
2498+
2499+
// If Value is already a power of 2, just return it.
2500+
if ((Value & (Value - 1)) == 0)
2501+
return Value;
2502+
2503+
Value--;
2504+
for (SPIRVWord Shift = std::numeric_limits<SPIRVWord>::digits >> 1; Shift;
2505+
Shift >>= 1) {
2506+
Value |= Value >> Shift;
2507+
}
2508+
return ++Value;
2509+
}
2510+
24952511
} // namespace SPIRV

test/DebugInfo/DebugInfoVector.ll

Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
; Ensure that a vector type's memory size is calculated as bit_ceil(# elements) * element size
2+
; even if the (# elements) is not 3.
3+
;
4+
; This test was derived from DebugInfo/X86/sycl-vec-3.ll.
5+
6+
; RUN: llvm-as < %s -o %t.bc
7+
8+
; RUN: llvm-spirv %t.bc -o %t.spv -spirv-ext=+SPV_INTEL_vector_compute
9+
; RUN: llvm-spirv -r %t.spv -o %t.bc
10+
; RUN: llvm-dis %t.bc -o - | FileCheck %s --check-prefixes=CHECK
11+
12+
target datalayout = "e-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-n8:16:32:64"
13+
target triple = "spir64-unknown-unknown"
14+
15+
%"class.cl::sycl::vec" = type { <832 x i32> }
16+
@vector = dso_local addrspace(1) global %"class.cl::sycl::vec" zeroinitializer, align 16, !dbg !0
17+
18+
!llvm.dbg.cu = !{!9}
19+
!llvm.module.flags = !{!10, !11, !12, !13, !14}
20+
21+
!0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
22+
!1 = distinct !DIGlobalVariable(name: "vector", scope: null, file: !2, line: 3, type: !3, isLocal: false, isDefinition: true)
23+
!2 = !DIFile(filename: "sycl-vec-3.cpp", directory: "/tmp")
24+
; CHECK: !DICompositeType(tag: DW_TAG_array_type, baseType: ![[BASE_TY:[0-9]+]],{{.*}} size: 32768, flags: DIFlagVector, elements: ![[ELEMS:[0-9]+]])
25+
!3 = distinct !DICompositeType(tag: DW_TAG_array_type, baseType: !6, file: !2, line: 3, size: 32768, flags: DIFlagVector, elements: !4, identifier: "_ZTSN2cl4sycl3vecIiLi3EEE")
26+
; CHECK-DAG: ![[ELEMS]] = !{![[ELEMS_RANGE:[0-9]+]]}
27+
!4 = !{!5}
28+
; CHECK-DAG: ![[ELEMS_RANGE]] = !DISubrange(count: 832{{.*}})
29+
!5 = !DISubrange(count: 832)
30+
; CHECK-DAG: ![[BASE_TY]] = !DIBasicType(name: "int", size: 32,{{.*}} encoding: DW_ATE_signed)
31+
!6 = !DIBasicType(name: "int", size: 32, align: 32, encoding: DW_ATE_signed)
32+
!7 = !{}
33+
!8 = !{!0}
34+
!9 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus, file: !2, producer: "clang version 13.0.0 (https://github.com/intel/llvm.git)", isOptimized: false, runtimeVersion: 0, emissionKind: FullDebug, enums: !7, retainedTypes: !7, globals: !8, imports: !7)
35+
!10 = !{i32 7, !"Dwarf Version", i32 4}
36+
!11 = !{i32 2, !"Debug Info Version", i32 3}
37+
!12 = !{i32 1, !"wchar_size", i32 4}
38+
!13 = !{i32 7, !"uwtable", i32 1}
39+
!14 = !{i32 7, !"frame-pointer", i32 2}

0 commit comments

Comments
 (0)