Skip to content
This repository was archived by the owner on May 9, 2024. It is now read-only.

Commit 1dac6a1

Browse files
committed
Increase SLM buffer size
1 parent 535783c commit 1dac6a1

File tree

1 file changed

+4
-4
lines changed
  • omniscidb/QueryEngine/Compiler

1 file changed

+4
-4
lines changed

omniscidb/QueryEngine/Compiler/genx.ll

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -12,10 +12,10 @@ declare i64 @__spirv_BuiltInSubgroupSize(i32 %dimention)
1212

1313
declare void @__spirv_ControlBarrier(i32 %execution_scope, i32 %memory_scope, i32 %memory_semantics)
1414

15-
@slm.buf.i64 = internal local_unnamed_addr addrspace(3) global [1024 x i64] zeroinitializer, align 4
15+
@slm.buf.i64 = internal local_unnamed_addr addrspace(3) global [4096 x i64] zeroinitializer, align 4
1616

1717
define i64 addrspace(4)* @declare_dynamic_shared_memory() {
18-
%res.share = bitcast [1024 x i64] addrspace(3)* @slm.buf.i64 to i64 addrspace(3)*
18+
%res.share = bitcast [4096 x i64] addrspace(3)* @slm.buf.i64 to i64 addrspace(3)*
1919
%res = addrspacecast i64 addrspace(3)* %res.share to i64 addrspace(4)*
2020
ret i64 addrspace(4)* %res
2121
}
@@ -333,15 +333,15 @@ define i64 addrspace(4)* @init_shared_mem(i64 addrspace(4)* %agg_init_val, i32 n
333333
.for_body:
334334
%pos.idx = phi i64 [ %pos, %.entry ], [ %pos.idx.new, %.for_body ]
335335
%agg_init_val.idx = getelementptr inbounds i64, i64 addrspace(4)* %agg_init_val, i64 %pos.idx
336-
%slm.idx = getelementptr inbounds [1024 x i64], [1024 x i64] addrspace(3)* @slm.buf.i64, i64 0, i64 %pos.idx
336+
%slm.idx = getelementptr inbounds [4096 x i64], [4096 x i64] addrspace(3)* @slm.buf.i64, i64 0, i64 %pos.idx
337337
%val = load i64, i64 addrspace(4)* %agg_init_val.idx
338338
store i64 %val, i64 addrspace(3)* %slm.idx
339339
%pos.idx.new = add nsw i64 %pos.idx, %wgnum
340340
%cond = icmp slt i64 %pos.idx.new, %buf.units.i64
341341
br i1 %cond, label %.for_body, label %.exit
342342
.exit:
343343
call void @sync_threadblock()
344-
%res.ptr = bitcast [1024 x i64] addrspace(3)* @slm.buf.i64 to i64 addrspace(3)*
344+
%res.ptr = bitcast [4096 x i64] addrspace(3)* @slm.buf.i64 to i64 addrspace(3)*
345345
%res.ptr.casted = addrspacecast i64 addrspace(3)* %res.ptr to i64 addrspace(4)*
346346
ret i64 addrspace(4)* %res.ptr.casted
347347
}

0 commit comments

Comments
 (0)