Skip to content

Commit 55f293d

Browse files
committed
Review comments pt.2
1 parent a7ca93a commit 55f293d

File tree

2 files changed

+11
-11
lines changed

2 files changed

+11
-11
lines changed

llvm/lib/Target/AMDGPU/SIISelLowering.cpp

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -4048,20 +4048,20 @@ SDValue SITargetLowering::lowerDYNAMIC_STACKALLOCImpl(SDValue Op,
40484048
Chain = BaseAddr.getValue(1);
40494049
Align StackAlign = TFL->getStackAlign();
40504050
if (Alignment > StackAlign) {
4051-
auto ScaledAlignment = (uint64_t)Alignment.value()
4052-
<< Subtarget->getWavefrontSizeLog2();
4053-
auto StackAlignMask = ScaledAlignment - 1;
4054-
auto TmpAddr = DAG.getNode(ISD::ADD, dl, VT, BaseAddr,
4055-
DAG.getConstant(StackAlignMask, dl, VT));
4051+
uint64_t ScaledAlignment = (uint64_t)Alignment.value()
4052+
<< Subtarget->getWavefrontSizeLog2();
4053+
uint64_t StackAlignMask = ScaledAlignment - 1;
4054+
SDValue TmpAddr = DAG.getNode(ISD::ADD, dl, VT, BaseAddr,
4055+
DAG.getConstant(StackAlignMask, dl, VT));
40564056
BaseAddr = DAG.getNode(ISD::AND, dl, VT, TmpAddr,
4057-
DAG.getConstant(ScaledAlignment, dl, VT));
4057+
DAG.getSignedConstant(-ScaledAlignment, dl, VT));
40584058
}
40594059

40604060
SDValue ScaledSize = DAG.getNode(
40614061
ISD::SHL, dl, VT, Size,
40624062
DAG.getConstant(Subtarget->getWavefrontSizeLog2(), dl, MVT::i32));
40634063

4064-
auto NewSP = DAG.getNode(ISD::ADD, dl, VT, BaseAddr, ScaledSize); // Value
4064+
SDValue NewSP = DAG.getNode(ISD::ADD, dl, VT, BaseAddr, ScaledSize); // Value
40654065

40664066
Chain = DAG.getCopyToReg(Chain, dl, SPReg, NewSP); // Output chain
40674067
Tmp2 = DAG.getCALLSEQ_END(Chain, 0, 0, SDValue(), dl);

llvm/test/CodeGen/AMDGPU/non-entry-alloca.ll

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -131,7 +131,7 @@ define amdgpu_kernel void @kernel_non_entry_block_static_alloca_uniformly_reache
131131
; MUBUF-NEXT: s_cbranch_scc1 .LBB1_2
132132
; MUBUF-NEXT: ; %bb.1: ; %bb.0
133133
; MUBUF-NEXT: s_add_i32 s4, s32, 0xfff
134-
; MUBUF-NEXT: s_and_b32 s4, s4, 0x1000
134+
; MUBUF-NEXT: s_and_b32 s4, s4, 0xfffff000
135135
; MUBUF-NEXT: s_lshl_b32 s5, s5, 2
136136
; MUBUF-NEXT: s_add_i32 s32, s4, 0x1000
137137
; MUBUF-NEXT: v_mov_b32_e32 v1, 0
@@ -166,7 +166,7 @@ define amdgpu_kernel void @kernel_non_entry_block_static_alloca_uniformly_reache
166166
; FLATSCR-NEXT: ; %bb.1: ; %bb.0
167167
; FLATSCR-NEXT: s_add_i32 s0, s32, 0xfff
168168
; FLATSCR-NEXT: v_mov_b32_e32 v1, 0
169-
; FLATSCR-NEXT: s_and_b32 s0, s0, 0x1000
169+
; FLATSCR-NEXT: s_and_b32 s0, s0, 0xfffff000
170170
; FLATSCR-NEXT: v_mov_b32_e32 v2, 1
171171
; FLATSCR-NEXT: s_lshl_b32 s1, s1, 2
172172
; FLATSCR-NEXT: s_add_i32 s32, s0, 0x1000
@@ -323,7 +323,7 @@ define void @func_non_entry_block_static_alloca_align64(ptr addrspace(1) %out, i
323323
; MUBUF-NEXT: s_cbranch_execz .LBB3_2
324324
; MUBUF-NEXT: ; %bb.1: ; %bb.0
325325
; MUBUF-NEXT: s_add_i32 s6, s32, 0xfff
326-
; MUBUF-NEXT: s_and_b32 s6, s6, 0x1000
326+
; MUBUF-NEXT: s_and_b32 s6, s6, 0xfffff000
327327
; MUBUF-NEXT: v_mov_b32_e32 v2, 0
328328
; MUBUF-NEXT: v_mov_b32_e32 v4, s6
329329
; MUBUF-NEXT: buffer_store_dword v2, v4, s[0:3], 0 offen
@@ -357,7 +357,7 @@ define void @func_non_entry_block_static_alloca_align64(ptr addrspace(1) %out, i
357357
; FLATSCR-NEXT: s_cbranch_execz .LBB3_2
358358
; FLATSCR-NEXT: ; %bb.1: ; %bb.0
359359
; FLATSCR-NEXT: s_add_i32 s2, s32, 0xfff
360-
; FLATSCR-NEXT: s_and_b32 s2, s2, 0x1000
360+
; FLATSCR-NEXT: s_and_b32 s2, s2, 0xfffff000
361361
; FLATSCR-NEXT: v_mov_b32_e32 v4, 0
362362
; FLATSCR-NEXT: v_mov_b32_e32 v5, 1
363363
; FLATSCR-NEXT: scratch_store_dwordx2 off, v[4:5], s2

0 commit comments

Comments
 (0)