From: Changpeng Fang Date: Thu, 3 Aug 2017 16:37:02 +0000 (+0000) Subject: AMDGPU/SI: Don't fix a PHI under uniform branch in SIFixSGPRCopies only when sources... X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=d865f4ba1b0a33f1e7c8d39843b3e57b11c7a9b1;p=llvm AMDGPU/SI: Don't fix a PHI under uniform branch in SIFixSGPRCopies only when sources and destination are all sgprs Summary: If a PHI has at lease one VGPR operand, we have to fix the PHI in SIFixSGPRCopies. Reviewer: Matt Differential Revision: http://reviews.llvm.org/D34727 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@309959 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/lib/Target/AMDGPU/SIFixSGPRCopies.cpp b/lib/Target/AMDGPU/SIFixSGPRCopies.cpp index 0a795c99f94..32e83cb385f 100644 --- a/lib/Target/AMDGPU/SIFixSGPRCopies.cpp +++ b/lib/Target/AMDGPU/SIFixSGPRCopies.cpp @@ -604,7 +604,8 @@ bool SIFixSGPRCopies::runOnMachineFunction(MachineFunction &MF) { // We don't need to fix the PHI if the common dominator of the // two incoming blocks terminates with a uniform branch. - if (MI.getNumExplicitOperands() == 5) { + bool HasVGPROperand = phiHasVGPROperands(MI, MRI, TRI, TII); + if (MI.getNumExplicitOperands() == 5 && !HasVGPROperand) { MachineBasicBlock *MBB0 = MI.getOperand(2).getMBB(); MachineBasicBlock *MBB1 = MI.getOperand(4).getMBB(); @@ -649,8 +650,7 @@ bool SIFixSGPRCopies::runOnMachineFunction(MachineFunction &MF) { // is no chance for values to be over-written. SmallSet Visited; - if (phiHasVGPROperands(MI, MRI, TRI, TII) || - !phiHasBreakDef(MI, MRI, Visited)) { + if (HasVGPROperand || !phiHasBreakDef(MI, MRI, Visited)) { DEBUG(dbgs() << "Fixing PHI: " << MI); TII->moveToVALU(MI); } diff --git a/test/CodeGen/AMDGPU/uniform-cfg.ll b/test/CodeGen/AMDGPU/uniform-cfg.ll index 9416336a44e..3c25dc7f0e7 100644 --- a/test/CodeGen/AMDGPU/uniform-cfg.ll +++ b/test/CodeGen/AMDGPU/uniform-cfg.ll @@ -557,6 +557,28 @@ done: ret void } +; GCN-LABEL: {{^}}move_to_valu_vgpr_operand_phi: +; GCN: v_add_i32_e32 +; GCN: ds_write_b32 +define void @move_to_valu_vgpr_operand_phi(i32 addrspace(3)* %out) { +bb0: + br label %bb1 + +bb1: ; preds = %bb3, %bb0 + %tmp0 = phi i32 [ 8, %bb0 ], [ %tmp4, %bb3 ] + %tmp1 = add nsw i32 %tmp0, -1 + %tmp2 = getelementptr inbounds i32, i32 addrspace(3)* %out, i32 %tmp1 + br i1 undef, label %bb2, label %bb3 + +bb2: ; preds = %bb1 + store volatile i32 1, i32 addrspace(3)* %tmp2, align 4 + br label %bb3 + +bb3: ; preds = %bb2, %bb1 + %tmp4 = add nsw i32 %tmp0, 2 + br label %bb1 +} + declare i32 @llvm.amdgcn.workitem.id.x() #0 attributes #0 = { nounwind readnone }