From ab06ef3e9ba29d304f14061382f9c040812a3a55 Mon Sep 17 00:00:00 2001 From: Matt Arsenault Date: Sat, 2 Feb 2019 23:35:15 +0000 Subject: [PATCH] AMDGPU/GlobalISel: Legalize icmp for pointer types git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@352976 91177308-0d34-0410-b5e6-96231b3b80d8 --- lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp | 11 +- .../AMDGPU/GlobalISel/legalize-icmp.mir | 175 ++++++++++++++++++ 2 files changed, 185 insertions(+), 1 deletion(-) diff --git a/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp b/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp index 2c4c8d9580d..a123d7320cb 100644 --- a/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp +++ b/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp @@ -200,7 +200,16 @@ AMDGPULegalizerInfo::AMDGPULegalizerInfo(const GCNSubtarget &ST, setAction({G_BLOCK_ADDR, CodePtr}, Legal); - getActionDefinitionsBuilder({G_ICMP, G_FCMP}) + getActionDefinitionsBuilder(G_ICMP) + .legalForCartesianProduct( + {S1}, {S32, S64, GlobalPtr, LocalPtr, ConstantPtr, PrivatePtr, FlatPtr}) + .legalFor({{S1, S32}, {S1, S64}}) + .widenScalarToNextPow2(1) + .clampScalar(1, S32, S64) + .scalarize(0) + .legalIf(all(typeIs(0, S1), isPointer(1))); + + getActionDefinitionsBuilder(G_FCMP) .legalFor({{S1, S32}, {S1, S64}}) .widenScalarToNextPow2(1) .clampScalar(1, S32, S64) diff --git a/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir b/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir index eadba8dcef3..302e1bfaaf2 100644 --- a/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir +++ b/test/CodeGen/AMDGPU/GlobalISel/legalize-icmp.mir @@ -164,3 +164,178 @@ body: | S_NOP 0, implicit %3 ... + +--- +name: test_icmp_p0 +body: | + bb.0.entry: + liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 + ; CHECK-LABEL: name: test_icmp_p0 + ; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $vgpr0_vgpr1 + ; CHECK: [[COPY1:%[0-9]+]]:_(p0) = COPY $vgpr0_vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p0), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p0) = COPY $vgpr0_vgpr1 + %1:_(p0) = COPY $vgpr0_vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_p1 +body: | + bb.0.entry: + liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 + ; CHECK-LABEL: name: test_icmp_p1 + ; CHECK: [[COPY:%[0-9]+]]:_(p1) = COPY $vgpr0_vgpr1 + ; CHECK: [[COPY1:%[0-9]+]]:_(p1) = COPY $vgpr0_vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p1), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p1) = COPY $vgpr0_vgpr1 + %1:_(p1) = COPY $vgpr0_vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_p2 +body: | + bb.0.entry: + liveins: $vgpr0, $vgpr1 + + ; CHECK-LABEL: name: test_icmp_p2 + ; CHECK: [[COPY:%[0-9]+]]:_(p2) = COPY $vgpr0 + ; CHECK: [[COPY1:%[0-9]+]]:_(p2) = COPY $vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p2), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p2) = COPY $vgpr0 + %1:_(p2) = COPY $vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_p3 +body: | + bb.0.entry: + liveins: $vgpr0, $vgpr1 + + ; CHECK-LABEL: name: test_icmp_p3 + ; CHECK: [[COPY:%[0-9]+]]:_(p3) = COPY $vgpr0 + ; CHECK: [[COPY1:%[0-9]+]]:_(p3) = COPY $vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p3), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p3) = COPY $vgpr0 + %1:_(p3) = COPY $vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_p4 +body: | + bb.0.entry: + liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 + ; CHECK-LABEL: name: test_icmp_p4 + ; CHECK: [[COPY:%[0-9]+]]:_(p4) = COPY $vgpr0_vgpr1 + ; CHECK: [[COPY1:%[0-9]+]]:_(p4) = COPY $vgpr0_vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p4), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p4) = COPY $vgpr0_vgpr1 + %1:_(p4) = COPY $vgpr0_vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_p5 +body: | + bb.0.entry: + liveins: $vgpr0, $vgpr1 + + ; CHECK-LABEL: name: test_icmp_p5 + ; CHECK: [[COPY:%[0-9]+]]:_(p5) = COPY $vgpr0 + ; CHECK: [[COPY1:%[0-9]+]]:_(p5) = COPY $vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p5), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p5) = COPY $vgpr0 + %1:_(p5) = COPY $vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_p999 +body: | + bb.0.entry: + liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 + ; CHECK-LABEL: name: test_icmp_p999 + ; CHECK: [[COPY:%[0-9]+]]:_(p999) = COPY $vgpr0_vgpr1 + ; CHECK: [[COPY1:%[0-9]+]]:_(p999) = COPY $vgpr0_vgpr1 + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[COPY]](p999), [[COPY1]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: $vgpr0 = COPY [[SEXT]](s32) + %0:_(p999) = COPY $vgpr0_vgpr1 + %1:_(p999) = COPY $vgpr0_vgpr1 + %2:_(s1) = G_ICMP intpred(ne), %0, %1 + %3:_(s32) = G_SEXT %2 + $vgpr0 = COPY %3 +... + +--- +name: test_icmp_v2p3 +body: | + bb.0.entry: + liveins: $vgpr0_vgpr1, $vgpr2_vgpr3 + ; CHECK-LABEL: name: test_icmp_v2p3 + ; CHECK: [[COPY:%[0-9]+]]:_(<2 x p3>) = COPY $vgpr0_vgpr1 + ; CHECK: [[COPY1:%[0-9]+]]:_(<2 x p3>) = COPY $vgpr0_vgpr1 + ; CHECK: [[UV:%[0-9]+]]:_(p3), [[UV1:%[0-9]+]]:_(p3) = G_UNMERGE_VALUES [[COPY]](<2 x p3>) + ; CHECK: [[UV2:%[0-9]+]]:_(p3), [[UV3:%[0-9]+]]:_(p3) = G_UNMERGE_VALUES [[COPY1]](<2 x p3>) + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV]](p3), [[UV2]] + ; CHECK: [[ICMP1:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV1]](p3), [[UV3]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: [[SEXT1:%[0-9]+]]:_(s32) = G_SEXT [[ICMP1]](s1) + ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[SEXT]](s32), [[SEXT1]](s32) + ; CHECK: $vgpr0_vgpr1 = COPY [[BUILD_VECTOR]](<2 x s32>) + %0:_(<2 x p3>) = COPY $vgpr0_vgpr1 + %1:_(<2 x p3>) = COPY $vgpr0_vgpr1 + %2:_(<2 x s1>) = G_ICMP intpred(ne), %0, %1 + %3:_(<2 x s32>) = G_SEXT %2 + $vgpr0_vgpr1 = COPY %3 +... + +--- +name: test_icmp_v2p999 +body: | + bb.0.entry: + liveins: $vgpr0_vgpr1_vgpr2_vgpr3, $vgpr4_vgpr5_vgpr6_vgpr7 + ; CHECK-LABEL: name: test_icmp_v2p999 + ; CHECK: [[COPY:%[0-9]+]]:_(<2 x p999>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3 + ; CHECK: [[COPY1:%[0-9]+]]:_(<2 x p999>) = COPY $vgpr4_vgpr5_vgpr6_vgpr7 + ; CHECK: [[UV:%[0-9]+]]:_(p999), [[UV1:%[0-9]+]]:_(p999) = G_UNMERGE_VALUES [[COPY]](<2 x p999>) + ; CHECK: [[UV2:%[0-9]+]]:_(p999), [[UV3:%[0-9]+]]:_(p999) = G_UNMERGE_VALUES [[COPY1]](<2 x p999>) + ; CHECK: [[ICMP:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV]](p999), [[UV2]] + ; CHECK: [[ICMP1:%[0-9]+]]:_(s1) = G_ICMP intpred(ne), [[UV1]](p999), [[UV3]] + ; CHECK: [[SEXT:%[0-9]+]]:_(s32) = G_SEXT [[ICMP]](s1) + ; CHECK: [[SEXT1:%[0-9]+]]:_(s32) = G_SEXT [[ICMP1]](s1) + ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[SEXT]](s32), [[SEXT1]](s32) + ; CHECK: $vgpr0_vgpr1 = COPY [[BUILD_VECTOR]](<2 x s32>) + %0:_(<2 x p999>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3 + %1:_(<2 x p999>) = COPY $vgpr4_vgpr5_vgpr6_vgpr7 + %2:_(<2 x s1>) = G_ICMP intpred(ne), %0, %1 + %3:_(<2 x s32>) = G_SEXT %2 + $vgpr0_vgpr1 = COPY %3 +... -- 2.50.1