[AMDGPU] Add llvm.amdgpu.update.dpp intrinsic

author Connor Abbott <cwabbott0@gmail.com>

Tue, 8 Aug 2017 18:52:22 +0000 (18:52 +0000)

committer Connor Abbott <cwabbott0@gmail.com>

Tue, 8 Aug 2017 18:52:22 +0000 (18:52 +0000)
author Connor Abbott <cwabbott0@gmail.com>
Tue, 8 Aug 2017 18:52:22 +0000 (18:52 +0000)
committer Connor Abbott <cwabbott0@gmail.com>
Tue, 8 Aug 2017 18:52:22 +0000 (18:52 +0000)
diff --git a/include/llvm/IR/IntrinsicsAMDGPU.td b/include/llvm/IR/IntrinsicsAMDGPU.td

index 40ac52e5d0d3f12712ae6e73aa454b0aad628b07..f2203470008f6109e073820b98e7924051efa6fe 100644 (file)
--- a/include/llvm/IR/IntrinsicsAMDGPU.td
+++ b/include/llvm/IR/IntrinsicsAMDGPU.td
@@ -788,6 +788,15 @@ def int_amdgcn_mov_dpp :
              [LLVMMatchType<0>, llvm_i32_ty, llvm_i32_ty, llvm_i32_ty,
               llvm_i1_ty], [IntrNoMem, IntrConvergent]>;
  
+// llvm.amdgcn.update.dpp.i32 <old> <src> <dpp_ctrl> <row_mask> <bank_mask> <bound_ctrl>
+// Should be equivalent to:
+// v_mov_b32 <dest> <old>
+// v_mov_b32 <dest> <src> <dpp_ctrl> <row_mask> <bank_mask> <bound_ctrl>
+def int_amdgcn_update_dpp :
+  Intrinsic<[llvm_anyint_ty],
+            [LLVMMatchType<0>, LLVMMatchType<0>, llvm_i32_ty, llvm_i32_ty,
+             llvm_i32_ty, llvm_i1_ty], [IntrNoMem, IntrConvergent]>;
+
  def int_amdgcn_s_dcache_wb :
    GCCBuiltin<"__builtin_amdgcn_s_dcache_wb">,
    Intrinsic<[], [], []>;
diff --git a/lib/Target/AMDGPU/VOP1Instructions.td b/lib/Target/AMDGPU/VOP1Instructions.td

index f20a20e91cd59fbddcf150afaef1d1d4420fa6a8..b2b9af3dca937f1e2f487f223b9c68f5b4734407 100644 (file)
--- a/lib/Target/AMDGPU/VOP1Instructions.td
+++ b/lib/Target/AMDGPU/VOP1Instructions.td
@@ -663,6 +663,14 @@ def : Pat <
                         (as_i1imm $bound_ctrl))
  >;
  
+def : Pat <
+  (i32 (int_amdgcn_update_dpp i32:$old, i32:$src, imm:$dpp_ctrl, imm:$row_mask,
+                      imm:$bank_mask, imm:$bound_ctrl)),
+  (V_MOV_B32_dpp $old, $src, (as_i32imm $dpp_ctrl),
+                       (as_i32imm $row_mask), (as_i32imm $bank_mask),
+                       (as_i1imm $bound_ctrl))
+>;
+
  def : Pat<
    (i32 (anyext i16:$src)),
    (COPY $src)
diff --git a/test/CodeGen/AMDGPU/llvm.amdgcn.update.dpp.ll b/test/CodeGen/AMDGPU/llvm.amdgcn.update.dpp.ll

new file mode 100644 (file)

index 0000000..4d1dbf5
--- /dev/null
+++ b/test/CodeGen/AMDGPU/llvm.amdgcn.update.dpp.ll
@@ -0,0 +1,17 @@
+; RUN: llc -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=VI -check-prefix=VI-OPT %s
+; RUN: llc -O0 -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=VI -check-prefix=VI-NOOPT %s
+
+; VI-LABEL: {{^}}dpp_test:
+; VI: v_mov_b32_e32 v0, s{{[0-9]+}}
+; VI: v_mov_b32_e32 v1, s{{[0-9]+}}
+; VI: s_nop 1
+; VI: v_mov_b32_dpp v0, v1 quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 ; encoding: [0xfa,0x02,0x00,0x7e,0x01,0x01,0x08,0x11]
+define amdgpu_kernel void @dpp_test(i32 addrspace(1)* %out, i32 %in1, i32 %in2) {
+  %tmp0 = call i32 @llvm.amdgcn.update.dpp.i32(i32 %in1, i32 %in2, i32 1, i32 1, i32 1, i1 1) #0
+  store i32 %tmp0, i32 addrspace(1)* %out
+  ret void
+}
+
+declare i32 @llvm.amdgcn.update.dpp.i32(i32, i32, i32, i32, i32, i1) #0
+
+attributes #0 = { nounwind readnone convergent }
author	Connor Abbott <cwabbott0@gmail.com>
	Tue, 8 Aug 2017 18:52:22 +0000 (18:52 +0000)
committer	Connor Abbott <cwabbott0@gmail.com>
	Tue, 8 Aug 2017 18:52:22 +0000 (18:52 +0000)
include/llvm/IR/IntrinsicsAMDGPU.td		patch \| blob \| history
lib/Target/AMDGPU/VOP1Instructions.td		patch \| blob \| history
test/CodeGen/AMDGPU/llvm.amdgcn.update.dpp.ll	[new file with mode: 0644]	patch \| blob