[AArch64] Add support for the NEON scalar three-register-different instruction class (SQDMLAL, SQDMLSL, SQDMULL)

author Chad Rosier <mcrosier@codeaurora.org>

Thu, 17 Oct 2013 18:12:50 +0000 (18:12 +0000)

committer Chad Rosier <mcrosier@codeaurora.org>

Thu, 17 Oct 2013 18:12:50 +0000 (18:12 +0000)
author Chad Rosier <mcrosier@codeaurora.org>
Thu, 17 Oct 2013 18:12:50 +0000 (18:12 +0000)
committer Chad Rosier <mcrosier@codeaurora.org>
Thu, 17 Oct 2013 18:12:50 +0000 (18:12 +0000)
diff --git a/include/clang/Basic/arm_neon.td b/include/clang/Basic/arm_neon.td

index 56b7e9c15b4e90a76fa5ddfd6e08ac9a09e2e209..560ed9f01fe81d07d054a1213715b01ba75a46a6 100644 (file)
--- a/include/clang/Basic/arm_neon.td
+++ b/include/clang/Basic/arm_neon.td
@@ -878,4 +878,16 @@ def SCALAR_SUQADD : SInst<"vuqadd", "sss", "ScSsSiSl">;
  ////////////////////////////////////////////////////////////////////////////////
  // Scalar Unsigned Saturating Accumulated of Signed Value
  def SCALAR_USQADD : SInst<"vsqadd", "sss", "SUcSUsSUiSUl">;
+
+////////////////////////////////////////////////////////////////////////////////
+// Signed Saturating Doubling Multiply-Add Long
+def SCALAR_SQDMLAL : SInst<"vqdmlal", "rss", "SsSi">;
+
+////////////////////////////////////////////////////////////////////////////////
+// Signed Saturating Doubling Multiply-Subtract Long
+def SCALAR_SQDMLSL : SInst<"vqdmlsl", "rss", "SsSi">;
+
+////////////////////////////////////////////////////////////////////////////////
+// Signed Saturating Doubling Multiply Long
+def SCALAR_SQDMULL : SInst<"vqdmull", "rss", "SsSi">;
  }
diff --git a/lib/CodeGen/CGBuiltin.cpp b/lib/CodeGen/CGBuiltin.cpp

index 36829391e53a2305bd1218b1da1345eac07b253d..0802b3a3f65fe5348a6e3d0d746dbea43c9fa8b8 100644 (file)
--- a/lib/CodeGen/CGBuiltin.cpp
+++ b/lib/CodeGen/CGBuiltin.cpp
@@ -1755,6 +1755,7 @@ static Value *EmitAArch64ScalarBuiltinExpr(CodeGenFunction &CGF,
    // Extend element of one-element vector
    bool ExtendEle = false;
    bool OverloadInt = false;
+  bool OverloadWideInt = false;
    const char *s = NULL;
  
    SmallVector<Value *, 4> Ops;
@@ -2110,6 +2111,21 @@ static Value *EmitAArch64ScalarBuiltinExpr(CodeGenFunction &CGF,
    case AArch64::BI__builtin_neon_vsqaddd_u64:
      Int = Intrinsic::aarch64_neon_vsqadd;
      s = "vsqadd"; OverloadInt = true; break;
+  // Signed Saturating Doubling Multiply-Add Long
+  case AArch64::BI__builtin_neon_vqdmlalh_s16:
+  case AArch64::BI__builtin_neon_vqdmlals_s32:
+    Int = Intrinsic::aarch64_neon_vqdmlal;
+    s = "vqdmlal"; OverloadWideInt = true; break;
+  // Signed Saturating Doubling Multiply-Subtract Long
+  case AArch64::BI__builtin_neon_vqdmlslh_s16:
+  case AArch64::BI__builtin_neon_vqdmlsls_s32:
+    Int = Intrinsic::aarch64_neon_vqdmlsl;
+    s = "vqdmlsl"; OverloadWideInt = true; break;
+  // Signed Saturating Doubling Multiply Long
+  case AArch64::BI__builtin_neon_vqdmullh_s16:
+  case AArch64::BI__builtin_neon_vqdmulls_s32:
+    Int = Intrinsic::aarch64_neon_vqdmull;
+    s = "vqdmull"; OverloadWideInt = true; break;
    }
  
    if (!Int)
@@ -2135,8 +2151,7 @@ static Value *EmitAArch64ScalarBuiltinExpr(CodeGenFunction &CGF,
      llvm::Type *Tys[2] = {RTy, VTy};
      F = CGF.CGM.getIntrinsic(Int, Tys);
      assert(E->getNumArgs() == 1);
-  }
-  else if (OverloadInt) {
+  } else if (OverloadInt) {
      // Determine the type of this overloaded AArch64 intrinsic
      const Expr *Arg = E->getArg(E->getNumArgs()-1);
      llvm::Type *Ty = CGF.ConvertType(Arg->getType());
@@ -2144,6 +2159,13 @@ static Value *EmitAArch64ScalarBuiltinExpr(CodeGenFunction &CGF,
      assert(VTy);
  
      F = CGF.CGM.getIntrinsic(Int, VTy);
+  } else if (OverloadWideInt) {
+    // Determine the type of this overloaded AArch64 intrinsic
+    const Expr *Arg = E->getArg(E->getNumArgs()-1);
+    llvm::Type *Ty = CGF.ConvertType(Arg->getType());
+    llvm::VectorType *VTy = llvm::VectorType::get(Ty, 1);
+    llvm::VectorType *RTy = llvm::VectorType::getExtendedElementVectorType(VTy);
+    F = CGF.CGM.getIntrinsic(Int, RTy);
    } else
      F = CGF.CGM.getIntrinsic(Int);
  
diff --git a/test/CodeGen/aarch64-neon-intrinsics.c b/test/CodeGen/aarch64-neon-intrinsics.c

index d3fd0cd585ea7ed75f092265b663620c73a47d6f..ffee567c8916cce8bf2e2b040415015a9b484dfc 100644 (file)
--- a/test/CodeGen/aarch64-neon-intrinsics.c
+++ b/test/CodeGen/aarch64-neon-intrinsics.c
@@ -7225,3 +7225,39 @@ uint64_t test_vsqaddd_u64(uint64_t a, uint64_t b) {
  // CHECK: usqadd {{d[0-9]+}}, {{d[0-9]+}}
    return (uint64_t)vsqaddd_u64(a, b);
  }
+
+int32_t test_vqdmlalh_s16(int16_t a, int16_t b) {
+// CHECK: test_vqdmlalh_s16
+// CHECK: sqdmlal {{s[0-9]+}}, {{h[0-9]+}}, {{h[0-9]+}}
+  return (int32_t)vqdmlalh_s16(a, b);
+}
+
+int64_t test_vqdmlals_s32(int32_t a, int32_t b) {
+// CHECK: test_vqdmlals_s32
+// CHECK: sqdmlal {{d[0-9]+}}, {{s[0-9]+}}, {{s[0-9]+}}
+  return (int64_t)vqdmlals_s32(a, b);
+}
+
+int32_t test_vqdmlslh_s16(int16_t a, int16_t b) {
+// CHECK: test_vqdmlslh_s16
+// CHECK: sqdmlsl {{s[0-9]+}}, {{h[0-9]+}}, {{h[0-9]+}}
+  return (int32_t)vqdmlslh_s16(a, b);
+}
+
+int64_t test_vqdmlsls_s32(int32_t a, int32_t b) {
+// CHECK: test_vqdmlsls_s32
+// CHECK: sqdmlsl {{d[0-9]+}}, {{s[0-9]+}}, {{s[0-9]+}}
+  return (int64_t)vqdmlsls_s32(a, b);
+}
+
+int32_t test_vqdmullh_s16(int16_t a, int16_t b) {
+// CHECK: test_vqdmullh_s16
+// CHECK: sqdmull {{s[0-9]+}}, {{h[0-9]+}}, {{h[0-9]+}}
+  return (int32_t)vqdmullh_s16(a, b);
+}
+
+int64_t test_vqdmulls_s32(int32_t a, int32_t b) {
+// CHECK: test_vqdmulls_s32
+// CHECK: sqdmull {{d[0-9]+}}, {{s[0-9]+}}, {{s[0-9]+}}
+  return (int64_t)vqdmulls_s32(a, b);
+}
author	Chad Rosier <mcrosier@codeaurora.org>
	Thu, 17 Oct 2013 18:12:50 +0000 (18:12 +0000)
committer	Chad Rosier <mcrosier@codeaurora.org>
	Thu, 17 Oct 2013 18:12:50 +0000 (18:12 +0000)
include/clang/Basic/arm_neon.td		patch | blob | history
lib/CodeGen/CGBuiltin.cpp		patch | blob | history
test/CodeGen/aarch64-neon-intrinsics.c		patch | blob | history