pass argument vectors in a type that corresponds to the user type if

author Chris Lattner <sabre@nondot.org>

Wed, 28 Jul 2010 23:47:21 +0000 (23:47 +0000)

committer Chris Lattner <sabre@nondot.org>

Wed, 28 Jul 2010 23:47:21 +0000 (23:47 +0000)
author Chris Lattner <sabre@nondot.org>
Wed, 28 Jul 2010 23:47:21 +0000 (23:47 +0000)
committer Chris Lattner <sabre@nondot.org>
Wed, 28 Jul 2010 23:47:21 +0000 (23:47 +0000)
diff --git a/lib/CodeGen/TargetInfo.cpp b/lib/CodeGen/TargetInfo.cpp

index 613e2f62819ae3f32c81f632cf95668e3b7e031c..fc5e91fb7d0727445601f3633bdf54eb91e3c154 100644 (file)
--- a/lib/CodeGen/TargetInfo.cpp
+++ b/lib/CodeGen/TargetInfo.cpp
@@ -1432,10 +1432,22 @@ ABIArgInfo X86_64ABIInfo::classifyArgumentType(QualType Ty,
  
      // AMD64-ABI 3.2.3p3: Rule 4. If the class is SSEUP, the
      // eightbyte is passed in the upper half of the last used SSE
-    // register.
+    // register.  This only happens when 128-bit vectors are passed. 
    case SSEUp:
-    assert(Lo == SSE && "Unexpected SSEUp classification.");
+    assert(Lo == SSE && "Unexpected SSEUp classification");
      ResType = llvm::VectorType::get(llvm::Type::getDoubleTy(VMContext), 2);
+      
+    // If the preferred type is a 16-byte vector, prefer to pass it.
+    if (const llvm::VectorType *VT =
+          dyn_cast_or_null<llvm::VectorType>(PrefType)) {
+      const llvm::Type *EltTy = VT->getElementType();
+      if (VT->getBitWidth() == 128 &&
+          (EltTy->isFloatTy() || EltTy->isDoubleTy() ||
+           EltTy->isIntegerTy(8) || EltTy->isIntegerTy(16) ||
+           EltTy->isIntegerTy(32) || EltTy->isIntegerTy(64) ||
+           EltTy->isIntegerTy(128)))
+        ResType = PrefType;
+    }
      break;
    }
  
diff --git a/test/CodeGen/x86_64-arguments.c b/test/CodeGen/x86_64-arguments.c

index 1b7967d0de716afc0c03979235222e58496814d8..b4500d6de691cca6b9485d15d35287284eb7248d 100644 (file)
--- a/test/CodeGen/x86_64-arguments.c
+++ b/test/CodeGen/x86_64-arguments.c
@@ -152,3 +152,11 @@ struct f23S f24(struct f23S *X, struct f24s *P2) {
    // CHECK: define %struct.f24s @f24(%struct.f23S* %X, %struct.f24s* %P2)
  }
  
+typedef float v4f32 __attribute__((__vector_size__(16)));
+
+v4f32 f25(v4f32 X) {
+  // CHECK: define <2 x double> @f25(<4 x float> %X.coerce)
+  return X+X;
+}
+
+
author	Chris Lattner <sabre@nondot.org>
	Wed, 28 Jul 2010 23:47:21 +0000 (23:47 +0000)
committer	Chris Lattner <sabre@nondot.org>
	Wed, 28 Jul 2010 23:47:21 +0000 (23:47 +0000)
lib/CodeGen/TargetInfo.cpp		patch \| blob \| history
test/CodeGen/x86_64-arguments.c		patch \| blob \| history