From 26c4b495a93b1d3f8bb699f476a7d673eaebc8c3 Mon Sep 17 00:00:00 2001 From: Simon Pilgrim Date: Mon, 7 Sep 2015 20:10:11 +0000 Subject: [PATCH] [X86][SSE4A] Added SSE4A IR + assembly codegen builtin tests git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@246974 91177308-0d34-0410-b5e6-96231b3b80d8 --- test/CodeGen/sse4a-builtins.c | 39 ++++++++++++++++++++++------------- 1 file changed, 25 insertions(+), 14 deletions(-) diff --git a/test/CodeGen/sse4a-builtins.c b/test/CodeGen/sse4a-builtins.c index e1d7e8fb56..5ccbd9243c 100644 --- a/test/CodeGen/sse4a-builtins.c +++ b/test/CodeGen/sse4a-builtins.c @@ -1,39 +1,50 @@ -// RUN: %clang_cc1 -ffreestanding -triple i386-apple-darwin9 -target-cpu pentium4 -target-feature +sse4a -g -emit-llvm %s -o - | FileCheck %s +// REQUIRES: x86-registered-target +// RUN: %clang_cc1 %s -O0 -triple=x86_64-apple-darwin -target-feature +sse4a -emit-llvm -o - -Werror | FileCheck %s +// RUN: %clang_cc1 %s -O0 -triple=x86_64-apple-darwin -target-feature +sse4a -S -o - -Werror | FileCheck %s --check-prefix=CHECK-ASM -#include +// Don't include mm_malloc.h, it's system specific. 
+#define __MM_MALLOC_H + +#include <x86intrin.h> __m128i test_extracti_si64(__m128i x) { + // CHECK-LABEL: test_extracti_si64 + // CHECK: call <2 x i64> @llvm.x86.sse4a.extrqi(<2 x i64> %{{[^,]+}}, i8 3, i8 2) + // CHECK-ASM: extrq $2, $3, %xmm{{.*}} return _mm_extracti_si64(x, 3, 2); -// CHECK: @test_extracti_si64 -// CHECK: @llvm.x86.sse4a.extrqi(<2 x i64> %{{[^,]+}}, i8 3, i8 2) } __m128i test_extract_si64(__m128i x, __m128i y) { + // CHECK-LABEL: test_extract_si64 + // CHECK: call <2 x i64> @llvm.x86.sse4a.extrq(<2 x i64> %{{[^,]+}}, <16 x i8> %{{[^,]+}}) + // CHECK-ASM: extrq %xmm{{.*}}, %xmm{{.*}} return _mm_extract_si64(x, y); -// CHECK: @test_extract_si64 -// CHECK: @llvm.x86.sse4a.extrq(<2 x i64> %{{[^,]+}}, <16 x i8> %{{[^,]+}}) } __m128i test_inserti_si64(__m128i x, __m128i y) { + // CHECK-LABEL: test_inserti_si64 + // CHECK: call <2 x i64> @llvm.x86.sse4a.insertqi(<2 x i64> %{{[^,]+}}, <2 x i64> %{{[^,]+}}, i8 5, i8 6) + // CHECK-ASM: insertq $6, $5, %xmm{{.*}}, %xmm{{.*}} return _mm_inserti_si64(x, y, 5, 6); -// CHECK: @test_inserti_si64 -// CHECK: @llvm.x86.sse4a.insertqi(<2 x i64> %{{[^,]+}}, <2 x i64> %{{[^,]+}}, i8 5, i8 6) } __m128i test_insert_si64(__m128i x, __m128i y) { + // CHECK-LABEL: test_insert_si64 + // CHECK: call <2 x i64> @llvm.x86.sse4a.insertq(<2 x i64> %{{[^,]+}}, <2 x i64> %{{[^,]+}}) + // CHECK-ASM: insertq %xmm{{.*}}, %xmm{{.*}} return _mm_insert_si64(x, y); -// CHECK: @test_insert_si64 -// CHECK: @llvm.x86.sse4a.insertq(<2 x i64> %{{[^,]+}}, <2 x i64> %{{[^,]+}}) } void test_stream_sd(double *p, __m128d a) { + // CHECK-LABEL: test_stream_sd + // CHECK: call void @llvm.x86.sse4a.movnt.sd(i8* %{{[^,]+}}, <2 x double> %{{[^,]+}}) + // CHECK-ASM: movntsd %xmm{{.*}} _mm_stream_sd(p, a); -// CHECK: @test_stream_sd -// CHECK: @llvm.x86.sse4a.movnt.sd(i8* %{{[^,]+}}, <2 x double> %{{[^,]+}}) } void test_stream_ss(float *p, __m128 a) { + // CHECK-LABEL: test_stream_ss + // CHECK: call void @llvm.x86.sse4a.movnt.ss(i8* %{{[^,]+}}, <4 x float> 
%{{[^,]+}}) + // CHECK-ASM: movntss %xmm{{.*}} _mm_stream_ss(p, a); -// CHECK: @test_stream_ss -// CHECK: @llvm.x86.sse4a.movnt.ss(i8* %{{[^,]+}}, <4 x float> %{{[^,]+}}) } -- 2.40.0