1 // RUN: %clang_cc1 %s -O3 -triple=x86_64-apple-darwin -target-feature +avx -emit-llvm -o - | FileCheck %s
2
3 // Don't include mm_malloc.h, it's system specific.
4 #define __MM_MALLOC_H
5
6 #include <immintrin.h>
7
8 //
9 // Test LLVM IR codegen of cmpXY instructions
10 //
11
__m128d test_cmp_pd(__m128d a, __m128d b) {
  // Packed double-precision compare with the _CMP_GE_OS predicate. The
  // directive below requires the predicate to reach the LLVM IR intrinsic
  // call as the immediate operand `i8 13`.
  // CHECK: @llvm.x86.sse2.cmp.pd({{.*}}, i8 13)
  const __m128d result = _mm_cmp_pd(a, b, _CMP_GE_OS);
  return result;
}
17
// Returns __m128 (the type produced by _mm_cmp_ps) so the test does not rely
// on implicit lax vector conversions between float and double vectors.
__m128 test_cmp_ps(__m128 a, __m128 b) {
  // Packed single-precision compare with the _CMP_GE_OS predicate. The
  // directive below requires the predicate to reach the LLVM IR intrinsic
  // call as the immediate operand `i8 13`.
  // CHECK: @llvm.x86.sse.cmp.ps({{.*}}, i8 13)
  return _mm_cmp_ps(a, b, _CMP_GE_OS);
}
23
__m256d test_cmp_pd256(__m256d a, __m256d b) {
  // 256-bit packed double-precision compare with the _CMP_GE_OS predicate.
  // The directive below requires the predicate to reach the LLVM IR
  // intrinsic call as the immediate operand `i8 13`.
  // CHECK: @llvm.x86.avx.cmp.pd.256({{.*}}, i8 13)
  const __m256d result = _mm256_cmp_pd(a, b, _CMP_GE_OS);
  return result;
}
29
// Returns __m256 (the type produced by _mm256_cmp_ps) so the test does not
// rely on implicit lax vector conversions between float and double vectors.
__m256 test_cmp_ps256(__m256 a, __m256 b) {
  // 256-bit packed single-precision compare with the _CMP_GE_OS predicate.
  // The directive below requires the predicate to reach the LLVM IR
  // intrinsic call as the immediate operand `i8 13`.
  // CHECK: @llvm.x86.avx.cmp.ps.256({{.*}}, i8 13)
  return _mm256_cmp_ps(a, b, _CMP_GE_OS);
}
35
__m128d test_cmp_sd(__m128d a, __m128d b) {
  // Scalar double-precision compare with the _CMP_GE_OS predicate. The
  // directive below requires the predicate to reach the LLVM IR intrinsic
  // call as the immediate operand `i8 13`.
  // CHECK: @llvm.x86.sse2.cmp.sd({{.*}}, i8 13)
  const __m128d result = _mm_cmp_sd(a, b, _CMP_GE_OS);
  return result;
}
41
// Returns __m128 (the type produced by _mm_cmp_ss) so the test does not rely
// on implicit lax vector conversions between float and double vectors.
__m128 test_cmp_ss(__m128 a, __m128 b) {
  // Scalar single-precision compare with the _CMP_GE_OS predicate. The
  // directive below requires the predicate to reach the LLVM IR intrinsic
  // call as the immediate operand `i8 13`.
  // CHECK: @llvm.x86.sse.cmp.ss({{.*}}, i8 13)
  return _mm_cmp_ss(a, b, _CMP_GE_OS);
}
47
__m128 test_cmpgt_ss(__m128 a, __m128 b) {
  // Scalar single-precision greater-than. The directives below expect the
  // sse.cmp.ss intrinsic with immediate 1, followed by a shufflevector whose
  // mask <4, 1, 2, 3> takes lane 0 from its second operand and lanes 1-3
  // from its first operand.
  // CHECK: @llvm.x86.sse.cmp.ss({{.*}}, i8 1)
  // CHECK: shufflevector <{{.*}}, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
  const __m128 result = _mm_cmpgt_ss(a, b);
  return result;
}
53
__m128 test_cmpge_ss(__m128 a, __m128 b) {
  // Scalar single-precision greater-or-equal. The directives below expect
  // the sse.cmp.ss intrinsic with immediate 2, followed by a shufflevector
  // whose mask <4, 1, 2, 3> takes lane 0 from its second operand and lanes
  // 1-3 from its first operand.
  // CHECK: @llvm.x86.sse.cmp.ss({{.*}}, i8 2)
  // CHECK: shufflevector <{{.*}}, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
  const __m128 result = _mm_cmpge_ss(a, b);
  return result;
}
59
__m128 test_cmpngt_ss(__m128 a, __m128 b) {
  // Scalar single-precision not-greater-than. The directives below expect
  // the sse.cmp.ss intrinsic with immediate 5, followed by a shufflevector
  // whose mask <4, 1, 2, 3> takes lane 0 from its second operand and lanes
  // 1-3 from its first operand.
  // CHECK: @llvm.x86.sse.cmp.ss({{.*}}, i8 5)
  // CHECK: shufflevector <{{.*}}, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
  const __m128 result = _mm_cmpngt_ss(a, b);
  return result;
}
65
__m128 test_cmpnge_ss(__m128 a, __m128 b) {
  // Scalar single-precision not-greater-or-equal. The directives below
  // expect the sse.cmp.ss intrinsic with immediate 6, followed by a
  // shufflevector whose mask <4, 1, 2, 3> takes lane 0 from its second
  // operand and lanes 1-3 from its first operand.
  // CHECK: @llvm.x86.sse.cmp.ss({{.*}}, i8 6)
  // CHECK: shufflevector <{{.*}}, <4 x i32> <i32 4, i32 1, i32 2, i32 3>
  const __m128 result = _mm_cmpnge_ss(a, b);
  return result;
}
71
__m128d test_cmpgt_sd(__m128d a, __m128d b) {
  // Scalar double-precision greater-than. The directives below expect the
  // sse2.cmp.sd intrinsic with immediate 1, followed by a shufflevector
  // whose mask <0, 3> takes lane 0 from its first operand and lane 1 from
  // its second operand.
  // CHECK: @llvm.x86.sse2.cmp.sd({{.*}}, i8 1)
  // CHECK: shufflevector <{{.*}}, <2 x i32> <i32 0, i32 3>
  const __m128d result = _mm_cmpgt_sd(a, b);
  return result;
}
77
__m128d test_cmpge_sd(__m128d a, __m128d b) {
  // Scalar double-precision greater-or-equal. The directives below expect
  // the sse2.cmp.sd intrinsic with immediate 2, followed by a shufflevector
  // whose mask <0, 3> takes lane 0 from its first operand and lane 1 from
  // its second operand.
  // CHECK: @llvm.x86.sse2.cmp.sd({{.*}}, i8 2)
  // CHECK: shufflevector <{{.*}}, <2 x i32> <i32 0, i32 3>
  const __m128d result = _mm_cmpge_sd(a, b);
  return result;
}
83
__m128d test_cmpngt_sd(__m128d a, __m128d b) {
  // Scalar double-precision not-greater-than. The directives below expect
  // the sse2.cmp.sd intrinsic with immediate 5, followed by a shufflevector
  // whose mask <0, 3> takes lane 0 from its first operand and lane 1 from
  // its second operand.
  // CHECK: @llvm.x86.sse2.cmp.sd({{.*}}, i8 5)
  // CHECK: shufflevector <{{.*}}, <2 x i32> <i32 0, i32 3>
  const __m128d result = _mm_cmpngt_sd(a, b);
  return result;
}
89
__m128d test_cmpnge_sd(__m128d a, __m128d b) {
  // Scalar double-precision not-greater-or-equal. The directives below
  // expect the sse2.cmp.sd intrinsic with immediate 6, followed by a
  // shufflevector whose mask <0, 3> takes lane 0 from its first operand and
  // lane 1 from its second operand.
  // CHECK: @llvm.x86.sse2.cmp.sd({{.*}}, i8 6)
  // CHECK: shufflevector <{{.*}}, <2 x i32> <i32 0, i32 3>
  const __m128d result = _mm_cmpnge_sd(a, b);
  return result;
}
95