Home
last modified time | relevance | path

Searched refs:SSE (Results 1 – 25 of 130) sorted by relevance

123456

/external/llvm/test/CodeGen/X86/
Dvector-idiv.ll2 ; RUN: llc -march=x86-64 -mcpu=core2 < %s | FileCheck %s --check-prefix=SSE
23 ; SSE-LABEL: test1:
24 ; SSE: # BB#0:
25 ; SSE-NEXT: movdqa {{.*#+}} xmm1 = [613566757,613566757,613566757,613566757]
26 ; SSE-NEXT: movdqa %xmm0, %xmm2
27 ; SSE-NEXT: pmuludq %xmm1, %xmm2
28 ; SSE-NEXT: pshufd {{.*#+}} xmm2 = xmm2[1,3,2,3]
29 ; SSE-NEXT: pshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
30 ; SSE-NEXT: pshufd {{.*#+}} xmm3 = xmm0[1,1,3,3]
31 ; SSE-NEXT: pmuludq %xmm1, %xmm3
[all …]
Dsse-scalar-fp-arith.ll1 ; RUN: llc -mcpu=x86-64 -mattr=+sse2 < %s | FileCheck --check-prefix=SSE --check-prefix=SSE2 %s
2 ; RUN: llc -mcpu=x86-64 -mattr=+sse4.1 < %s | FileCheck --check-prefix=SSE --check-prefix=SSE41 %s
8 ; instructions immediately after SSE scalar fp instructions
12 ; SSE-LABEL: test_add_ss:
13 ; SSE: # BB#0:
14 ; SSE-NEXT: addss %xmm1, %xmm0
15 ; SSE-NEXT: retq
29 ; SSE-LABEL: test_sub_ss:
30 ; SSE: # BB#0:
31 ; SSE-NEXT: subss %xmm1, %xmm0
[all …]
Dpreserve_mostcc64.ll1 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=corei7 | FileCheck --check-prefix=SSE %s
7 ;SSE-LABEL: preserve_mostcc1
8 ;SSE: pushq %r10
9 ;SSE-NEXT: pushq %r9
10 ;SSE-NEXT: pushq %r8
11 ;SSE-NEXT: pushq %rdi
12 ;SSE-NEXT: pushq %rsi
13 ;SSE-NEXT: pushq %rdx
14 ;SSE-NEXT: pushq %rcx
15 ;SSE-NEXT: pushq %rax
[all …]
Dpreserve_allcc64.ll1 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=corei7 | FileCheck --check-prefix=SSE %s
6 ;SSE-LABEL: preserve_allcc1
7 ;SSE: pushq %r10
8 ;SSE-NEXT: pushq %r9
9 ;SSE-NEXT: pushq %r8
10 ;SSE-NEXT: pushq %rdi
11 ;SSE-NEXT: pushq %rsi
12 ;SSE-NEXT: pushq %rdx
13 ;SSE-NEXT: pushq %rcx
14 ;SSE-NEXT: pushq %rax
[all …]
Dvector-shuffle-128-v2.ll1 …known-unknown -mcpu=x86-64 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
2 … -mcpu=x86-64 -mattr=+sse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE3
3 …mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3
4 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
12 ; SSE-LABEL: shuffle_v2i64_00:
13 ; SSE: # BB#0:
14 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1]
15 ; SSE-NEXT: retq
30 ; SSE-LABEL: shuffle_v2i64_10:
31 ; SSE: # BB#0:
[all …]
Dcmov-fp.ll1 ; RUN: llc -march x86 -mcpu pentium4 < %s | FileCheck %s -check-prefix=SSE
12 ; SSE-LABEL: test1:
13 ; SSE: movsd
31 ; SSE-LABEL: test2:
32 ; SSE: movsd
49 ; SSE-LABEL: test3:
50 ; SSE: movsd
67 ; SSE-LABEL: test4:
68 ; SSE: movsd
85 ; SSE-LABEL: test5:
[all …]
Drounding-ops.ll1 ; RUN: llc < %s -mtriple=x86_64-apple-macosx -mattr=+sse4.1 | FileCheck -check-prefix=CHECK-SSE %s
8 ; CHECK-SSE-LABEL: test1:
9 ; CHECK-SSE: roundss $1
21 ; CHECK-SSE-LABEL: test2:
22 ; CHECK-SSE: roundsd $1
34 ; CHECK-SSE-LABEL: test3:
35 ; CHECK-SSE: roundss $12
47 ; CHECK-SSE-LABEL: test4:
48 ; CHECK-SSE: roundsd $12
60 ; CHECK-SSE-LABEL: test5:
[all …]
Dlower-vec-shift.ll2 …mtriple=x86_64-unknown-linux-gnu -mcpu=core2 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE
16 ; SSE: psrlw
17 ; SSE-NEXT: psrlw
18 ; SSE-NEXT: movss
33 ; SSE: psrlw
34 ; SSE-NEXT: psrlw
35 ; SSE-NEXT: movsd
50 ; SSE: psrld
51 ; SSE-NEXT: psrld
52 ; SSE-NEXT: movss
[all …]
Dcommute-fcmp.ll1 …N: llc -O3 -mtriple=x86_64-unknown -mcpu=x86-64 -mattr=+sse2 < %s | FileCheck %s --check-prefix=SSE
10 ;SSE-LABEL: commute_cmpps_eq
11 ;SSE: cmpeqps (%rdi), %xmm0
12 ;SSE-NEXT: retq
25 ;SSE-LABEL: commute_cmpps_ne
26 ;SSE: cmpneqps (%rdi), %xmm0
27 ;SSE-NEXT: retq
40 ;SSE-LABEL: commute_cmpps_ord
41 ;SSE: cmpordps (%rdi), %xmm0
42 ;SSE-NEXT: retq
[all …]
Dbreak-false-dep.ll1 ; RUN: llc < %s -mtriple=x86_64-linux -mattr=+sse2 -mcpu=nehalem | FileCheck %s --check-prefix=SSE
2 ; RUN: llc < %s -mtriple=x86_64-win32 -mattr=+sse2 -mcpu=nehalem | FileCheck %s --check-prefix=SSE
7 ; SSE-LABEL: t1:
8 ; SSE: movss ([[A0:%rdi|%rcx]]), %xmm0
9 ; SSE: cvtss2sd %xmm0, %xmm0
18 ; SSE-LABEL: t2:
19 ; SSE: cvtsd2ss ([[A0]]), %xmm0
27 ; SSE-LABEL: squirtf:
28 ; SSE: movss ([[A0]]), %xmm0
29 ; SSE: sqrtss %xmm0, %xmm0
[all …]
Dvec_uint_to_fp.ll1 ; RUN: llc < %s -mtriple=x86_64-apple-macosx | FileCheck --check-prefix=CHECK --check-prefix=SSE --…
7 ; SSE: [[MASKCSTADDR:LCPI0_[0-9]+]]:
8 ; SSE-NEXT: .long 65535 ## 0xffff
9 ; SSE-NEXT: .long 65535 ## 0xffff
10 ; SSE-NEXT: .long 65535 ## 0xffff
11 ; SSE-NEXT: .long 65535 ## 0xffff
43 ; SSE: movdqa [[MASKCSTADDR]](%rip), [[MASK:%xmm[0-9]+]]
44 ; SSE-NEXT: pand %xmm0, [[MASK]]
47 ; SSE-NEXT: por [[LOWCSTADDR]](%rip), [[MASK]]
48 ; SSE-NEXT: psrld $16, %xmm0
[all …]
Dexedeps-movq.ll1 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=sse2 | FileCheck %s --check-prefix=SSE
13 ; SSE-LABEL: store_floats:
14 ; SSE: # BB#0:
15 ; SSE-NEXT: addps %xmm0, %xmm0
16 ; SSE-NEXT: movlps %xmm0, (%rdi)
17 ; SSE-NEXT: retq
37 ; SSE-LABEL: store_double:
38 ; SSE: # BB#0:
39 ; SSE-NEXT: addpd %xmm0, %xmm0
40 ; SSE-NEXT: movlpd %xmm0, (%rdi)
[all …]
Dcommute-clmul.ll1 …O3 -mtriple=x86_64-unknown -mcpu=x86-64 -mattr=+sse2,+pclmul < %s | FileCheck %s --check-prefix=SSE
7 ;SSE-LABEL: commute_lq_lq
8 ;SSE: pclmulqdq $0, (%rdi), %xmm0
9 ;SSE-NEXT: retq
21 ;SSE-LABEL: commute_lq_hq
22 ;SSE: pclmulqdq $1, (%rdi), %xmm0
23 ;SSE-NEXT: retq
35 ;SSE-LABEL: commute_hq_lq
36 ;SSE: pclmulqdq $16, (%rdi), %xmm0
37 ;SSE-NEXT: retq
[all …]
Dvector-zmov.ll1 …_64-unknown-unknown -mcpu=x86-64 -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2
2 …4-unknown-unknown -mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=SSE --check-prefix=SSSE3
3 …-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
8 ; SSE-LABEL: load_zmov_4i32_to_0zzz:
9 ; SSE: # BB#0: # %entry
10 ; SSE-NEXT: movd (%rdi), %xmm0
11 ; SSE-NEXT: retq
24 ; SSE-LABEL: load_zmov_2i64_to_0z:
25 ; SSE: # BB#0: # %entry
26 ; SSE-NEXT: movq (%rdi), %xmm0
[all …]
Dfast-isel-vecload.ll1 …riple=x86_64-unknown-unknown -mattr=+sse2 < %s | FileCheck %s --check-prefix=SSE --check-prefix=ALL
9 ; SSE: movdqa (%rdi), %xmm0
19 ; SSE: movdqa (%rdi), %xmm0
29 ; SSE: movdqa (%rdi), %xmm0
39 ; SSE: movdqa (%rdi), %xmm0
49 ; SSE: movdqu (%rdi), %xmm0
59 ; SSE: movdqu (%rdi), %xmm0
69 ; SSE: movdqu (%rdi), %xmm0
79 ; SSE: movdqu (%rdi), %xmm0
89 ; SSE: movaps (%rdi), %xmm0
[all …]
Dvector-shuffle-128-v8.ll1 …known-unknown -mcpu=x86-64 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
2 …mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3
3 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
11 ; SSE-LABEL: shuffle_v8i16_01012323:
12 ; SSE: # BB#0:
13 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,0,1,1]
14 ; SSE-NEXT: retq
24 ; SSE-LABEL: shuffle_v8i16_67452301:
25 ; SSE: # BB#0:
26 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[3,2,1,0]
[all …]
Dvector-shuffle-128-v4.ll1 …known-unknown -mcpu=x86-64 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
2 … -mcpu=x86-64 -mattr=+sse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE3
3 …mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3
4 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
12 ; SSE-LABEL: shuffle_v4i32_0001:
13 ; SSE: # BB#0:
14 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,0,0,1]
15 ; SSE-NEXT: retq
25 ; SSE-LABEL: shuffle_v4i32_0020:
26 ; SSE: # BB#0:
[all …]
Dvector-shuffle-combining.ll1 ; RUN: llc < %s -mcpu=x86-64 -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --ch…
2 ; RUN: llc < %s -mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --c…
3 ; RUN: llc < %s -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --…
55 ; SSE-LABEL: combine_pshufd4:
56 ; SSE: # BB#0: # %entry
57 ; SSE-NEXT: pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,7,6,5,4]
58 ; SSE-NEXT: retq
74 ; SSE-LABEL: combine_pshufd5:
75 ; SSE: # BB#0: # %entry
76 ; SSE-NEXT: pshuflw {{.*#+}} xmm0 = xmm0[3,2,1,0,4,5,6,7]
[all …]
Dfold-vex.ll6 …< %s -mtriple=x86_64-unknown-unknown -mattr=-avx | FileCheck %s --check-prefix=SSE
7 …< %s -mtriple=x86_64-unknown-unknown -mcpu=corei7-avx -mattr=-avx | FileCheck %s --check-prefix=SSE
8 …< %s -mtriple=x86_64-unknown-unknown -mcpu=btver2 -mattr=-avx | FileCheck %s --check-prefix=SSE
13 ; With SSE, folding memory operands into math/logic ops requires 16-byte alignment
26 ; SSE-LABEL: @test1
27 ; SSE: movups (%rdi), %xmm1
28 ; SSE-NEXT: andps %xmm1, %xmm0
29 ; SSE-NEXT: ret
Dfast-isel-sse12-fptoint.ll1 …6_64-apple-darwin -mattr=-avx,+sse2 -fast-isel -fast-isel-abort=1 | FileCheck %s --check-prefix=SSE
5 ; SSE-LABEL: cvt_test1
6 ; SSE: cvttss2si %xmm0, %eax
19 ; SSE-LABEL: cvt_test2
20 ; SSE: cvttss2si %xmm0, %rax
33 ; SSE-LABEL: cvt_test3
34 ; SSE: cvttsd2si %xmm0, %eax
45 ; SSE-LABEL: cvt_test4
46 ; SSE: cvttsd2si %xmm0, %rax
Dvec_shift6.ll1 …mtriple=x86_64-unknown-linux-gnu -mattr=sse4.1 | FileCheck %s -check-prefix=CHECK -check-prefix=SSE
38 ; SSE: pmulld
49 ; SSE: pmulld
63 ; SSE: pmullw
64 ; SSE-NEXT: pmullw
79 ; SSE: pmulld
80 ; SSE-NEXT: pmulld
94 ; SSE: pmullw
95 ; SSE-NEXT: pmullw
96 ; SSE-NEXT: pmullw
[all …]
Dsse3-avx-addsub.ll1 ; RUN: llc < %s -march=x86-64 -mcpu=core2 | FileCheck %s -check-prefix=SSE -check-prefix=CHECK
44 ; SSE: addsubps
56 ; SSE: addsubps
57 ; SSE-NEXT: addsubps
70 ; SSE: addsubpd
71 ; SSE: addsubpd
84 ; SSE: addsubpd
97 ; SSE: addsubps
110 ; SSE: addsubps
111 ; SSE-NEXT: addsubps
[all …]
Danyregcc.ll2 …%s -mtriple=x86_64-apple-darwin -mcpu=corei7 -disable-fp-elim | FileCheck --check-prefix=SSE %s
370 ;SSE-LABEL: anyregcc1
371 ;SSE: pushq %rbp
372 ;SSE: pushq %rax
373 ;SSE: pushq %r15
374 ;SSE: pushq %r14
375 ;SSE: pushq %r13
376 ;SSE: pushq %r12
377 ;SSE: pushq %r11
378 ;SSE: pushq %r10
[all …]
Dsplat-const.ll1 ; RUN: llc < %s -mcpu=penryn | FileCheck %s --check-prefix=SSE
9 ; SSE-LABEL: zero_vector:
10 ; SSE: xorps %xmm0, %xmm0
11 ; SSE-NEXT: retq
28 ; SSE-LABEL: const_vector:
29 ; SSE: movaps {{.*}}, %xmm0 # xmm0 = [42,42,42,42]
30 ; SSE-NEXT: retq
Dnontemporal-2.ll1 …s -mtriple=x86_64-unknown-unknown -mcpu=corei7 | FileCheck %s -check-prefix=CHECK -check-prefix=SSE
10 ; SSE: movntps
18 ; SSE: movntps
26 ; SSE: movntps
34 ; SSE: movntps
42 ; SSE: movntps
50 ; SSE: movntps
105 ; SSE: movntps
113 ; SSE: movntps
121 ; SSE: movntps
[all …]

123456