Searched refs:SSE (Results 1 – 25 of 130) sorted by relevance
123456
/external/llvm/test/CodeGen/X86/ |
D | vector-idiv.ll | 2 ; RUN: llc -march=x86-64 -mcpu=core2 < %s | FileCheck %s --check-prefix=SSE 23 ; SSE-LABEL: test1: 24 ; SSE: # BB#0: 25 ; SSE-NEXT: movdqa {{.*#+}} xmm1 = [613566757,613566757,613566757,613566757] 26 ; SSE-NEXT: movdqa %xmm0, %xmm2 27 ; SSE-NEXT: pmuludq %xmm1, %xmm2 28 ; SSE-NEXT: pshufd {{.*#+}} xmm2 = xmm2[1,3,2,3] 29 ; SSE-NEXT: pshufd {{.*#+}} xmm1 = xmm1[1,1,3,3] 30 ; SSE-NEXT: pshufd {{.*#+}} xmm3 = xmm0[1,1,3,3] 31 ; SSE-NEXT: pmuludq %xmm1, %xmm3 [all …]
|
D | sse-scalar-fp-arith.ll | 1 ; RUN: llc -mcpu=x86-64 -mattr=+sse2 < %s | FileCheck --check-prefix=SSE --check-prefix=SSE2 %s 2 ; RUN: llc -mcpu=x86-64 -mattr=+sse4.1 < %s | FileCheck --check-prefix=SSE --check-prefix=SSE41 %s 8 ; instructions immediately after SSE scalar fp instructions 12 ; SSE-LABEL: test_add_ss: 13 ; SSE: # BB#0: 14 ; SSE-NEXT: addss %xmm1, %xmm0 15 ; SSE-NEXT: retq 29 ; SSE-LABEL: test_sub_ss: 30 ; SSE: # BB#0: 31 ; SSE-NEXT: subss %xmm1, %xmm0 [all …]
|
D | preserve_mostcc64.ll | 1 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=corei7 | FileCheck --check-prefix=SSE %s 7 ;SSE-LABEL: preserve_mostcc1 8 ;SSE: pushq %r10 9 ;SSE-NEXT: pushq %r9 10 ;SSE-NEXT: pushq %r8 11 ;SSE-NEXT: pushq %rdi 12 ;SSE-NEXT: pushq %rsi 13 ;SSE-NEXT: pushq %rdx 14 ;SSE-NEXT: pushq %rcx 15 ;SSE-NEXT: pushq %rax [all …]
|
D | preserve_allcc64.ll | 1 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mcpu=corei7 | FileCheck --check-prefix=SSE %s 6 ;SSE-LABEL: preserve_allcc1 7 ;SSE: pushq %r10 8 ;SSE-NEXT: pushq %r9 9 ;SSE-NEXT: pushq %r8 10 ;SSE-NEXT: pushq %rdi 11 ;SSE-NEXT: pushq %rsi 12 ;SSE-NEXT: pushq %rdx 13 ;SSE-NEXT: pushq %rcx 14 ;SSE-NEXT: pushq %rax [all …]
|
D | vector-shuffle-128-v2.ll | 1 …known-unknown -mcpu=x86-64 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 2 … -mcpu=x86-64 -mattr=+sse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE3 3 …mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3 4 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41 12 ; SSE-LABEL: shuffle_v2i64_00: 13 ; SSE: # BB#0: 14 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,0,1] 15 ; SSE-NEXT: retq 30 ; SSE-LABEL: shuffle_v2i64_10: 31 ; SSE: # BB#0: [all …]
|
D | cmov-fp.ll | 1 ; RUN: llc -march x86 -mcpu pentium4 < %s | FileCheck %s -check-prefix=SSE 12 ; SSE-LABEL: test1: 13 ; SSE: movsd 31 ; SSE-LABEL: test2: 32 ; SSE: movsd 49 ; SSE-LABEL: test3: 50 ; SSE: movsd 67 ; SSE-LABEL: test4: 68 ; SSE: movsd 85 ; SSE-LABEL: test5: [all …]
|
D | rounding-ops.ll | 1 ; RUN: llc < %s -mtriple=x86_64-apple-macosx -mattr=+sse4.1 | FileCheck -check-prefix=CHECK-SSE %s 8 ; CHECK-SSE-LABEL: test1: 9 ; CHECK-SSE: roundss $1 21 ; CHECK-SSE-LABEL: test2: 22 ; CHECK-SSE: roundsd $1 34 ; CHECK-SSE-LABEL: test3: 35 ; CHECK-SSE: roundss $12 47 ; CHECK-SSE-LABEL: test4: 48 ; CHECK-SSE: roundsd $12 60 ; CHECK-SSE-LABEL: test5: [all …]
|
D | lower-vec-shift.ll | 2 …mtriple=x86_64-unknown-linux-gnu -mcpu=core2 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE 16 ; SSE: psrlw 17 ; SSE-NEXT: psrlw 18 ; SSE-NEXT: movss 33 ; SSE: psrlw 34 ; SSE-NEXT: psrlw 35 ; SSE-NEXT: movsd 50 ; SSE: psrld 51 ; SSE-NEXT: psrld 52 ; SSE-NEXT: movss [all …]
|
D | commute-fcmp.ll | 1 …N: llc -O3 -mtriple=x86_64-unknown -mcpu=x86-64 -mattr=+sse2 < %s | FileCheck %s --check-prefix=SSE 10 ;SSE-LABEL: commute_cmpps_eq 11 ;SSE: cmpeqps (%rdi), %xmm0 12 ;SSE-NEXT: retq 25 ;SSE-LABEL: commute_cmpps_ne 26 ;SSE: cmpneqps (%rdi), %xmm0 27 ;SSE-NEXT: retq 40 ;SSE-LABEL: commute_cmpps_ord 41 ;SSE: cmpordps (%rdi), %xmm0 42 ;SSE-NEXT: retq [all …]
|
D | break-false-dep.ll | 1 ; RUN: llc < %s -mtriple=x86_64-linux -mattr=+sse2 -mcpu=nehalem | FileCheck %s --check-prefix=SSE 2 ; RUN: llc < %s -mtriple=x86_64-win32 -mattr=+sse2 -mcpu=nehalem | FileCheck %s --check-prefix=SSE 7 ; SSE-LABEL: t1: 8 ; SSE: movss ([[A0:%rdi|%rcx]]), %xmm0 9 ; SSE: cvtss2sd %xmm0, %xmm0 18 ; SSE-LABEL: t2: 19 ; SSE: cvtsd2ss ([[A0]]), %xmm0 27 ; SSE-LABEL: squirtf: 28 ; SSE: movss ([[A0]]), %xmm0 29 ; SSE: sqrtss %xmm0, %xmm0 [all …]
|
D | vec_uint_to_fp.ll | 1 ; RUN: llc < %s -mtriple=x86_64-apple-macosx | FileCheck --check-prefix=CHECK --check-prefix=SSE --… 7 ; SSE: [[MASKCSTADDR:LCPI0_[0-9]+]]: 8 ; SSE-NEXT: .long 65535 ## 0xffff 9 ; SSE-NEXT: .long 65535 ## 0xffff 10 ; SSE-NEXT: .long 65535 ## 0xffff 11 ; SSE-NEXT: .long 65535 ## 0xffff 43 ; SSE: movdqa [[MASKCSTADDR]](%rip), [[MASK:%xmm[0-9]+]] 44 ; SSE-NEXT: pand %xmm0, [[MASK]] 47 ; SSE-NEXT: por [[LOWCSTADDR]](%rip), [[MASK]] 48 ; SSE-NEXT: psrld $16, %xmm0 [all …]
|
D | exedeps-movq.ll | 1 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=sse2 | FileCheck %s --check-prefix=SSE 13 ; SSE-LABEL: store_floats: 14 ; SSE: # BB#0: 15 ; SSE-NEXT: addps %xmm0, %xmm0 16 ; SSE-NEXT: movlps %xmm0, (%rdi) 17 ; SSE-NEXT: retq 37 ; SSE-LABEL: store_double: 38 ; SSE: # BB#0: 39 ; SSE-NEXT: addpd %xmm0, %xmm0 40 ; SSE-NEXT: movlpd %xmm0, (%rdi) [all …]
|
D | commute-clmul.ll | 1 …O3 -mtriple=x86_64-unknown -mcpu=x86-64 -mattr=+sse2,+pclmul < %s | FileCheck %s --check-prefix=SSE 7 ;SSE-LABEL: commute_lq_lq 8 ;SSE: pclmulqdq $0, (%rdi), %xmm0 9 ;SSE-NEXT: retq 21 ;SSE-LABEL: commute_lq_hq 22 ;SSE: pclmulqdq $1, (%rdi), %xmm0 23 ;SSE-NEXT: retq 35 ;SSE-LABEL: commute_hq_lq 36 ;SSE: pclmulqdq $16, (%rdi), %xmm0 37 ;SSE-NEXT: retq [all …]
|
D | vector-zmov.ll | 1 …_64-unknown-unknown -mcpu=x86-64 -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2 2 …4-unknown-unknown -mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=SSE --check-prefix=SSSE3 3 …-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41 8 ; SSE-LABEL: load_zmov_4i32_to_0zzz: 9 ; SSE: # BB#0: # %entry 10 ; SSE-NEXT: movd (%rdi), %xmm0 11 ; SSE-NEXT: retq 24 ; SSE-LABEL: load_zmov_2i64_to_0z: 25 ; SSE: # BB#0: # %entry 26 ; SSE-NEXT: movq (%rdi), %xmm0 [all …]
|
D | fast-isel-vecload.ll | 1 …riple=x86_64-unknown-unknown -mattr=+sse2 < %s | FileCheck %s --check-prefix=SSE --check-prefix=ALL 9 ; SSE: movdqa (%rdi), %xmm0 19 ; SSE: movdqa (%rdi), %xmm0 29 ; SSE: movdqa (%rdi), %xmm0 39 ; SSE: movdqa (%rdi), %xmm0 49 ; SSE: movdqu (%rdi), %xmm0 59 ; SSE: movdqu (%rdi), %xmm0 69 ; SSE: movdqu (%rdi), %xmm0 79 ; SSE: movdqu (%rdi), %xmm0 89 ; SSE: movaps (%rdi), %xmm0 [all …]
|
D | vector-shuffle-128-v8.ll | 1 …known-unknown -mcpu=x86-64 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 2 …mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3 3 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41 11 ; SSE-LABEL: shuffle_v8i16_01012323: 12 ; SSE: # BB#0: 13 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,0,1,1] 14 ; SSE-NEXT: retq 24 ; SSE-LABEL: shuffle_v8i16_67452301: 25 ; SSE: # BB#0: 26 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[3,2,1,0] [all …]
|
D | vector-shuffle-128-v4.ll | 1 …known-unknown -mcpu=x86-64 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 2 … -mcpu=x86-64 -mattr=+sse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE3 3 …mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSSE3 4 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41 12 ; SSE-LABEL: shuffle_v4i32_0001: 13 ; SSE: # BB#0: 14 ; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,0,0,1] 15 ; SSE-NEXT: retq 25 ; SSE-LABEL: shuffle_v4i32_0020: 26 ; SSE: # BB#0: [all …]
|
D | vector-shuffle-combining.ll | 1 ; RUN: llc < %s -mcpu=x86-64 -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --ch… 2 ; RUN: llc < %s -mcpu=x86-64 -mattr=+ssse3 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --c… 3 ; RUN: llc < %s -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --… 55 ; SSE-LABEL: combine_pshufd4: 56 ; SSE: # BB#0: # %entry 57 ; SSE-NEXT: pshufhw {{.*#+}} xmm0 = xmm0[0,1,2,3,7,6,5,4] 58 ; SSE-NEXT: retq 74 ; SSE-LABEL: combine_pshufd5: 75 ; SSE: # BB#0: # %entry 76 ; SSE-NEXT: pshuflw {{.*#+}} xmm0 = xmm0[3,2,1,0,4,5,6,7] [all …]
|
D | fold-vex.ll | 6 …< %s -mtriple=x86_64-unknown-unknown -mattr=-avx | FileCheck %s --check-prefix=SSE 7 …< %s -mtriple=x86_64-unknown-unknown -mcpu=corei7-avx -mattr=-avx | FileCheck %s --check-prefix=SSE 8 …< %s -mtriple=x86_64-unknown-unknown -mcpu=btver2 -mattr=-avx | FileCheck %s --check-prefix=SSE 13 ; With SSE, folding memory operands into math/logic ops requires 16-byte alignment 26 ; SSE-LABEL: @test1 27 ; SSE: movups (%rdi), %xmm1 28 ; SSE-NEXT: andps %xmm1, %xmm0 29 ; SSE-NEXT: ret
|
D | fast-isel-sse12-fptoint.ll | 1 …6_64-apple-darwin -mattr=-avx,+sse2 -fast-isel -fast-isel-abort=1 | FileCheck %s --check-prefix=SSE 5 ; SSE-LABEL: cvt_test1 6 ; SSE: cvttss2si %xmm0, %eax 19 ; SSE-LABEL: cvt_test2 20 ; SSE: cvttss2si %xmm0, %rax 33 ; SSE-LABEL: cvt_test3 34 ; SSE: cvttsd2si %xmm0, %eax 45 ; SSE-LABEL: cvt_test4 46 ; SSE: cvttsd2si %xmm0, %rax
|
D | vec_shift6.ll | 1 …mtriple=x86_64-unknown-linux-gnu -mattr=sse4.1 | FileCheck %s -check-prefix=CHECK -check-prefix=SSE 38 ; SSE: pmulld 49 ; SSE: pmulld 63 ; SSE: pmullw 64 ; SSE-NEXT: pmullw 79 ; SSE: pmulld 80 ; SSE-NEXT: pmulld 94 ; SSE: pmullw 95 ; SSE-NEXT: pmullw 96 ; SSE-NEXT: pmullw [all …]
|
D | sse3-avx-addsub.ll | 1 ; RUN: llc < %s -march=x86-64 -mcpu=core2 | FileCheck %s -check-prefix=SSE -check-prefix=CHECK 44 ; SSE: addsubps 56 ; SSE: addsubps 57 ; SSE-NEXT: addsubps 70 ; SSE: addsubpd 71 ; SSE: addsubpd 84 ; SSE: addsubpd 97 ; SSE: addsubps 110 ; SSE: addsubps 111 ; SSE-NEXT: addsubps [all …]
|
D | anyregcc.ll | 2 …%s -mtriple=x86_64-apple-darwin -mcpu=corei7 -disable-fp-elim | FileCheck --check-prefix=SSE %s 370 ;SSE-LABEL: anyregcc1 371 ;SSE: pushq %rbp 372 ;SSE: pushq %rax 373 ;SSE: pushq %r15 374 ;SSE: pushq %r14 375 ;SSE: pushq %r13 376 ;SSE: pushq %r12 377 ;SSE: pushq %r11 378 ;SSE: pushq %r10 [all …]
|
D | splat-const.ll | 1 ; RUN: llc < %s -mcpu=penryn | FileCheck %s --check-prefix=SSE 9 ; SSE-LABEL: zero_vector: 10 ; SSE: xorps %xmm0, %xmm0 11 ; SSE-NEXT: retq 28 ; SSE-LABEL: const_vector: 29 ; SSE: movaps {{.*}}, %xmm0 # xmm0 = [42,42,42,42] 30 ; SSE-NEXT: retq
|
D | nontemporal-2.ll | 1 …s -mtriple=x86_64-unknown-unknown -mcpu=corei7 | FileCheck %s -check-prefix=CHECK -check-prefix=SSE 10 ; SSE: movntps 18 ; SSE: movntps 26 ; SSE: movntps 34 ; SSE: movntps 42 ; SSE: movntps 50 ; SSE: movntps 105 ; SSE: movntps 113 ; SSE: movntps 121 ; SSE: movntps [all …]
|
123456