/external/llvm/test/CodeGen/X86/ |
D | vector-shuffle-sse1.ll | 9 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,0,1] 17 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,0] 25 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,3,0,0] 33 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,0,0] 41 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,2,0,0] 49 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,3,3,0] 57 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,2,1,0] 81 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,2] 89 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,3,3] 110 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[0,0] [all …]
|
D | vector-shuffle-128-v4.ll | 134 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,0,1] 147 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,0] 160 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,3,0,0] 173 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,0,0] 186 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,2,0,0] 199 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,3,3,0] 212 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,2,1,0] 251 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,2] 279 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,3,3] 308 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] [all …]
|
D | vector-blend.ll | 12 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[1,3] 13 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2,1,3] 18 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[1,3] 19 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2,1,3] 66 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[3,0] 67 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 72 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[3,0] 73 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 98 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,0],xmm0[0,0] 99 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[2,3] [all …]
|
D | swizzle-2.ll | 155 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,3,2] 165 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,1,3,0] 175 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,3,2] 185 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,0,2] 205 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,0,1,3] 215 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2,3,1] 225 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,3,2,0] 245 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,2,0,3] 255 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,2,1,0] 265 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,3,1,2] [all …]
|
D | vector-shuffle-combining.ll | 994 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 995 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[0,1] 1001 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 1002 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[0,1] 1071 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[1,0] 1072 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1],xmm1[0,2] 1077 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[1,0] 1078 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1],xmm1[0,2] 1156 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,3] 1157 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,2,3,1] [all …]
|
D | fmaxnum.ll | 102 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[3,1,2,3] 104 ; SSE-NEXT: shufps {{.*#+}} xmm3 = xmm3[3,1,2,3] 113 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[1,1,2,3] 115 ; SSE-NEXT: shufps {{.*#+}} xmm5 = xmm5[1,1,2,3] 177 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[3,1,2,3] 179 ; SSE-NEXT: shufps {{.*#+}} xmm3 = xmm3[3,1,2,3] 188 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[1,1,2,3] 190 ; SSE-NEXT: shufps {{.*#+}} xmm5 = xmm5[1,1,2,3]
|
D | vec_insert-2.ll | 6 ; X32: shufps $36 15 ; X32: shufps $36
|
D | vec_insert-5.ll | 29 ; CHECK-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 30 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0] 56 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,0],xmm1[1,0] 57 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[2,3]
|
D | sse3-avx-addsub-2.ll | 316 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 317 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 319 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,1,2,0] 346 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[0,1,1,3] 375 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 376 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 379 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[0,0,2,1] 417 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 418 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3]
|
D | sse1.ll | 18 ; CHECK-NEXT: shufps {{.*#+}} xmm2 = xmm2[1,1,2,3] 20 ; CHECK-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3]
|
D | 2009-06-18-movlp-shuffle-register.ll | 6 ; CHECK: shufps $228, %xmm
|
D | vec_fp_to_int.ll | 494 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 520 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 562 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3] 567 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 605 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3] 610 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 650 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 654 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[1,1,2,3] 699 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 751 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] [all …]
|
D | vec_set-6.ll | 4 ; RUN: grep shufps %t | count 1
|
D | palignr.ll | 28 ; CHECK-YONAH-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 29 ; CHECK-YONAH-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,2],xmm1[2,0]
|
D | sse41.ll | 94 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 103 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 114 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 122 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 854 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0,0,0] 861 ; X64-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0,0,0] 879 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0,0,0] 886 ; X64-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0,0,0] 906 ; X32-NEXT: shufps {{.*#+}} xmm4 = xmm4[0,0,0,0] 919 ; X64-NEXT: shufps {{.*#+}} xmm4 = xmm4[0,0,0,0]
|
/external/libyuv/files/source/ |
D | scale_argb.cc | 54 shufps xmm0, xmm1, 0x88 in ScaleARGBRowDown2_SSE2() 87 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDown2Int_SSE2() 88 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDown2Int_SSE2() 174 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDownEvenInt_SSE2() 175 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDownEvenInt_SSE2() 240 shufps xmm0, xmm0, 0xff in ScaleARGBFilterRows_SSE2() 254 shufps xmm0, xmm0, 0xff in ScaleARGBFilterRows_SSE2() 269 shufps xmm0, xmm0, 0xff in ScaleARGBFilterRows_SSE2() 323 shufps xmm0, xmm0, 0xff in ScaleARGBFilterRows_SSSE3() 337 shufps xmm0, xmm0, 0xff in ScaleARGBFilterRows_SSSE3() [all …]
|
D | row_win.cc | 958 shufps xmm0, xmm1, 0x88 in ARGBToUVRow_SSSE3() 959 shufps xmm4, xmm1, 0xdd in ARGBToUVRow_SSSE3() 962 shufps xmm2, xmm3, 0x88 in ARGBToUVRow_SSSE3() 963 shufps xmm4, xmm3, 0xdd in ARGBToUVRow_SSSE3() 1028 shufps xmm0, xmm1, 0x88 in ARGBToUVRow_Unaligned_SSSE3() 1029 shufps xmm4, xmm1, 0xdd in ARGBToUVRow_Unaligned_SSSE3() 1032 shufps xmm2, xmm3, 0x88 in ARGBToUVRow_Unaligned_SSSE3() 1033 shufps xmm4, xmm3, 0xdd in ARGBToUVRow_Unaligned_SSSE3() 1094 shufps xmm0, xmm1, 0x88 in BGRAToUVRow_SSSE3() 1095 shufps xmm4, xmm1, 0xdd in BGRAToUVRow_SSSE3() [all …]
|
/external/llvm/lib/Target/X86/ |
D | README-SSE.txt | 128 shufps $0, %xmm2, %xmm5 #60.21 133 shufps $85, %xmm2, %xmm4 #61.21 134 shufps $170, %xmm2, %xmm3 #62.21 135 shufps $255, %xmm2, %xmm2 #63.21 197 This looks really bad. The problem is shufps is a destructive opcode. Since it 198 appears as operand two in more than one shufps ops. It resulted in a number of 293 shufps $50, %xmm1, %xmm2 294 shufps $132, %xmm2, %xmm0 679 shufps $2, %xmm1, %xmm2 680 shufps $132, %xmm2, %xmm0
|
/external/libvpx/libvpx/third_party/libyuv/source/ |
D | scale_win.cc | 977 shufps xmm0, xmm1, 0xdd in ScaleARGBRowDown2_SSE2() 1003 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDown2Linear_SSE2() 1004 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDown2Linear_SSE2() 1036 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDown2Box_SSE2() 1037 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDown2Box_SSE2() 1118 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDownEvenBox_SSE2() 1119 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDownEvenBox_SSE2()
|
D | row_win.cc | 1425 shufps xmm0, xmm1, 0x88 in ARGBToUVRow_SSSE3() 1426 shufps xmm4, xmm1, 0xdd in ARGBToUVRow_SSSE3() 1429 shufps xmm2, xmm3, 0x88 in ARGBToUVRow_SSSE3() 1430 shufps xmm4, xmm3, 0xdd in ARGBToUVRow_SSSE3() 1495 shufps xmm0, xmm1, 0x88 in ARGBToUVJRow_SSSE3() 1496 shufps xmm4, xmm1, 0xdd in ARGBToUVJRow_SSSE3() 1499 shufps xmm2, xmm3, 0x88 in ARGBToUVJRow_SSSE3() 1500 shufps xmm4, xmm3, 0xdd in ARGBToUVJRow_SSSE3() 1678 shufps xmm0, xmm1, 0x88 in ARGBToUV422Row_SSSE3() 1679 shufps xmm4, xmm1, 0xdd in ARGBToUV422Row_SSSE3() [all …]
|
/external/boringssl/src/crypto/aes/asm/ |
D | aesni-x86.pl | 2158 &shufps ("xmm4","xmm0",0b00010000); 2160 &shufps ("xmm4","xmm0",0b10001100); 2162 &shufps ("xmm1","xmm1",0b11111111); # critical path 2265 &shufps ("xmm4","xmm0",0b00010000); 2268 &shufps ("xmm4","xmm0",0b10001100); 2280 &shufps ("xmm5","xmm0",0b01000100); 2282 &shufps ("xmm3","xmm2",0b01001110); 2371 &shufps ("xmm4","xmm0",0b00010000); 2373 &shufps ("xmm4","xmm0",0b10001100); 2375 &shufps ("xmm1","xmm1",0b11111111); # critical path [all …]
|
/external/boringssl/mac-x86/crypto/aes/ |
D | aesni-x86.S | 2097 shufps $16,%xmm0,%xmm4 2099 shufps $140,%xmm0,%xmm4 2101 shufps $255,%xmm1,%xmm1 2190 shufps $16,%xmm0,%xmm4 2193 shufps $140,%xmm0,%xmm4 2205 shufps $68,%xmm0,%xmm5 2207 shufps $78,%xmm2,%xmm3 2287 shufps $16,%xmm0,%xmm4 2289 shufps $140,%xmm0,%xmm4 2291 shufps $255,%xmm1,%xmm1 [all …]
|
/external/boringssl/linux-x86/crypto/aes/ |
D | aesni-x86.S | 2132 shufps $16,%xmm0,%xmm4 2134 shufps $140,%xmm0,%xmm4 2136 shufps $255,%xmm1,%xmm1 2225 shufps $16,%xmm0,%xmm4 2228 shufps $140,%xmm0,%xmm4 2240 shufps $68,%xmm0,%xmm5 2242 shufps $78,%xmm2,%xmm3 2322 shufps $16,%xmm0,%xmm4 2324 shufps $140,%xmm0,%xmm4 2326 shufps $255,%xmm1,%xmm1 [all …]
|
/external/boringssl/win-x86/crypto/aes/ |
D | aesni-x86.asm | 2093 shufps xmm4,xmm0,16 2095 shufps xmm4,xmm0,140 2097 shufps xmm1,xmm1,255 2186 shufps xmm4,xmm0,16 2189 shufps xmm4,xmm0,140 2201 shufps xmm5,xmm0,68 2203 shufps xmm3,xmm2,78 2283 shufps xmm4,xmm0,16 2285 shufps xmm4,xmm0,140 2287 shufps xmm1,xmm1,255 [all …]
|
/external/boringssl/linux-x86_64/crypto/aes/ |
D | aesni-x86_64.S | 3478 shufps $16,%xmm0,%xmm4 3480 shufps $140,%xmm0,%xmm4 3482 shufps $255,%xmm1,%xmm1 3493 shufps $16,%xmm0,%xmm4 3496 shufps $140,%xmm0,%xmm4 3509 shufps $68,%xmm0,%xmm5 3511 shufps $78,%xmm2,%xmm3 3521 shufps $16,%xmm0,%xmm4 3523 shufps $140,%xmm0,%xmm4 3525 shufps $255,%xmm1,%xmm1 [all …]
|