/external/llvm/test/CodeGen/X86/ |
D | vector-shuffle-128-v4.ll | 134 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,0,1] 147 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,0] 160 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,3,0,0] 173 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,0,0] 186 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,2,0,0] 199 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,3,3,0] 212 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,2,1,0] 251 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,2] 279 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,3,3] 337 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] [all …]
|
D | vec_insert-2.ll | 9 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 10 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0] 15 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[2,0] 16 ; X64-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,1],xmm0[2,0] 27 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 28 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0] 34 ; X64-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 35 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
|
D | vector-shuffle-sse1.ll | 9 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,0,1] 17 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,0] 25 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,3,0,0] 33 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,0,0] 41 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,2,0,0] 49 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,3,3,0] 57 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,2,1,0] 81 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0,2,2] 89 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,3,3] 126 ; SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[0,0] [all …]
|
D | vec_insert-3.ll | 9 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 10 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 12 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 13 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
|
D | insertelement-zero.ll | 169 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 170 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 176 ; SSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 177 ; SSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 183 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 184 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 207 ; SSE2-NEXT: shufps {{.*#+}} xmm2 = xmm2[0,0],xmm1[3,0] 208 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,1],xmm2[0,2] 215 ; SSE3-NEXT: shufps {{.*#+}} xmm2 = xmm2[0,0],xmm1[3,0] 216 ; SSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,1],xmm2[0,2] [all …]
|
D | vec_insert-5.ll | 41 ; X32-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 42 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0] 49 ; X64-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0] 50 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0] 83 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,0],xmm1[1,0] 84 ; X32-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[2,3] 91 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,0],xmm1[1,0] 92 ; X64-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[2,3]
|
D | vector-blend.ll | 13 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[1,3] 14 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2,1,3] 19 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2],xmm1[1,3] 20 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2,1,3] 67 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[3,0] 68 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 73 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[3,0] 74 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2] 99 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,0],xmm0[0,0] 100 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[2,3] [all …]
|
D | swizzle-2.ll | 155 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,3,2] 165 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,1,3,0] 175 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0,3,2] 185 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,0,2] 205 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[2,0,1,3] 215 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,2,3,1] 225 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,3,2,0] 245 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,2,0,3] 255 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,2,1,0] 265 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,3,1,2] [all …]
|
D | vector-shuffle-combining.ll | 999 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 1000 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[0,1] 1006 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[3,0] 1007 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[0,1] 1076 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[1,0] 1077 ; SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1],xmm1[0,2] 1082 ; SSSE3-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[1,0] 1083 ; SSSE3-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1],xmm1[0,2] 1161 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,3] 1162 ; SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,2,3,1] [all …]
|
D | vector-rem.ll | 88 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 89 ; CHECK-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 93 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 95 ; CHECK-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3]
|
D | sse3-avx-addsub-2.ll | 316 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 317 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 319 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[0,1,2,0] 346 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[0,1,1,3] 375 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 376 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 379 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[0,0,2,1] 417 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[3,1,2,3] 418 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3]
|
D | 2009-06-18-movlp-shuffle-register.ll | 6 ; CHECK: shufps $228, %xmm
|
D | sse1.ll | 18 ; CHECK-NEXT: shufps {{.*#+}} xmm2 = xmm2[1,1,2,3] 20 ; CHECK-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3]
|
D | vec_fp_to_int.ll | 495 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 521 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 563 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3] 568 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 606 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[1,1,2,3] 611 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 651 ; SSE-NEXT: shufps {{.*#+}} xmm1 = xmm1[3,1,2,3] 655 ; SSE-NEXT: shufps {{.*#+}} xmm2 = xmm2[1,1,2,3] 700 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] 752 ; SSE-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3] [all …]
|
D | vec_set-6.ll | 9 ; CHECK-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,0],xmm1[0,1]
|
/external/swiftshader/third_party/LLVM/test/CodeGen/X86/ |
D | sse1.ll | 37 ; CHECK-NOT: shufps $16 38 ; CHECK: shufps $1, 39 ; CHECK-NOT: shufps $16 40 ; CHECK: shufps $1, 41 ; CHECK-NOT: shufps $16 43 ; CHECK-NOT: shufps $16
|
D | vec_shuffle-16.ll | 7 ; sse: shufps 17 ; sse: shufps 27 ; sse: shufps 38 ; sse: shufps
|
D | vec_insert-2.ll | 6 ; X32: shufps $36 15 ; X32: shufps $36
|
D | 2009-06-18-movlp-shuffle-register.ll | 6 ; CHECK: shufps $-28, %xmm
|
D | vec_set-6.ll | 4 ; RUN: grep shufps %t | count 1
|
D | vec_shuffle-30.ll | 3 ; RUN: grep shufps %t | count 1
|
/external/llvm/lib/Target/X86/ |
D | README-SSE.txt | 128 shufps $0, %xmm2, %xmm5 #60.21 133 shufps $85, %xmm2, %xmm4 #61.21 134 shufps $170, %xmm2, %xmm3 #62.21 135 shufps $255, %xmm2, %xmm2 #63.21 197 This looks really bad. The problem is shufps is a destructive opcode. Since it 198 appears as operand two in more than one shufps ops. It resulted in a number of 293 shufps $50, %xmm1, %xmm2 294 shufps $132, %xmm2, %xmm0 679 shufps $2, %xmm1, %xmm2 680 shufps $132, %xmm2, %xmm0
|
/external/swiftshader/third_party/LLVM/lib/Target/X86/ |
D | README-SSE.txt | 158 shufps $0, %xmm2, %xmm5 #60.21 163 shufps $85, %xmm2, %xmm4 #61.21 164 shufps $170, %xmm2, %xmm3 #62.21 165 shufps $255, %xmm2, %xmm2 #63.21 227 This looks really bad. The problem is shufps is a destructive opcode. Since it 228 appears as operand two in more than one shufps ops. It resulted in a number of 323 shufps $50, %xmm1, %xmm2 324 shufps $132, %xmm2, %xmm0 745 shufps $2, %xmm1, %xmm2 746 shufps $132, %xmm2, %xmm0
|
/external/boringssl/src/crypto/aes/asm/ |
D | aesni-x86.pl | 2164 &shufps ("xmm4","xmm0",0b00010000); 2166 &shufps ("xmm4","xmm0",0b10001100); 2168 &shufps ("xmm1","xmm1",0b11111111); # critical path 2271 &shufps ("xmm4","xmm0",0b00010000); 2274 &shufps ("xmm4","xmm0",0b10001100); 2286 &shufps ("xmm5","xmm0",0b01000100); 2288 &shufps ("xmm3","xmm2",0b01001110); 2377 &shufps ("xmm4","xmm0",0b00010000); 2379 &shufps ("xmm4","xmm0",0b10001100); 2381 &shufps ("xmm1","xmm1",0b11111111); # critical path [all …]
|
/external/libyuv/files/source/ |
D | scale_win.cc | 1008 shufps xmm0, xmm1, 0xdd in ScaleARGBRowDown2_SSE2() 1034 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDown2Linear_SSE2() 1035 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDown2Linear_SSE2() 1067 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDown2Box_SSE2() 1068 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDown2Box_SSE2() 1150 shufps xmm0, xmm1, 0x88 // even pixels in ScaleARGBRowDownEvenBox_SSE2() 1151 shufps xmm2, xmm1, 0xdd // odd pixels in ScaleARGBRowDownEvenBox_SSE2()
|