/external/libvpx/libvpx/vpx_dsp/x86/ |
D | fwd_txfm_ssse3_x86_64.asm | 95 pmaddwd m5, m2, [GLOBAL(pw_15137_6270)] 96 pmaddwd m2, [GLOBAL(pw_6270_m15137)] 97 pmaddwd m9, m10, [GLOBAL(pw_15137_6270)] 98 pmaddwd m10, [GLOBAL(pw_6270_m15137)] 123 pmaddwd m7, m1, [GLOBAL(pw_16069_3196)] 124 pmaddwd m1, [GLOBAL(pw_3196_m16069)] 125 pmaddwd m9, m10, [GLOBAL(pw_16069_3196)] 126 pmaddwd m10, [GLOBAL(pw_3196_m16069)] 141 pmaddwd m9, m11, [GLOBAL(pw_9102_13623)] 142 pmaddwd m11, [GLOBAL(pw_13623_m9102)] [all …]
|
D | highbd_sad4d_sse2.asm | 36 pmaddwd m4, m1 37 pmaddwd m5, m1 46 pmaddwd m6, m1 47 pmaddwd m7, m1 56 pmaddwd m2, m1 65 pmaddwd m2, m1 74 pmaddwd m2, m1 83 pmaddwd m2, m1 112 pmaddwd m4, m1 113 pmaddwd m5, m1 [all …]
|
D | highbd_variance_impl_sse2.asm | 91 pmaddwd xmm1, xmm1 98 pmaddwd xmm3, xmm3 105 pmaddwd xmm1, xmm1 111 pmaddwd xmm3, xmm3 238 pmaddwd xmm1, xmm1 248 pmaddwd xmm3, xmm3 255 pmaddwd xmm1, xmm1 261 pmaddwd xmm3, xmm3
|
D | vpx_high_subpixel_bilinear_sse2.asm | 46 pmaddwd xmm0, xmm4 ;multiply the filter factors 103 pmaddwd xmm6, xmm7 104 pmaddwd xmm0, xmm7 135 pmaddwd xmm9, xmm7 136 pmaddwd xmm6, xmm7 137 pmaddwd xmm0, xmm7 138 pmaddwd xmm2, xmm7
|
D | vpx_high_subpixel_8t_sse2.asm | 67 pmaddwd xmm0, k0k6 ;multiply the filter factors 68 pmaddwd xmm1, k1k7 69 pmaddwd xmm2, k2k5 70 pmaddwd xmm3, k3k4 167 pmaddwd xmm0, k0k1 168 pmaddwd xmm5, k0k1 169 pmaddwd xmm6, k6k7 170 pmaddwd xmm1, k6k7 171 pmaddwd xmm2, k2k5 172 pmaddwd xmm7, k2k5 [all …]
|
/external/libaom/libaom/aom_dsp/x86/ |
D | fwd_txfm_ssse3_x86_64.asm | 113 pmaddwd m5, m2, [GLOBAL(pw_15137_6270)] 114 pmaddwd m2, [GLOBAL(pw_6270_m15137)] 115 pmaddwd m9, m10, [GLOBAL(pw_15137_6270)] 116 pmaddwd m10, [GLOBAL(pw_6270_m15137)] 141 pmaddwd m7, m1, [GLOBAL(pw_16069_3196)] 142 pmaddwd m1, [GLOBAL(pw_3196_m16069)] 143 pmaddwd m9, m10, [GLOBAL(pw_16069_3196)] 144 pmaddwd m10, [GLOBAL(pw_3196_m16069)] 159 pmaddwd m9, m11, [GLOBAL(pw_9102_13623)] 160 pmaddwd m11, [GLOBAL(pw_13623_m9102)] [all …]
|
D | highbd_sad4d_sse2.asm | 39 pmaddwd m4, m1 40 pmaddwd m5, m1 49 pmaddwd m6, m1 50 pmaddwd m7, m1 59 pmaddwd m2, m1 68 pmaddwd m2, m1 77 pmaddwd m2, m1 86 pmaddwd m2, m1 115 pmaddwd m4, m1 116 pmaddwd m5, m1 [all …]
|
D | highbd_variance_impl_sse2.asm | 94 pmaddwd xmm1, xmm1 101 pmaddwd xmm3, xmm3 108 pmaddwd xmm1, xmm1 114 pmaddwd xmm3, xmm3 241 pmaddwd xmm1, xmm1 251 pmaddwd xmm3, xmm3 258 pmaddwd xmm1, xmm1 264 pmaddwd xmm3, xmm3
|
D | aom_high_subpixel_8t_sse2.asm | 70 pmaddwd xmm0, k0k6 ;multiply the filter factors 71 pmaddwd xmm1, k1k7 72 pmaddwd xmm2, k2k5 73 pmaddwd xmm3, k3k4 170 pmaddwd xmm0, k0k1 171 pmaddwd xmm5, k0k1 172 pmaddwd xmm6, k6k7 173 pmaddwd xmm1, k6k7 174 pmaddwd xmm2, k2k5 175 pmaddwd xmm7, k2k5 [all …]
|
D | aom_high_subpixel_bilinear_sse2.asm | 49 pmaddwd xmm0, xmm4 ;multiply the filter factors 108 pmaddwd xmm6, xmm7 109 pmaddwd xmm0, xmm7 140 pmaddwd xmm5, xmm7 141 pmaddwd xmm6, xmm7 142 pmaddwd xmm0, xmm7 143 pmaddwd xmm2, xmm7
|
/external/libvpx/libvpx/vp8/encoder/x86/ |
D | dct_sse2.asm | 96 pmaddwd xmm0, XMMWORD PTR[GLOBAL(_mult_add)] ;a1 + b1 97 pmaddwd xmm1, XMMWORD PTR[GLOBAL(_mult_sub)] ;a1 - b1 99 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352 100 pmaddwd xmm4, XMMWORD PTR[GLOBAL(_2217_neg5352)];d1*2217 - c1*5352 138 pmaddwd xmm0, XMMWORD PTR[GLOBAL(_mult_add)] ;a1 + b1 139 pmaddwd xmm1, XMMWORD PTR[GLOBAL(_mult_sub)] ;a1 - b1 151 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352 152 pmaddwd xmm4, XMMWORD PTR[GLOBAL(_2217_neg5352)] ;d1*2217 - c1*5352 248 pmaddwd xmm1, XMMWORD PTR[GLOBAL (_5352_2217)] ; c1*2217 + d1*5352 249 pmaddwd xmm4, XMMWORD PTR[GLOBAL (_5352_2217)] ; c1*2217 + d1*5352 [all …]
|
D | block_error_sse2.asm | 38 pmaddwd xmm0, xmm0 39 pmaddwd xmm2, xmm2 97 pmaddwd xmm2, xmm2 102 pmaddwd xmm0, xmm0 157 pmaddwd xmm1, xmm1
|
D | fwalsh_sse2.asm | 80 pmaddwd xmm0, [GLOBAL(c1)] ; d11 a11 d10 a10 81 pmaddwd xmm2, [GLOBAL(cn1)] ; c11 b11 c10 b10 83 pmaddwd xmm1, [GLOBAL(c1)] ; d12 a12 d13 a13 84 pmaddwd xmm3, [GLOBAL(cn1)] ; c12 b12 c13 b13
|
/external/fec/ |
D | dotprod_sse2_assist.s | 36 pmaddwd (%edi),%xmm1 40 pmaddwd 16(%edi),%xmm1 44 pmaddwd 32(%edi),%xmm1 49 pmaddwd 48(%edi),%xmm1
|
D | dotprod_mmx_assist.s | 36 pmaddwd (%edi),%mm1 # mm1 = b[3]*a[3]+b[2]*a[2],b[1]*a[1]+b[0]*a[0] 40 pmaddwd 8(%edi),%mm1 44 pmaddwd 16(%edi),%mm1 49 pmaddwd 24(%edi),%mm1
|
D | sumsq_mmx_assist.s | 28 pmaddwd %mm0,%mm0 # (S0^2+S1^2) (S2^2+S3^2) 30 pmaddwd %mm6,%mm6 # (S4^2+S5^2) (S6^2+S7^2) 67 pmaddwd %mm0,%mm0 # (S0*S0+S1*S1) (S2*S2+S3*S3) 69 pmaddwd %mm1,%mm1
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_error_sse2.asm | 38 pmaddwd m0, m0 39 pmaddwd m1, m1 40 pmaddwd m2, m2 41 pmaddwd m3, m3 94 pmaddwd m0, m0 95 pmaddwd m1, m1
|
/external/libjpeg-turbo/simd/i386/ |
D | jccolext-mmx.asm | 290 pmaddwd mm1, [GOTOFF(eax,PW_F0299_F0337)] ; mm1=ROL*FIX(0.299)+GOL*FIX(0.337) 291 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=ROH*FIX(0.299)+GOH*FIX(0.337) 292 pmaddwd mm7, [GOTOFF(eax,PW_MF016_MF033)] ; mm7=ROL*-FIX(0.168)+GOL*-FIX(0.331) 293 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=ROH*-FIX(0.168)+GOH*-FIX(0.331) 322 pmaddwd mm0, [GOTOFF(eax,PW_F0299_F0337)] ; mm0=REL*FIX(0.299)+GEL*FIX(0.337) 323 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=REH*FIX(0.299)+GEH*FIX(0.337) 324 pmaddwd mm5, [GOTOFF(eax,PW_MF016_MF033)] ; mm5=REL*-FIX(0.168)+GEL*-FIX(0.331) 325 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=REH*-FIX(0.168)+GEH*-FIX(0.331) 360 pmaddwd mm0, [GOTOFF(eax,PW_F0114_F0250)] ; mm0=BOL*FIX(0.114)+GOL*FIX(0.250) 361 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BOH*FIX(0.114)+GOH*FIX(0.250) [all …]
|
D | jccolext-sse2.asm | 319 pmaddwd xmm1, [GOTOFF(eax,PW_F0299_F0337)] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 320 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 321 pmaddwd xmm7, [GOTOFF(eax,PW_MF016_MF033)] ; xmm7=ROL*-FIX(0.168)+GOL*-FIX(0.331) 322 pmaddwd xmm4, [GOTOFF(eax,PW_MF016_MF033)] ; xmm4=ROH*-FIX(0.168)+GOH*-FIX(0.331) 351 pmaddwd xmm0, [GOTOFF(eax,PW_F0299_F0337)] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 352 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 353 pmaddwd xmm5, [GOTOFF(eax,PW_MF016_MF033)] ; xmm5=REL*-FIX(0.168)+GEL*-FIX(0.331) 354 pmaddwd xmm4, [GOTOFF(eax,PW_MF016_MF033)] ; xmm4=REH*-FIX(0.168)+GEH*-FIX(0.331) 389 pmaddwd xmm0, [GOTOFF(eax,PW_F0114_F0250)] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 390 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) [all …]
|
D | jcgryext-mmx.asm | 271 pmaddwd mm1, [GOTOFF(eax,PW_F0299_F0337)] ; mm1=ROL*FIX(0.299)+GOL*FIX(0.337) 272 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=ROH*FIX(0.299)+GOH*FIX(0.337) 279 pmaddwd mm0, [GOTOFF(eax,PW_F0299_F0337)] ; mm0=REL*FIX(0.299)+GEL*FIX(0.337) 280 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=REH*FIX(0.299)+GEH*FIX(0.337) 291 pmaddwd mm0, [GOTOFF(eax,PW_F0114_F0250)] ; mm0=BOL*FIX(0.114)+GOL*FIX(0.250) 292 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BOH*FIX(0.114)+GOH*FIX(0.250) 307 pmaddwd mm6, [GOTOFF(eax,PW_F0114_F0250)] ; mm6=BEL*FIX(0.114)+GEL*FIX(0.250) 308 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BEH*FIX(0.114)+GEH*FIX(0.250)
|
D | jcgryext-sse2.asm | 300 pmaddwd xmm1, [GOTOFF(eax,PW_F0299_F0337)] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 301 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 308 pmaddwd xmm0, [GOTOFF(eax,PW_F0299_F0337)] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 309 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 320 pmaddwd xmm0, [GOTOFF(eax,PW_F0114_F0250)] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 321 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) 336 pmaddwd xmm6, [GOTOFF(eax,PW_F0114_F0250)] ; xmm6=BEL*FIX(0.114)+GEL*FIX(0.250) 337 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BEH*FIX(0.114)+GEH*FIX(0.250)
|
/external/libjpeg-turbo/simd/x86_64/ |
D | jccolext-sse2.asm | 303 pmaddwd xmm1, [rel PW_F0299_F0337] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 304 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 305 pmaddwd xmm7, [rel PW_MF016_MF033] ; xmm7=ROL*-FIX(0.168)+GOL*-FIX(0.331) 306 pmaddwd xmm4, [rel PW_MF016_MF033] ; xmm4=ROH*-FIX(0.168)+GOH*-FIX(0.331) 335 pmaddwd xmm0, [rel PW_F0299_F0337] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 336 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 337 pmaddwd xmm5, [rel PW_MF016_MF033] ; xmm5=REL*-FIX(0.168)+GEL*-FIX(0.331) 338 pmaddwd xmm4, [rel PW_MF016_MF033] ; xmm4=REH*-FIX(0.168)+GEH*-FIX(0.331) 373 pmaddwd xmm0, [rel PW_F0114_F0250] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 374 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) [all …]
|
D | jcgryext-sse2.asm | 284 pmaddwd xmm1, [rel PW_F0299_F0337] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 285 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 292 pmaddwd xmm0, [rel PW_F0299_F0337] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 293 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 304 pmaddwd xmm0, [rel PW_F0114_F0250] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 305 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) 320 pmaddwd xmm6, [rel PW_F0114_F0250] ; xmm6=BEL*FIX(0.114)+GEL*FIX(0.250) 321 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BEH*FIX(0.114)+GEH*FIX(0.250)
|
/external/libaom/libaom/av1/encoder/x86/ |
D | error_sse2.asm | 40 pmaddwd m0, m0 41 pmaddwd m1, m1 42 pmaddwd m2, m2 43 pmaddwd m3, m3
|
/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/X86/ |
D | slow-pmulld.ll | 24 ; CHECK32-NEXT: pmaddwd {{\.LCPI.*}}, %xmm0 30 ; CHECK64-NEXT: pmaddwd {{.*}}(%rip), %xmm0 36 ; SSE4-32-NEXT: pmaddwd {{\.LCPI.*}}, %xmm0 42 ; SSE4-64-NEXT: pmaddwd {{.*}}(%rip), %xmm0 159 ; SSE4-32-NEXT: pmaddwd %xmm2, %xmm0 160 ; SSE4-32-NEXT: pmaddwd %xmm2, %xmm1 170 ; SSE4-64-NEXT: pmaddwd %xmm2, %xmm0 171 ; SSE4-64-NEXT: pmaddwd %xmm2, %xmm1 329 ; SSE4-32-NEXT: pmaddwd %xmm4, %xmm0 330 ; SSE4-32-NEXT: pmaddwd %xmm4, %xmm1 [all …]
|