/external/libvpx/libvpx/vpx_dsp/x86/ |
D | fwd_txfm_ssse3_x86_64.asm | 95 pmaddwd m5, m2, [GLOBAL(pw_15137_6270)] 96 pmaddwd m2, [GLOBAL(pw_6270_m15137)] 97 pmaddwd m9, m10, [GLOBAL(pw_15137_6270)] 98 pmaddwd m10, [GLOBAL(pw_6270_m15137)] 123 pmaddwd m7, m1, [GLOBAL(pw_16069_3196)] 124 pmaddwd m1, [GLOBAL(pw_3196_m16069)] 125 pmaddwd m9, m10, [GLOBAL(pw_16069_3196)] 126 pmaddwd m10, [GLOBAL(pw_3196_m16069)] 141 pmaddwd m9, m11, [GLOBAL(pw_9102_13623)] 142 pmaddwd m11, [GLOBAL(pw_13623_m9102)] [all …]
|
D | highbd_sad4d_sse2.asm | 36 pmaddwd m4, m1 37 pmaddwd m5, m1 46 pmaddwd m6, m1 47 pmaddwd m7, m1 56 pmaddwd m2, m1 65 pmaddwd m2, m1 74 pmaddwd m2, m1 83 pmaddwd m2, m1 112 pmaddwd m4, m1 113 pmaddwd m5, m1 [all …]
|
D | highbd_variance_impl_sse2.asm | 91 pmaddwd xmm1, xmm1 98 pmaddwd xmm3, xmm3 105 pmaddwd xmm1, xmm1 111 pmaddwd xmm3, xmm3 238 pmaddwd xmm1, xmm1 248 pmaddwd xmm3, xmm3 255 pmaddwd xmm1, xmm1 261 pmaddwd xmm3, xmm3
|
D | vpx_high_subpixel_bilinear_sse2.asm | 46 pmaddwd xmm0, xmm4 ;multiply the filter factors 103 pmaddwd xmm6, xmm7 104 pmaddwd xmm0, xmm7 135 pmaddwd xmm9, xmm7 136 pmaddwd xmm6, xmm7 137 pmaddwd xmm0, xmm7 138 pmaddwd xmm2, xmm7
|
D | vpx_high_subpixel_8t_sse2.asm | 67 pmaddwd xmm0, k0k6 ;multiply the filter factors 68 pmaddwd xmm1, k1k7 69 pmaddwd xmm2, k2k5 70 pmaddwd xmm3, k3k4 167 pmaddwd xmm0, k0k1 168 pmaddwd xmm5, k0k1 169 pmaddwd xmm6, k6k7 170 pmaddwd xmm1, k6k7 171 pmaddwd xmm2, k2k5 172 pmaddwd xmm7, k2k5 [all …]
|
/external/libaom/libaom/aom_dsp/x86/ |
D | fwd_txfm_ssse3_x86_64.asm | 113 pmaddwd m5, m2, [GLOBAL(pw_15137_6270)] 114 pmaddwd m2, [GLOBAL(pw_6270_m15137)] 115 pmaddwd m9, m10, [GLOBAL(pw_15137_6270)] 116 pmaddwd m10, [GLOBAL(pw_6270_m15137)] 141 pmaddwd m7, m1, [GLOBAL(pw_16069_3196)] 142 pmaddwd m1, [GLOBAL(pw_3196_m16069)] 143 pmaddwd m9, m10, [GLOBAL(pw_16069_3196)] 144 pmaddwd m10, [GLOBAL(pw_3196_m16069)] 159 pmaddwd m9, m11, [GLOBAL(pw_9102_13623)] 160 pmaddwd m11, [GLOBAL(pw_13623_m9102)] [all …]
|
D | highbd_sad4d_sse2.asm | 39 pmaddwd m4, m1 40 pmaddwd m5, m1 49 pmaddwd m6, m1 50 pmaddwd m7, m1 59 pmaddwd m2, m1 68 pmaddwd m2, m1 77 pmaddwd m2, m1 86 pmaddwd m2, m1 115 pmaddwd m4, m1 116 pmaddwd m5, m1 [all …]
|
D | highbd_variance_impl_sse2.asm | 94 pmaddwd xmm1, xmm1 101 pmaddwd xmm3, xmm3 108 pmaddwd xmm1, xmm1 114 pmaddwd xmm3, xmm3 241 pmaddwd xmm1, xmm1 251 pmaddwd xmm3, xmm3 258 pmaddwd xmm1, xmm1 264 pmaddwd xmm3, xmm3
|
D | aom_high_subpixel_8t_sse2.asm | 70 pmaddwd xmm0, k0k6 ;multiply the filter factors 71 pmaddwd xmm1, k1k7 72 pmaddwd xmm2, k2k5 73 pmaddwd xmm3, k3k4 170 pmaddwd xmm0, k0k1 171 pmaddwd xmm5, k0k1 172 pmaddwd xmm6, k6k7 173 pmaddwd xmm1, k6k7 174 pmaddwd xmm2, k2k5 175 pmaddwd xmm7, k2k5 [all …]
|
D | aom_high_subpixel_bilinear_sse2.asm | 49 pmaddwd xmm0, xmm4 ;multiply the filter factors 108 pmaddwd xmm6, xmm7 109 pmaddwd xmm0, xmm7 140 pmaddwd xmm5, xmm7 141 pmaddwd xmm6, xmm7 142 pmaddwd xmm0, xmm7 143 pmaddwd xmm2, xmm7
|
/external/libvpx/libvpx/vp8/encoder/x86/ |
D | dct_sse2.asm | 96 pmaddwd xmm0, XMMWORD PTR[GLOBAL(_mult_add)] ;a1 + b1 97 pmaddwd xmm1, XMMWORD PTR[GLOBAL(_mult_sub)] ;a1 - b1 99 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352 100 pmaddwd xmm4, XMMWORD PTR[GLOBAL(_2217_neg5352)];d1*2217 - c1*5352 138 pmaddwd xmm0, XMMWORD PTR[GLOBAL(_mult_add)] ;a1 + b1 139 pmaddwd xmm1, XMMWORD PTR[GLOBAL(_mult_sub)] ;a1 - b1 151 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352 152 pmaddwd xmm4, XMMWORD PTR[GLOBAL(_2217_neg5352)] ;d1*2217 - c1*5352 248 pmaddwd xmm1, XMMWORD PTR[GLOBAL (_5352_2217)] ; c1*2217 + d1*5352 249 pmaddwd xmm4, XMMWORD PTR[GLOBAL (_5352_2217)] ; c1*2217 + d1*5352 [all …]
|
D | block_error_sse2.asm | 38 pmaddwd xmm0, xmm0 39 pmaddwd xmm2, xmm2 97 pmaddwd xmm2, xmm2 102 pmaddwd xmm0, xmm0 157 pmaddwd xmm1, xmm1
|
D | fwalsh_sse2.asm | 80 pmaddwd xmm0, [GLOBAL(c1)] ; d11 a11 d10 a10 81 pmaddwd xmm2, [GLOBAL(cn1)] ; c11 b11 c10 b10 83 pmaddwd xmm1, [GLOBAL(c1)] ; d12 a12 d13 a13 84 pmaddwd xmm3, [GLOBAL(cn1)] ; c12 b12 c13 b13
|
/external/fec/ |
D | dotprod_sse2_assist.s | 36 pmaddwd (%edi),%xmm1 40 pmaddwd 16(%edi),%xmm1 44 pmaddwd 32(%edi),%xmm1 49 pmaddwd 48(%edi),%xmm1
|
D | dotprod_mmx_assist.s | 36 pmaddwd (%edi),%mm1 # mm1 = b[3]*a[3]+b[2]*a[2],b[1]*a[1]+b[0]*a[0] 40 pmaddwd 8(%edi),%mm1 44 pmaddwd 16(%edi),%mm1 49 pmaddwd 24(%edi),%mm1
|
D | sumsq_mmx_assist.s | 28 pmaddwd %mm0,%mm0 # (S0^2+S1^2) (S2^2+S3^2) 30 pmaddwd %mm6,%mm6 # (S4^2+S5^2) (S6^2+S7^2) 67 pmaddwd %mm0,%mm0 # (S0*S0+S1*S1) (S2*S2+S3*S3) 69 pmaddwd %mm1,%mm1
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_error_sse2.asm | 38 pmaddwd m0, m0 39 pmaddwd m1, m1 40 pmaddwd m2, m2 41 pmaddwd m3, m3 94 pmaddwd m0, m0 95 pmaddwd m1, m1
|
/external/libjpeg-turbo/simd/i386/ |
D | jccolext-mmx.asm | 288 pmaddwd mm1, [GOTOFF(eax,PW_F0299_F0337)] ; mm1=ROL*FIX(0.299)+GOL*FIX(0.337) 289 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=ROH*FIX(0.299)+GOH*FIX(0.337) 290 pmaddwd mm7, [GOTOFF(eax,PW_MF016_MF033)] ; mm7=ROL*-FIX(0.168)+GOL*-FIX(0.331) 291 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=ROH*-FIX(0.168)+GOH*-FIX(0.331) 320 pmaddwd mm0, [GOTOFF(eax,PW_F0299_F0337)] ; mm0=REL*FIX(0.299)+GEL*FIX(0.337) 321 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=REH*FIX(0.299)+GEH*FIX(0.337) 322 pmaddwd mm5, [GOTOFF(eax,PW_MF016_MF033)] ; mm5=REL*-FIX(0.168)+GEL*-FIX(0.331) 323 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=REH*-FIX(0.168)+GEH*-FIX(0.331) 358 pmaddwd mm0, [GOTOFF(eax,PW_F0114_F0250)] ; mm0=BOL*FIX(0.114)+GOL*FIX(0.250) 359 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BOH*FIX(0.114)+GOH*FIX(0.250) [all …]
|
D | jccolext-sse2.asm | 317 pmaddwd xmm1, [GOTOFF(eax,PW_F0299_F0337)] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 318 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 319 pmaddwd xmm7, [GOTOFF(eax,PW_MF016_MF033)] ; xmm7=ROL*-FIX(0.168)+GOL*-FIX(0.331) 320 pmaddwd xmm4, [GOTOFF(eax,PW_MF016_MF033)] ; xmm4=ROH*-FIX(0.168)+GOH*-FIX(0.331) 349 pmaddwd xmm0, [GOTOFF(eax,PW_F0299_F0337)] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 350 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 351 pmaddwd xmm5, [GOTOFF(eax,PW_MF016_MF033)] ; xmm5=REL*-FIX(0.168)+GEL*-FIX(0.331) 352 pmaddwd xmm4, [GOTOFF(eax,PW_MF016_MF033)] ; xmm4=REH*-FIX(0.168)+GEH*-FIX(0.331) 387 pmaddwd xmm0, [GOTOFF(eax,PW_F0114_F0250)] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 388 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) [all …]
|
D | jcgryext-mmx.asm | 269 pmaddwd mm1, [GOTOFF(eax,PW_F0299_F0337)] ; mm1=ROL*FIX(0.299)+GOL*FIX(0.337) 270 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=ROH*FIX(0.299)+GOH*FIX(0.337) 277 pmaddwd mm0, [GOTOFF(eax,PW_F0299_F0337)] ; mm0=REL*FIX(0.299)+GEL*FIX(0.337) 278 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=REH*FIX(0.299)+GEH*FIX(0.337) 289 pmaddwd mm0, [GOTOFF(eax,PW_F0114_F0250)] ; mm0=BOL*FIX(0.114)+GOL*FIX(0.250) 290 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BOH*FIX(0.114)+GOH*FIX(0.250) 305 pmaddwd mm6, [GOTOFF(eax,PW_F0114_F0250)] ; mm6=BEL*FIX(0.114)+GEL*FIX(0.250) 306 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BEH*FIX(0.114)+GEH*FIX(0.250)
|
D | jcgryext-sse2.asm | 298 pmaddwd xmm1, [GOTOFF(eax,PW_F0299_F0337)] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 299 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 306 pmaddwd xmm0, [GOTOFF(eax,PW_F0299_F0337)] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 307 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 318 pmaddwd xmm0, [GOTOFF(eax,PW_F0114_F0250)] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 319 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) 334 pmaddwd xmm6, [GOTOFF(eax,PW_F0114_F0250)] ; xmm6=BEL*FIX(0.114)+GEL*FIX(0.250) 335 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BEH*FIX(0.114)+GEH*FIX(0.250)
|
/external/libjpeg-turbo/simd/x86_64/ |
D | jccolext-sse2.asm | 302 pmaddwd xmm1, [rel PW_F0299_F0337] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 303 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 304 pmaddwd xmm7, [rel PW_MF016_MF033] ; xmm7=ROL*-FIX(0.168)+GOL*-FIX(0.331) 305 pmaddwd xmm4, [rel PW_MF016_MF033] ; xmm4=ROH*-FIX(0.168)+GOH*-FIX(0.331) 334 pmaddwd xmm0, [rel PW_F0299_F0337] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 335 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 336 pmaddwd xmm5, [rel PW_MF016_MF033] ; xmm5=REL*-FIX(0.168)+GEL*-FIX(0.331) 337 pmaddwd xmm4, [rel PW_MF016_MF033] ; xmm4=REH*-FIX(0.168)+GEH*-FIX(0.331) 372 pmaddwd xmm0, [rel PW_F0114_F0250] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 373 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) [all …]
|
D | jcgryext-sse2.asm | 283 pmaddwd xmm1, [rel PW_F0299_F0337] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337) 284 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337) 291 pmaddwd xmm0, [rel PW_F0299_F0337] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337) 292 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337) 303 pmaddwd xmm0, [rel PW_F0114_F0250] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250) 304 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250) 319 pmaddwd xmm6, [rel PW_F0114_F0250] ; xmm6=BEL*FIX(0.114)+GEL*FIX(0.250) 320 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BEH*FIX(0.114)+GEH*FIX(0.250)
|
/external/libaom/libaom/av1/encoder/x86/ |
D | error_sse2.asm | 55 pmaddwd m0, m0 56 pmaddwd m1, m1 57 pmaddwd m2, m2 58 pmaddwd m3, m3
|
/external/llvm-project/llvm/test/CodeGen/X86/ |
D | slow-pmulld.ll | 24 ; CHECK32-NEXT: pmaddwd {{\.LCPI.*}}, %xmm0 30 ; CHECK64-NEXT: pmaddwd {{.*}}(%rip), %xmm0 36 ; SSE4-32-NEXT: pmaddwd {{\.LCPI.*}}, %xmm0 42 ; SSE4-64-NEXT: pmaddwd {{.*}}(%rip), %xmm0 154 ; SSE4-32-NEXT: pmaddwd %xmm2, %xmm0 155 ; SSE4-32-NEXT: pmaddwd %xmm2, %xmm1 164 ; SSE4-64-NEXT: pmaddwd %xmm2, %xmm0 165 ; SSE4-64-NEXT: pmaddwd %xmm2, %xmm1 317 ; SSE4-32-NEXT: pmaddwd %xmm4, %xmm0 318 ; SSE4-32-NEXT: pmaddwd %xmm4, %xmm1 [all …]
|