Home
last modified time | relevance | path

Searched refs:pmaddwd (Results 1 – 25 of 121) sorted by relevance

12345

/external/libvpx/libvpx/vpx_dsp/x86/
Dfwd_txfm_ssse3_x86_64.asm95 pmaddwd m5, m2, [GLOBAL(pw_15137_6270)]
96 pmaddwd m2, [GLOBAL(pw_6270_m15137)]
97 pmaddwd m9, m10, [GLOBAL(pw_15137_6270)]
98 pmaddwd m10, [GLOBAL(pw_6270_m15137)]
123 pmaddwd m7, m1, [GLOBAL(pw_16069_3196)]
124 pmaddwd m1, [GLOBAL(pw_3196_m16069)]
125 pmaddwd m9, m10, [GLOBAL(pw_16069_3196)]
126 pmaddwd m10, [GLOBAL(pw_3196_m16069)]
141 pmaddwd m9, m11, [GLOBAL(pw_9102_13623)]
142 pmaddwd m11, [GLOBAL(pw_13623_m9102)]
[all …]
Dhighbd_sad4d_sse2.asm36 pmaddwd m4, m1
37 pmaddwd m5, m1
46 pmaddwd m6, m1
47 pmaddwd m7, m1
56 pmaddwd m2, m1
65 pmaddwd m2, m1
74 pmaddwd m2, m1
83 pmaddwd m2, m1
112 pmaddwd m4, m1
113 pmaddwd m5, m1
[all …]
Dhighbd_variance_impl_sse2.asm91 pmaddwd xmm1, xmm1
98 pmaddwd xmm3, xmm3
105 pmaddwd xmm1, xmm1
111 pmaddwd xmm3, xmm3
238 pmaddwd xmm1, xmm1
248 pmaddwd xmm3, xmm3
255 pmaddwd xmm1, xmm1
261 pmaddwd xmm3, xmm3
Dvpx_high_subpixel_bilinear_sse2.asm46 pmaddwd xmm0, xmm4 ;multiply the filter factors
103 pmaddwd xmm6, xmm7
104 pmaddwd xmm0, xmm7
135 pmaddwd xmm9, xmm7
136 pmaddwd xmm6, xmm7
137 pmaddwd xmm0, xmm7
138 pmaddwd xmm2, xmm7
Dvpx_high_subpixel_8t_sse2.asm67 pmaddwd xmm0, k0k6 ;multiply the filter factors
68 pmaddwd xmm1, k1k7
69 pmaddwd xmm2, k2k5
70 pmaddwd xmm3, k3k4
167 pmaddwd xmm0, k0k1
168 pmaddwd xmm5, k0k1
169 pmaddwd xmm6, k6k7
170 pmaddwd xmm1, k6k7
171 pmaddwd xmm2, k2k5
172 pmaddwd xmm7, k2k5
[all …]
/external/libaom/libaom/aom_dsp/x86/
Dfwd_txfm_ssse3_x86_64.asm113 pmaddwd m5, m2, [GLOBAL(pw_15137_6270)]
114 pmaddwd m2, [GLOBAL(pw_6270_m15137)]
115 pmaddwd m9, m10, [GLOBAL(pw_15137_6270)]
116 pmaddwd m10, [GLOBAL(pw_6270_m15137)]
141 pmaddwd m7, m1, [GLOBAL(pw_16069_3196)]
142 pmaddwd m1, [GLOBAL(pw_3196_m16069)]
143 pmaddwd m9, m10, [GLOBAL(pw_16069_3196)]
144 pmaddwd m10, [GLOBAL(pw_3196_m16069)]
159 pmaddwd m9, m11, [GLOBAL(pw_9102_13623)]
160 pmaddwd m11, [GLOBAL(pw_13623_m9102)]
[all …]
Dhighbd_sad4d_sse2.asm39 pmaddwd m4, m1
40 pmaddwd m5, m1
49 pmaddwd m6, m1
50 pmaddwd m7, m1
59 pmaddwd m2, m1
68 pmaddwd m2, m1
77 pmaddwd m2, m1
86 pmaddwd m2, m1
115 pmaddwd m4, m1
116 pmaddwd m5, m1
[all …]
Dhighbd_variance_impl_sse2.asm94 pmaddwd xmm1, xmm1
101 pmaddwd xmm3, xmm3
108 pmaddwd xmm1, xmm1
114 pmaddwd xmm3, xmm3
241 pmaddwd xmm1, xmm1
251 pmaddwd xmm3, xmm3
258 pmaddwd xmm1, xmm1
264 pmaddwd xmm3, xmm3
Daom_high_subpixel_8t_sse2.asm70 pmaddwd xmm0, k0k6 ;multiply the filter factors
71 pmaddwd xmm1, k1k7
72 pmaddwd xmm2, k2k5
73 pmaddwd xmm3, k3k4
170 pmaddwd xmm0, k0k1
171 pmaddwd xmm5, k0k1
172 pmaddwd xmm6, k6k7
173 pmaddwd xmm1, k6k7
174 pmaddwd xmm2, k2k5
175 pmaddwd xmm7, k2k5
[all …]
Daom_high_subpixel_bilinear_sse2.asm49 pmaddwd xmm0, xmm4 ;multiply the filter factors
108 pmaddwd xmm6, xmm7
109 pmaddwd xmm0, xmm7
140 pmaddwd xmm5, xmm7
141 pmaddwd xmm6, xmm7
142 pmaddwd xmm0, xmm7
143 pmaddwd xmm2, xmm7
/external/libvpx/libvpx/vp8/encoder/x86/
Ddct_sse2.asm96 pmaddwd xmm0, XMMWORD PTR[GLOBAL(_mult_add)] ;a1 + b1
97 pmaddwd xmm1, XMMWORD PTR[GLOBAL(_mult_sub)] ;a1 - b1
99 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352
100 pmaddwd xmm4, XMMWORD PTR[GLOBAL(_2217_neg5352)];d1*2217 - c1*5352
138 pmaddwd xmm0, XMMWORD PTR[GLOBAL(_mult_add)] ;a1 + b1
139 pmaddwd xmm1, XMMWORD PTR[GLOBAL(_mult_sub)] ;a1 - b1
151 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352
152 pmaddwd xmm4, XMMWORD PTR[GLOBAL(_2217_neg5352)] ;d1*2217 - c1*5352
248 pmaddwd xmm1, XMMWORD PTR[GLOBAL (_5352_2217)] ; c1*2217 + d1*5352
249 pmaddwd xmm4, XMMWORD PTR[GLOBAL (_5352_2217)] ; c1*2217 + d1*5352
[all …]
Dblock_error_sse2.asm38 pmaddwd xmm0, xmm0
39 pmaddwd xmm2, xmm2
97 pmaddwd xmm2, xmm2
102 pmaddwd xmm0, xmm0
157 pmaddwd xmm1, xmm1
Dfwalsh_sse2.asm80 pmaddwd xmm0, [GLOBAL(c1)] ; d11 a11 d10 a10
81 pmaddwd xmm2, [GLOBAL(cn1)] ; c11 b11 c10 b10
83 pmaddwd xmm1, [GLOBAL(c1)] ; d12 a12 d13 a13
84 pmaddwd xmm3, [GLOBAL(cn1)] ; c12 b12 c13 b13
/external/fec/
Ddotprod_sse2_assist.s36 pmaddwd (%edi),%xmm1
40 pmaddwd 16(%edi),%xmm1
44 pmaddwd 32(%edi),%xmm1
49 pmaddwd 48(%edi),%xmm1
Ddotprod_mmx_assist.s36 pmaddwd (%edi),%mm1 # mm1 = b[3]*a[3]+b[2]*a[2],b[1]*a[1]+b[0]*a[0]
40 pmaddwd 8(%edi),%mm1
44 pmaddwd 16(%edi),%mm1
49 pmaddwd 24(%edi),%mm1
Dsumsq_mmx_assist.s28 pmaddwd %mm0,%mm0 # (S0^2+S1^2) (S2^2+S3^2)
30 pmaddwd %mm6,%mm6 # (S4^2+S5^2) (S6^2+S7^2)
67 pmaddwd %mm0,%mm0 # (S0*S0+S1*S1) (S2*S2+S3*S3)
69 pmaddwd %mm1,%mm1
/external/libvpx/libvpx/vp9/encoder/x86/
Dvp9_error_sse2.asm38 pmaddwd m0, m0
39 pmaddwd m1, m1
40 pmaddwd m2, m2
41 pmaddwd m3, m3
94 pmaddwd m0, m0
95 pmaddwd m1, m1
/external/libjpeg-turbo/simd/i386/
Djccolext-mmx.asm288 pmaddwd mm1, [GOTOFF(eax,PW_F0299_F0337)] ; mm1=ROL*FIX(0.299)+GOL*FIX(0.337)
289 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=ROH*FIX(0.299)+GOH*FIX(0.337)
290 pmaddwd mm7, [GOTOFF(eax,PW_MF016_MF033)] ; mm7=ROL*-FIX(0.168)+GOL*-FIX(0.331)
291 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=ROH*-FIX(0.168)+GOH*-FIX(0.331)
320 pmaddwd mm0, [GOTOFF(eax,PW_F0299_F0337)] ; mm0=REL*FIX(0.299)+GEL*FIX(0.337)
321 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=REH*FIX(0.299)+GEH*FIX(0.337)
322 pmaddwd mm5, [GOTOFF(eax,PW_MF016_MF033)] ; mm5=REL*-FIX(0.168)+GEL*-FIX(0.331)
323 pmaddwd mm4, [GOTOFF(eax,PW_MF016_MF033)] ; mm4=REH*-FIX(0.168)+GEH*-FIX(0.331)
358 pmaddwd mm0, [GOTOFF(eax,PW_F0114_F0250)] ; mm0=BOL*FIX(0.114)+GOL*FIX(0.250)
359 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BOH*FIX(0.114)+GOH*FIX(0.250)
[all …]
Djccolext-sse2.asm317 pmaddwd xmm1, [GOTOFF(eax,PW_F0299_F0337)] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337)
318 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337)
319 pmaddwd xmm7, [GOTOFF(eax,PW_MF016_MF033)] ; xmm7=ROL*-FIX(0.168)+GOL*-FIX(0.331)
320 pmaddwd xmm4, [GOTOFF(eax,PW_MF016_MF033)] ; xmm4=ROH*-FIX(0.168)+GOH*-FIX(0.331)
349 pmaddwd xmm0, [GOTOFF(eax,PW_F0299_F0337)] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337)
350 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337)
351 pmaddwd xmm5, [GOTOFF(eax,PW_MF016_MF033)] ; xmm5=REL*-FIX(0.168)+GEL*-FIX(0.331)
352 pmaddwd xmm4, [GOTOFF(eax,PW_MF016_MF033)] ; xmm4=REH*-FIX(0.168)+GEH*-FIX(0.331)
387 pmaddwd xmm0, [GOTOFF(eax,PW_F0114_F0250)] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250)
388 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250)
[all …]
Djcgryext-mmx.asm269 pmaddwd mm1, [GOTOFF(eax,PW_F0299_F0337)] ; mm1=ROL*FIX(0.299)+GOL*FIX(0.337)
270 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=ROH*FIX(0.299)+GOH*FIX(0.337)
277 pmaddwd mm0, [GOTOFF(eax,PW_F0299_F0337)] ; mm0=REL*FIX(0.299)+GEL*FIX(0.337)
278 pmaddwd mm6, [GOTOFF(eax,PW_F0299_F0337)] ; mm6=REH*FIX(0.299)+GEH*FIX(0.337)
289 pmaddwd mm0, [GOTOFF(eax,PW_F0114_F0250)] ; mm0=BOL*FIX(0.114)+GOL*FIX(0.250)
290 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BOH*FIX(0.114)+GOH*FIX(0.250)
305 pmaddwd mm6, [GOTOFF(eax,PW_F0114_F0250)] ; mm6=BEL*FIX(0.114)+GEL*FIX(0.250)
306 pmaddwd mm4, [GOTOFF(eax,PW_F0114_F0250)] ; mm4=BEH*FIX(0.114)+GEH*FIX(0.250)
Djcgryext-sse2.asm298 pmaddwd xmm1, [GOTOFF(eax,PW_F0299_F0337)] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337)
299 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337)
306 pmaddwd xmm0, [GOTOFF(eax,PW_F0299_F0337)] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337)
307 pmaddwd xmm6, [GOTOFF(eax,PW_F0299_F0337)] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337)
318 pmaddwd xmm0, [GOTOFF(eax,PW_F0114_F0250)] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250)
319 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250)
334 pmaddwd xmm6, [GOTOFF(eax,PW_F0114_F0250)] ; xmm6=BEL*FIX(0.114)+GEL*FIX(0.250)
335 pmaddwd xmm4, [GOTOFF(eax,PW_F0114_F0250)] ; xmm4=BEH*FIX(0.114)+GEH*FIX(0.250)
/external/libjpeg-turbo/simd/x86_64/
Djccolext-sse2.asm302 pmaddwd xmm1, [rel PW_F0299_F0337] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337)
303 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337)
304 pmaddwd xmm7, [rel PW_MF016_MF033] ; xmm7=ROL*-FIX(0.168)+GOL*-FIX(0.331)
305 pmaddwd xmm4, [rel PW_MF016_MF033] ; xmm4=ROH*-FIX(0.168)+GOH*-FIX(0.331)
334 pmaddwd xmm0, [rel PW_F0299_F0337] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337)
335 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337)
336 pmaddwd xmm5, [rel PW_MF016_MF033] ; xmm5=REL*-FIX(0.168)+GEL*-FIX(0.331)
337 pmaddwd xmm4, [rel PW_MF016_MF033] ; xmm4=REH*-FIX(0.168)+GEH*-FIX(0.331)
372 pmaddwd xmm0, [rel PW_F0114_F0250] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250)
373 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250)
[all …]
Djcgryext-sse2.asm283 pmaddwd xmm1, [rel PW_F0299_F0337] ; xmm1=ROL*FIX(0.299)+GOL*FIX(0.337)
284 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=ROH*FIX(0.299)+GOH*FIX(0.337)
291 pmaddwd xmm0, [rel PW_F0299_F0337] ; xmm0=REL*FIX(0.299)+GEL*FIX(0.337)
292 pmaddwd xmm6, [rel PW_F0299_F0337] ; xmm6=REH*FIX(0.299)+GEH*FIX(0.337)
303 pmaddwd xmm0, [rel PW_F0114_F0250] ; xmm0=BOL*FIX(0.114)+GOL*FIX(0.250)
304 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BOH*FIX(0.114)+GOH*FIX(0.250)
319 pmaddwd xmm6, [rel PW_F0114_F0250] ; xmm6=BEL*FIX(0.114)+GEL*FIX(0.250)
320 pmaddwd xmm4, [rel PW_F0114_F0250] ; xmm4=BEH*FIX(0.114)+GEH*FIX(0.250)
/external/libaom/libaom/av1/encoder/x86/
Derror_sse2.asm55 pmaddwd m0, m0
56 pmaddwd m1, m1
57 pmaddwd m2, m2
58 pmaddwd m3, m3
/external/llvm-project/llvm/test/CodeGen/X86/
Dslow-pmulld.ll24 ; CHECK32-NEXT: pmaddwd {{\.LCPI.*}}, %xmm0
30 ; CHECK64-NEXT: pmaddwd {{.*}}(%rip), %xmm0
36 ; SSE4-32-NEXT: pmaddwd {{\.LCPI.*}}, %xmm0
42 ; SSE4-64-NEXT: pmaddwd {{.*}}(%rip), %xmm0
154 ; SSE4-32-NEXT: pmaddwd %xmm2, %xmm0
155 ; SSE4-32-NEXT: pmaddwd %xmm2, %xmm1
164 ; SSE4-64-NEXT: pmaddwd %xmm2, %xmm0
165 ; SSE4-64-NEXT: pmaddwd %xmm2, %xmm1
317 ; SSE4-32-NEXT: pmaddwd %xmm4, %xmm0
318 ; SSE4-32-NEXT: pmaddwd %xmm4, %xmm1
[all …]

12345