Home
last modified time | relevance | path

Searched refs:_mm_mulhi_epi16 (Results 1 – 25 of 42) sorted by relevance

12

/external/XNNPACK/src/qs8-dwconv/gen/
Dup24x9-minmax-sse41-mul16.c107 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
109 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
111 const __m128i vp0xGHIJKLMNhi = _mm_mulhi_epi16(vxi0xGHIJKLMN, vxk0xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
136 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
138 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
140 const __m128i vp1xGHIJKLMNhi = _mm_mulhi_epi16(vxi1xGHIJKLMN, vxk1xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
165 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
167 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
169 const __m128i vp2xGHIJKLMNhi = _mm_mulhi_epi16(vxi2xGHIJKLMN, vxk2xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
194 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
[all …]
Dup16x9-minmax-sse41-mul16.c101 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
103 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
122 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
124 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
143 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
145 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
164 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
166 const __m128i vp3x89ABCDEFhi = _mm_mulhi_epi16(vxi3x89ABCDEF, vxk3x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
185 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
187 const __m128i vp4x89ABCDEFhi = _mm_mulhi_epi16(vxi4x89ABCDEF, vxk4x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
[all …]
Dup8x9-minmax-sse41-mul16.c95 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
108 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
121 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
134 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
147 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
160 const __m128i vp5x01234567hi = _mm_mulhi_epi16(vxi5x01234567, vxk5x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
173 const __m128i vp6x01234567hi = _mm_mulhi_epi16(vxi6x01234567, vxk6x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
186 const __m128i vp7x01234567hi = _mm_mulhi_epi16(vxi7x01234567, vxk7x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
199 const __m128i vp8x01234567hi = _mm_mulhi_epi16(vxi8x01234567, vxk8x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
262 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16()
[all …]
Dup16x9-minmax-ssse3-mul16.c101 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
103 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
122 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
124 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
143 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
145 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
164 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
166 const __m128i vp3x89ABCDEFhi = _mm_mulhi_epi16(vxi3x89ABCDEF, vxk3x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
185 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
187 const __m128i vp4x89ABCDEFhi = _mm_mulhi_epi16(vxi4x89ABCDEF, vxk4x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
[all …]
Dup16x9-minmax-sse2-mul16.c101 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
103 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
122 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
124 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
143 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
145 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
164 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
166 const __m128i vp3x89ABCDEFhi = _mm_mulhi_epi16(vxi3x89ABCDEF, vxk3x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
185 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
187 const __m128i vp4x89ABCDEFhi = _mm_mulhi_epi16(vxi4x89ABCDEF, vxk4x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
[all …]
Dup24x9-minmax-ssse3-mul16.c107 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
109 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
111 const __m128i vp0xGHIJKLMNhi = _mm_mulhi_epi16(vxi0xGHIJKLMN, vxk0xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
136 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
138 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
140 const __m128i vp1xGHIJKLMNhi = _mm_mulhi_epi16(vxi1xGHIJKLMN, vxk1xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
165 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
167 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
169 const __m128i vp2xGHIJKLMNhi = _mm_mulhi_epi16(vxi2xGHIJKLMN, vxk2xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
194 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
[all …]
Dup24x9-minmax-sse2-mul16.c107 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
109 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
111 const __m128i vp0xGHIJKLMNhi = _mm_mulhi_epi16(vxi0xGHIJKLMN, vxk0xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
136 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
138 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
140 const __m128i vp1xGHIJKLMNhi = _mm_mulhi_epi16(vxi1xGHIJKLMN, vxk1xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
165 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
167 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
169 const __m128i vp2xGHIJKLMNhi = _mm_mulhi_epi16(vxi2xGHIJKLMN, vxk2xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
194 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
[all …]
Dup8x9-minmax-sse2-mul16.c95 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
108 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
121 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
134 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
147 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
160 const __m128i vp5x01234567hi = _mm_mulhi_epi16(vxi5x01234567, vxk5x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
173 const __m128i vp6x01234567hi = _mm_mulhi_epi16(vxi6x01234567, vxk6x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
186 const __m128i vp7x01234567hi = _mm_mulhi_epi16(vxi7x01234567, vxk7x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
199 const __m128i vp8x01234567hi = _mm_mulhi_epi16(vxi8x01234567, vxk8x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
283 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16()
[all …]
Dup8x9-minmax-ssse3-mul16.c95 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
108 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
121 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
134 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
147 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
160 const __m128i vp5x01234567hi = _mm_mulhi_epi16(vxi5x01234567, vxk5x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
173 const __m128i vp6x01234567hi = _mm_mulhi_epi16(vxi6x01234567, vxk6x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
186 const __m128i vp7x01234567hi = _mm_mulhi_epi16(vxi7x01234567, vxk7x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
199 const __m128i vp8x01234567hi = _mm_mulhi_epi16(vxi8x01234567, vxk8x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
283 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16()
[all …]
/external/XNNPACK/src/qu8-dwconv/
Dup8x9-minmax-sse2.c80 const __m128i vprod0_even = _mm_mulhi_epi16(vxi0, vxk0); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
89 const __m128i vprod1_even = _mm_mulhi_epi16(vxi1, vxk1); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
98 const __m128i vprod2_even = _mm_mulhi_epi16(vxi2, vxk2); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
107 const __m128i vprod3_even = _mm_mulhi_epi16(vxi3, vxk3); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
116 const __m128i vprod4_even = _mm_mulhi_epi16(vxi4, vxk4); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
125 const __m128i vprod5_even = _mm_mulhi_epi16(vxi5, vxk5); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
134 const __m128i vprod6_even = _mm_mulhi_epi16(vxi6, vxk6); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
143 const __m128i vprod7_even = _mm_mulhi_epi16(vxi7, vxk7); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
152 const __m128i vprod8_even = _mm_mulhi_epi16(vxi8, vxk8); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
232 const __m128i vprod0_even = _mm_mulhi_epi16(vxi0, vxk0); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2()
[all …]
/external/libvpx/libvpx/vp8/encoder/x86/
Dvp8_quantize_sse2.c89 y0 = _mm_mulhi_epi16(x0, quant0); in vp8_regular_quantize_b_sse2()
90 y1 = _mm_mulhi_epi16(x1, quant1); in vp8_regular_quantize_b_sse2()
97 y0 = _mm_mulhi_epi16(y0, quant_shift0); in vp8_regular_quantize_b_sse2()
98 y1 = _mm_mulhi_epi16(y1, quant_shift1); in vp8_regular_quantize_b_sse2()
173 y0 = _mm_mulhi_epi16(x0, quant_fast0); in vp8_fast_quantize_b_sse2()
174 y1 = _mm_mulhi_epi16(x1, quant_fast1); in vp8_fast_quantize_b_sse2()
Dquantize_sse4.c76 y0 = _mm_mulhi_epi16(x0, quant0); in vp8_regular_quantize_b_sse4_1()
77 y1 = _mm_mulhi_epi16(x1, quant1); in vp8_regular_quantize_b_sse4_1()
84 y0 = _mm_mulhi_epi16(y0, quant_shift0); in vp8_regular_quantize_b_sse4_1()
85 y1 = _mm_mulhi_epi16(y1, quant_shift1); in vp8_regular_quantize_b_sse4_1()
Dvp8_quantize_ssse3.c73 y0 = _mm_mulhi_epi16(x0, quant_fast0); in vp8_fast_quantize_b_ssse3()
74 y1 = _mm_mulhi_epi16(x1, quant_fast1); in vp8_fast_quantize_b_ssse3()
/external/libhevc/common/x86/
Dihevc_weighted_pred_ssse3_intr.c143 res_temp1_4x32b = _mm_mulhi_epi16(lvl_shift_4x32b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
180 src_temp0_8x16b = _mm_mulhi_epi16(src_temp0_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
181 src_temp1_8x16b = _mm_mulhi_epi16(src_temp1_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
182 src_temp2_8x16b = _mm_mulhi_epi16(src_temp2_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
183 src_temp3_8x16b = _mm_mulhi_epi16(src_temp3_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
283 src_temp0_8x16b = _mm_mulhi_epi16(src_temp0_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
284 src_temp1_8x16b = _mm_mulhi_epi16(src_temp1_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3()
434 res_temp1_4x32b = _mm_mulhi_epi16(lvl_shift_4x32b, wgt0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3()
472 src_temp0_8x16b = _mm_mulhi_epi16(src_temp0_8x16b, wgt0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3()
473 src_temp1_8x16b = _mm_mulhi_epi16(src_temp1_8x16b, wgt0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3()
[all …]
/external/libaom/libaom/aom_dsp/x86/
Dquantize_x86.h44 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff()
46 *coeff = _mm_mulhi_epi16(qcoeff, shift); in calculate_qcoeff()
56 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff_log_scale()
60 tmp1 = _mm_mulhi_epi16(qcoeff, *shift); in calculate_qcoeff_log_scale()
82 const __m128i high = _mm_mulhi_epi16(coeff, dequant); in calculate_dqcoeff_and_store_log_scale()
139 __m128i coeff_vals_hi = _mm_mulhi_epi16(coeff_vals, one); in store_coefficients()
Dquantize_ssse3.c27 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff_64x64()
31 tmp1 = _mm_mulhi_epi16(qcoeff, *shift); in calculate_qcoeff_64x64()
47 const __m128i high = _mm_mulhi_epi16(coeff, dequant); in calculate_dqcoeff_and_store_64x64()
Dbitdepth_conversion_sse2.h29 const __m128i a_hi = _mm_mulhi_epi16(a, one); in store_tran_low()
/external/libvpx/libvpx/vpx_dsp/x86/
Dquantize_sse2.h42 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff()
44 *coeff = _mm_mulhi_epi16(qcoeff, shift); in calculate_qcoeff()
51 const __m128i high = _mm_mulhi_epi16(qcoeff, dequant); in calculate_dqcoeff_and_store()
Dpost_proc_sse2.c53 tmp_1 = _mm_mulhi_epi16(sum, s); in vpx_mbpost_proc_down_sse2()
108 multmp_1 = _mm_mulhi_epi16(sum, sum); in vpx_mbpost_proc_down_sse2()
Dquantize_ssse3.h31 const __m128i high = _mm_mulhi_epi16(coeff, dequant); in calculate_dqcoeff_and_store_32x32()
Dbitdepth_conversion_sse2.h35 const __m128i a_hi = _mm_mulhi_epi16(a, one); in store_tran_low()
/external/libvpx/libvpx/vp9/encoder/x86/
Dvp9_quantize_sse2.c72 qtmp0 = _mm_mulhi_epi16(qcoeff0, quant); in vp9_quantize_fp_sse2()
74 qtmp1 = _mm_mulhi_epi16(qcoeff1, quant); in vp9_quantize_fp_sse2()
142 qtmp0 = _mm_mulhi_epi16(qcoeff0, quant); in vp9_quantize_fp_sse2()
143 qtmp1 = _mm_mulhi_epi16(qcoeff1, quant); in vp9_quantize_fp_sse2()
/external/webp/src/dsp/
Dlossless_enc_sse41.c76 const __m128i A = _mm_mulhi_epi16(r, mults_r); // x dbr in CollectColorBlueTransforms_SSE41()
77 const __m128i B = _mm_mulhi_epi16(g, mults_g); // x dbg in CollectColorBlueTransforms_SSE41()
116 const __m128i B = _mm_mulhi_epi16(g, mults_g); // x dr in CollectColorRedTransforms_SSE41()
Dlossless_enc_sse2.c65 const __m128i D = _mm_mulhi_epi16(C, mults_rb); // x dr x db1 in TransformColor_SSE2()
67 const __m128i F = _mm_mulhi_epi16(E, mults_b2); // x db2 0 0 in TransformColor_SSE2()
102 const __m128i C0 = _mm_mulhi_epi16(A0, mults_r); // x db | 0 0 in CollectColorBlueTransforms_SSE2()
103 const __m128i C1 = _mm_mulhi_epi16(A1, mults_r); in CollectColorBlueTransforms_SSE2()
104 const __m128i D0 = _mm_mulhi_epi16(B0, mults_g); // 0 0 | x db in CollectColorBlueTransforms_SSE2()
105 const __m128i D1 = _mm_mulhi_epi16(B1, mults_g); in CollectColorBlueTransforms_SSE2()
148 const __m128i C0 = _mm_mulhi_epi16(A0, mults_g); // 0 0 | x dr in CollectColorRedTransforms_SSE2()
149 const __m128i C1 = _mm_mulhi_epi16(A1, mults_g); in CollectColorRedTransforms_SSE2()
Ddec_sse2.c90 const __m128i c1 = _mm_mulhi_epi16(in1, k2); in Transform_SSE2()
91 const __m128i c2 = _mm_mulhi_epi16(in3, k1); in Transform_SSE2()
96 const __m128i d1 = _mm_mulhi_epi16(in1, k1); in Transform_SSE2()
97 const __m128i d2 = _mm_mulhi_epi16(in3, k2); in Transform_SSE2()
121 const __m128i c1 = _mm_mulhi_epi16(T1, k2); in Transform_SSE2()
122 const __m128i c2 = _mm_mulhi_epi16(T3, k1); in Transform_SSE2()
127 const __m128i d1 = _mm_mulhi_epi16(T1, k1); in Transform_SSE2()
128 const __m128i d2 = _mm_mulhi_epi16(T3, k2); in Transform_SSE2()
456 const __m128i f9_lo = _mm_mulhi_epi16(f_lo, k9); // Filter (lo) * 9 in DoFilter6_SSE2()
457 const __m128i f9_hi = _mm_mulhi_epi16(f_hi, k9); // Filter (hi) * 9 in DoFilter6_SSE2()

12