/external/XNNPACK/src/qs8-dwconv/gen/ |
D | up24x9-minmax-sse41-mul16.c | 107 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 109 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 111 const __m128i vp0xGHIJKLMNhi = _mm_mulhi_epi16(vxi0xGHIJKLMN, vxk0xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 136 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 138 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 140 const __m128i vp1xGHIJKLMNhi = _mm_mulhi_epi16(vxi1xGHIJKLMN, vxk1xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 165 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 167 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 169 const __m128i vp2xGHIJKLMNhi = _mm_mulhi_epi16(vxi2xGHIJKLMN, vxk2xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 194 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() [all …]
|
D | up16x9-minmax-sse41-mul16.c | 101 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 103 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 122 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 124 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 143 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 145 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 164 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 166 const __m128i vp3x89ABCDEFhi = _mm_mulhi_epi16(vxi3x89ABCDEF, vxk3x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 185 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 187 const __m128i vp4x89ABCDEFhi = _mm_mulhi_epi16(vxi4x89ABCDEF, vxk4x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() [all …]
|
D | up8x9-minmax-sse41-mul16.c | 95 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 108 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 121 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 134 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 147 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 160 const __m128i vp5x01234567hi = _mm_mulhi_epi16(vxi5x01234567, vxk5x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 173 const __m128i vp6x01234567hi = _mm_mulhi_epi16(vxi6x01234567, vxk6x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 186 const __m128i vp7x01234567hi = _mm_mulhi_epi16(vxi7x01234567, vxk7x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 199 const __m128i vp8x01234567hi = _mm_mulhi_epi16(vxi8x01234567, vxk8x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() 262 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse41_mul16() [all …]
|
D | up16x9-minmax-ssse3-mul16.c | 101 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 103 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 122 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 124 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 143 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 145 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 164 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 166 const __m128i vp3x89ABCDEFhi = _mm_mulhi_epi16(vxi3x89ABCDEF, vxk3x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 185 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 187 const __m128i vp4x89ABCDEFhi = _mm_mulhi_epi16(vxi4x89ABCDEF, vxk4x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() [all …]
|
D | up16x9-minmax-sse2-mul16.c | 101 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 103 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 122 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 124 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 143 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 145 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 164 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 166 const __m128i vp3x89ABCDEFhi = _mm_mulhi_epi16(vxi3x89ABCDEF, vxk3x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 185 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 187 const __m128i vp4x89ABCDEFhi = _mm_mulhi_epi16(vxi4x89ABCDEF, vxk4x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() [all …]
|
D | up24x9-minmax-ssse3-mul16.c | 107 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 109 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 111 const __m128i vp0xGHIJKLMNhi = _mm_mulhi_epi16(vxi0xGHIJKLMN, vxk0xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 136 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 138 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 140 const __m128i vp1xGHIJKLMNhi = _mm_mulhi_epi16(vxi1xGHIJKLMN, vxk1xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 165 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 167 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 169 const __m128i vp2xGHIJKLMNhi = _mm_mulhi_epi16(vxi2xGHIJKLMN, vxk2xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 194 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() [all …]
|
D | up24x9-minmax-sse2-mul16.c | 107 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 109 const __m128i vp0x89ABCDEFhi = _mm_mulhi_epi16(vxi0x89ABCDEF, vxk0x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 111 const __m128i vp0xGHIJKLMNhi = _mm_mulhi_epi16(vxi0xGHIJKLMN, vxk0xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 136 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 138 const __m128i vp1x89ABCDEFhi = _mm_mulhi_epi16(vxi1x89ABCDEF, vxk1x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 140 const __m128i vp1xGHIJKLMNhi = _mm_mulhi_epi16(vxi1xGHIJKLMN, vxk1xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 165 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 167 const __m128i vp2x89ABCDEFhi = _mm_mulhi_epi16(vxi2x89ABCDEF, vxk2x89ABCDEF); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 169 const __m128i vp2xGHIJKLMNhi = _mm_mulhi_epi16(vxi2xGHIJKLMN, vxk2xGHIJKLMN); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 194 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() [all …]
|
D | up8x9-minmax-sse2-mul16.c | 95 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 108 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 121 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 134 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 147 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 160 const __m128i vp5x01234567hi = _mm_mulhi_epi16(vxi5x01234567, vxk5x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 173 const __m128i vp6x01234567hi = _mm_mulhi_epi16(vxi6x01234567, vxk6x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 186 const __m128i vp7x01234567hi = _mm_mulhi_epi16(vxi7x01234567, vxk7x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 199 const __m128i vp8x01234567hi = _mm_mulhi_epi16(vxi8x01234567, vxk8x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() 283 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__sse2_mul16() [all …]
|
D | up8x9-minmax-ssse3-mul16.c | 95 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 108 const __m128i vp1x01234567hi = _mm_mulhi_epi16(vxi1x01234567, vxk1x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 121 const __m128i vp2x01234567hi = _mm_mulhi_epi16(vxi2x01234567, vxk2x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 134 const __m128i vp3x01234567hi = _mm_mulhi_epi16(vxi3x01234567, vxk3x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 147 const __m128i vp4x01234567hi = _mm_mulhi_epi16(vxi4x01234567, vxk4x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 160 const __m128i vp5x01234567hi = _mm_mulhi_epi16(vxi5x01234567, vxk5x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 173 const __m128i vp6x01234567hi = _mm_mulhi_epi16(vxi6x01234567, vxk6x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 186 const __m128i vp7x01234567hi = _mm_mulhi_epi16(vxi7x01234567, vxk7x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 199 const __m128i vp8x01234567hi = _mm_mulhi_epi16(vxi8x01234567, vxk8x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() 283 const __m128i vp0x01234567hi = _mm_mulhi_epi16(vxi0x01234567, vxk0x01234567); in xnn_qs8_dwconv_minmax_ukernel_up8x9__ssse3_mul16() [all …]
|
/external/XNNPACK/src/qu8-dwconv/ |
D | up8x9-minmax-sse2.c | 80 const __m128i vprod0_even = _mm_mulhi_epi16(vxi0, vxk0); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 89 const __m128i vprod1_even = _mm_mulhi_epi16(vxi1, vxk1); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 98 const __m128i vprod2_even = _mm_mulhi_epi16(vxi2, vxk2); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 107 const __m128i vprod3_even = _mm_mulhi_epi16(vxi3, vxk3); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 116 const __m128i vprod4_even = _mm_mulhi_epi16(vxi4, vxk4); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 125 const __m128i vprod5_even = _mm_mulhi_epi16(vxi5, vxk5); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 134 const __m128i vprod6_even = _mm_mulhi_epi16(vxi6, vxk6); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 143 const __m128i vprod7_even = _mm_mulhi_epi16(vxi7, vxk7); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 152 const __m128i vprod8_even = _mm_mulhi_epi16(vxi8, vxk8); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 232 const __m128i vprod0_even = _mm_mulhi_epi16(vxi0, vxk0); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() [all …]
|
/external/libvpx/libvpx/vp8/encoder/x86/ |
D | vp8_quantize_sse2.c | 89 y0 = _mm_mulhi_epi16(x0, quant0); in vp8_regular_quantize_b_sse2() 90 y1 = _mm_mulhi_epi16(x1, quant1); in vp8_regular_quantize_b_sse2() 97 y0 = _mm_mulhi_epi16(y0, quant_shift0); in vp8_regular_quantize_b_sse2() 98 y1 = _mm_mulhi_epi16(y1, quant_shift1); in vp8_regular_quantize_b_sse2() 173 y0 = _mm_mulhi_epi16(x0, quant_fast0); in vp8_fast_quantize_b_sse2() 174 y1 = _mm_mulhi_epi16(x1, quant_fast1); in vp8_fast_quantize_b_sse2()
|
D | quantize_sse4.c | 76 y0 = _mm_mulhi_epi16(x0, quant0); in vp8_regular_quantize_b_sse4_1() 77 y1 = _mm_mulhi_epi16(x1, quant1); in vp8_regular_quantize_b_sse4_1() 84 y0 = _mm_mulhi_epi16(y0, quant_shift0); in vp8_regular_quantize_b_sse4_1() 85 y1 = _mm_mulhi_epi16(y1, quant_shift1); in vp8_regular_quantize_b_sse4_1()
|
D | vp8_quantize_ssse3.c | 73 y0 = _mm_mulhi_epi16(x0, quant_fast0); in vp8_fast_quantize_b_ssse3() 74 y1 = _mm_mulhi_epi16(x1, quant_fast1); in vp8_fast_quantize_b_ssse3()
|
/external/libhevc/common/x86/ |
D | ihevc_weighted_pred_ssse3_intr.c | 143 res_temp1_4x32b = _mm_mulhi_epi16(lvl_shift_4x32b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 180 src_temp0_8x16b = _mm_mulhi_epi16(src_temp0_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 181 src_temp1_8x16b = _mm_mulhi_epi16(src_temp1_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 182 src_temp2_8x16b = _mm_mulhi_epi16(src_temp2_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 183 src_temp3_8x16b = _mm_mulhi_epi16(src_temp3_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 283 src_temp0_8x16b = _mm_mulhi_epi16(src_temp0_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 284 src_temp1_8x16b = _mm_mulhi_epi16(src_temp1_8x16b, wgt0_8x16b); in ihevc_weighted_pred_uni_ssse3() 434 res_temp1_4x32b = _mm_mulhi_epi16(lvl_shift_4x32b, wgt0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3() 472 src_temp0_8x16b = _mm_mulhi_epi16(src_temp0_8x16b, wgt0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3() 473 src_temp1_8x16b = _mm_mulhi_epi16(src_temp1_8x16b, wgt0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3() [all …]
|
/external/libaom/libaom/aom_dsp/x86/ |
D | quantize_x86.h | 44 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff() 46 *coeff = _mm_mulhi_epi16(qcoeff, shift); in calculate_qcoeff() 56 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff_log_scale() 60 tmp1 = _mm_mulhi_epi16(qcoeff, *shift); in calculate_qcoeff_log_scale() 82 const __m128i high = _mm_mulhi_epi16(coeff, dequant); in calculate_dqcoeff_and_store_log_scale() 139 __m128i coeff_vals_hi = _mm_mulhi_epi16(coeff_vals, one); in store_coefficients()
|
D | quantize_ssse3.c | 27 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff_64x64() 31 tmp1 = _mm_mulhi_epi16(qcoeff, *shift); in calculate_qcoeff_64x64() 47 const __m128i high = _mm_mulhi_epi16(coeff, dequant); in calculate_dqcoeff_and_store_64x64()
|
D | bitdepth_conversion_sse2.h | 29 const __m128i a_hi = _mm_mulhi_epi16(a, one); in store_tran_low()
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | quantize_sse2.h | 42 tmp = _mm_mulhi_epi16(qcoeff, quant); in calculate_qcoeff() 44 *coeff = _mm_mulhi_epi16(qcoeff, shift); in calculate_qcoeff() 51 const __m128i high = _mm_mulhi_epi16(qcoeff, dequant); in calculate_dqcoeff_and_store()
|
D | post_proc_sse2.c | 53 tmp_1 = _mm_mulhi_epi16(sum, s); in vpx_mbpost_proc_down_sse2() 108 multmp_1 = _mm_mulhi_epi16(sum, sum); in vpx_mbpost_proc_down_sse2()
|
D | quantize_ssse3.h | 31 const __m128i high = _mm_mulhi_epi16(coeff, dequant); in calculate_dqcoeff_and_store_32x32()
|
D | bitdepth_conversion_sse2.h | 35 const __m128i a_hi = _mm_mulhi_epi16(a, one); in store_tran_low()
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_quantize_sse2.c | 72 qtmp0 = _mm_mulhi_epi16(qcoeff0, quant); in vp9_quantize_fp_sse2() 74 qtmp1 = _mm_mulhi_epi16(qcoeff1, quant); in vp9_quantize_fp_sse2() 142 qtmp0 = _mm_mulhi_epi16(qcoeff0, quant); in vp9_quantize_fp_sse2() 143 qtmp1 = _mm_mulhi_epi16(qcoeff1, quant); in vp9_quantize_fp_sse2()
|
/external/webp/src/dsp/ |
D | lossless_enc_sse41.c | 76 const __m128i A = _mm_mulhi_epi16(r, mults_r); // x dbr in CollectColorBlueTransforms_SSE41() 77 const __m128i B = _mm_mulhi_epi16(g, mults_g); // x dbg in CollectColorBlueTransforms_SSE41() 116 const __m128i B = _mm_mulhi_epi16(g, mults_g); // x dr in CollectColorRedTransforms_SSE41()
|
D | lossless_enc_sse2.c | 65 const __m128i D = _mm_mulhi_epi16(C, mults_rb); // x dr x db1 in TransformColor_SSE2() 67 const __m128i F = _mm_mulhi_epi16(E, mults_b2); // x db2 0 0 in TransformColor_SSE2() 102 const __m128i C0 = _mm_mulhi_epi16(A0, mults_r); // x db | 0 0 in CollectColorBlueTransforms_SSE2() 103 const __m128i C1 = _mm_mulhi_epi16(A1, mults_r); in CollectColorBlueTransforms_SSE2() 104 const __m128i D0 = _mm_mulhi_epi16(B0, mults_g); // 0 0 | x db in CollectColorBlueTransforms_SSE2() 105 const __m128i D1 = _mm_mulhi_epi16(B1, mults_g); in CollectColorBlueTransforms_SSE2() 148 const __m128i C0 = _mm_mulhi_epi16(A0, mults_g); // 0 0 | x dr in CollectColorRedTransforms_SSE2() 149 const __m128i C1 = _mm_mulhi_epi16(A1, mults_g); in CollectColorRedTransforms_SSE2()
|
D | dec_sse2.c | 90 const __m128i c1 = _mm_mulhi_epi16(in1, k2); in Transform_SSE2() 91 const __m128i c2 = _mm_mulhi_epi16(in3, k1); in Transform_SSE2() 96 const __m128i d1 = _mm_mulhi_epi16(in1, k1); in Transform_SSE2() 97 const __m128i d2 = _mm_mulhi_epi16(in3, k2); in Transform_SSE2() 121 const __m128i c1 = _mm_mulhi_epi16(T1, k2); in Transform_SSE2() 122 const __m128i c2 = _mm_mulhi_epi16(T3, k1); in Transform_SSE2() 127 const __m128i d1 = _mm_mulhi_epi16(T1, k1); in Transform_SSE2() 128 const __m128i d2 = _mm_mulhi_epi16(T3, k2); in Transform_SSE2() 456 const __m128i f9_lo = _mm_mulhi_epi16(f_lo, k9); // Filter (lo) * 9 in DoFilter6_SSE2() 457 const __m128i f9_hi = _mm_mulhi_epi16(f_hi, k9); // Filter (hi) * 9 in DoFilter6_SSE2()
|