/external/XNNPACK/src/qs8-dwconv/gen/ |
D | up16x9-minmax-wasmsimd-mul16.c | 245 const v128_t vq31prodCDEF = wasm_v32x4_shuffle(vprodCD, vprodEF, 1, 3, 5, 7); in xnn_qs8_dwconv_minmax_ukernel_up16x9__wasmsimd_mul16() local 251 …v128_t vremCDEF = wasm_i32x4_add(wasm_v128_and(vq31prodCDEF, vremainder_mask), wasm_i32x4_shr(vq31… in xnn_qs8_dwconv_minmax_ukernel_up16x9__wasmsimd_mul16() 258 …vaccCDEF = wasm_i32x4_sub(wasm_i32x4_shr(vq31prodCDEF, vshift), wasm_i32x4_gt(vremCDEF, vthreshold… in xnn_qs8_dwconv_minmax_ukernel_up16x9__wasmsimd_mul16()
|
D | up24x9-minmax-wasmsimd-mul16.c | 302 const v128_t vq31prodCDEF = wasm_v32x4_shuffle(vprodCD, vprodEF, 1, 3, 5, 7); in xnn_qs8_dwconv_minmax_ukernel_up24x9__wasmsimd_mul16() local 310 …v128_t vremCDEF = wasm_i32x4_add(wasm_v128_and(vq31prodCDEF, vremainder_mask), wasm_i32x4_shr(vq31… in xnn_qs8_dwconv_minmax_ukernel_up24x9__wasmsimd_mul16() 319 …vaccCDEF = wasm_i32x4_sub(wasm_i32x4_shr(vq31prodCDEF, vshift), wasm_i32x4_gt(vremCDEF, vthreshold… in xnn_qs8_dwconv_minmax_ukernel_up24x9__wasmsimd_mul16()
|
D | up16x9-minmax-sse41-mul16.c | 308 const __m128i vq31prodCDEF = _mm_blend_epi16(vq31prodCE, vq31prodDF, 0xCC); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() local 318 …_mm_add_epi32(_mm_and_si128(vq31prodCDEF, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), v… in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16() 329 …_mm_sub_epi32(_mm_sra_epi32(vq31prodCDEF, vshift), _mm_cmpgt_epi32(vremCDEF, vremainder_threshold)… in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse41_mul16()
|
D | up16x9-minmax-ssse3-mul16.c | 345 const __m128i vq31prodCDEF = _mm_shuffle_epi32(vq31prodCEDF, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() local 355 …_mm_add_epi32(_mm_and_si128(vq31prodCDEF, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), v… in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16() 366 …_mm_sub_epi32(_mm_sra_epi32(vq31prodCDEF, vshift), _mm_cmpgt_epi32(vremCDEF, vremainder_threshold)… in xnn_qs8_dwconv_minmax_ukernel_up16x9__ssse3_mul16()
|
D | up16x9-minmax-sse2-mul16.c | 345 const __m128i vq31prodCDEF = _mm_shuffle_epi32(vq31prodCEDF, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() local 355 …_mm_add_epi32(_mm_and_si128(vq31prodCDEF, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), v… in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16() 366 …_mm_sub_epi32(_mm_sra_epi32(vq31prodCDEF, vshift), _mm_cmpgt_epi32(vremCDEF, vremainder_threshold)… in xnn_qs8_dwconv_minmax_ukernel_up16x9__sse2_mul16()
|
D | up24x9-minmax-sse41-mul16.c | 392 const __m128i vq31prodCDEF = _mm_blend_epi16(vq31prodCE, vq31prodDF, 0xCC); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() local 404 …_mm_add_epi32(_mm_and_si128(vq31prodCDEF, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), v… in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16() 419 …_mm_sub_epi32(_mm_sra_epi32(vq31prodCDEF, vshift), _mm_cmpgt_epi32(vremCDEF, vremainder_threshold)… in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse41_mul16()
|
D | up24x9-minmax-ssse3-mul16.c | 445 const __m128i vq31prodCDEF = _mm_shuffle_epi32(vq31prodCEDF, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() local 457 …_mm_add_epi32(_mm_and_si128(vq31prodCDEF, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), v… in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16() 472 …_mm_sub_epi32(_mm_sra_epi32(vq31prodCDEF, vshift), _mm_cmpgt_epi32(vremCDEF, vremainder_threshold)… in xnn_qs8_dwconv_minmax_ukernel_up24x9__ssse3_mul16()
|
D | up24x9-minmax-sse2-mul16.c | 445 const __m128i vq31prodCDEF = _mm_shuffle_epi32(vq31prodCEDF, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() local 457 …_mm_add_epi32(_mm_and_si128(vq31prodCDEF, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), v… in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16() 472 …_mm_sub_epi32(_mm_sra_epi32(vq31prodCDEF, vshift), _mm_cmpgt_epi32(vremCDEF, vremainder_threshold)… in xnn_qs8_dwconv_minmax_ukernel_up24x9__sse2_mul16()
|