| /external/XNNPACK/src/s8-ibilinear/gen/ |
| D | neon-c16.c | 73 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c16() local 83 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c16() local 125 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c16() local 131 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c16() local 165 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c16() local 171 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c16() local
|
| D | neon-c8.c | 62 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c8() local 68 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c8() local 102 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c8() local 108 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_s8_ibilinear_ukernel__neon_c8() local
|
| D | sse2-c16.c | 83 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse2_c16() local 136 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse2_c16() local 174 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse2_c16() local
|
| D | sse41-c16.c | 74 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse41_c16() local 118 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse41_c16() local 149 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse41_c16() local
|
| D | wasmsimd-dot16x2-c16.c | 72 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_s8_ibilinear_ukernel__wasmsimd_dot16x2_c16() local 115 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_s8_ibilinear_ukernel__wasmsimd_dot16x2_c16() local 145 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_s8_ibilinear_ukernel__wasmsimd_dot16x2_c16() local
|
| D | wasmsimd-mul32-c16.c | 69 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_s8_ibilinear_ukernel__wasmsimd_mul32_c16() local 116 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_s8_ibilinear_ukernel__wasmsimd_mul32_c16() local 148 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_s8_ibilinear_ukernel__wasmsimd_mul32_c16() local
|
| D | sse41-c8.c | 66 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse41_c8() local 97 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse41_c8() local
|
| D | wasmsimd-dot16x2-c8.c | 64 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_s8_ibilinear_ukernel__wasmsimd_dot16x2_c8() local 94 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_s8_ibilinear_ukernel__wasmsimd_dot16x2_c8() local
|
| D | sse2-c8.c | 71 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse2_c8() local 109 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_s8_ibilinear_ukernel__sse2_c8() local
|
| /external/XNNPACK/src/u8-ibilinear/gen/ |
| D | neon-c16.c | 73 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c16() local 83 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c16() local 125 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c16() local 131 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c16() local 165 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c16() local 171 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c16() local
|
| D | neon-c8.c | 62 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c8() local 68 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c8() local 102 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c8() local 108 …const int32x4_t vd0123 = vmlal_s16(vshll_n_s16(vget_low_s16(vdl01234567), 11), vget_low_s16(vdd012… in xnn_u8_ibilinear_ukernel__neon_c8() local
|
| D | wasmsimd-dot16x2-c16.c | 72 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_u8_ibilinear_ukernel__wasmsimd_dot16x2_c16() local 115 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_u8_ibilinear_ukernel__wasmsimd_dot16x2_c16() local 145 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_u8_ibilinear_ukernel__wasmsimd_dot16x2_c16() local
|
| D | sse41-c16.c | 74 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse41_c16() local 118 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse41_c16() local 149 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse41_c16() local
|
| D | sse2-c16.c | 84 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse2_c16() local 138 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse2_c16() local 177 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse2_c16() local
|
| D | wasmsimd-mul32-c16.c | 69 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_u8_ibilinear_ukernel__wasmsimd_mul32_c16() local 116 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_u8_ibilinear_ukernel__wasmsimd_mul32_c16() local 148 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_u8_ibilinear_ukernel__wasmsimd_mul32_c16() local
|
| D | wasmsimd-dot16x2-c8.c | 64 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_u8_ibilinear_ukernel__wasmsimd_dot16x2_c8() local 94 …const v128_t vd0123 = wasm_i32x4_dot_i16x8(wasm_v16x8_shuffle(vdr01234567, vdl01234567, 0, 8, 1, 9… in xnn_u8_ibilinear_ukernel__wasmsimd_dot16x2_c8() local
|
| D | sse41-c8.c | 66 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse41_c8() local 97 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse41_c8() local
|
| D | sse2-c8.c | 72 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse2_c8() local 111 const __m128i vd0123 = _mm_madd_epi16(_mm_unpacklo_epi16(vdr01234567, vdl01234567), valphah); in xnn_u8_ibilinear_ukernel__sse2_c8() local
|
| D | wasmsimd-mul32-c8.c | 61 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_u8_ibilinear_ukernel__wasmsimd_mul32_c8() local 93 …const v128_t vd0123 = wasm_i32x4_add(wasm_i32x4_shl(wasm_i32x4_extend_low_i16x8(vdl01234567), 11),… in xnn_u8_ibilinear_ukernel__wasmsimd_mul32_c8() local
|
| /external/XNNPACK/src/f32-ibilinear/gen/ |
| D | neon-c8.c | 61 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neon_c8() local 82 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neon_c8() local 101 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neon_c8() local
|
| D | sse-c8.c | 68 const __m128 vd0123 = _mm_sub_ps(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__sse_c8() local 94 const __m128 vd0123 = _mm_sub_ps(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__sse_c8() local 113 const __m128 vd0123 = _mm_sub_ps(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__sse_c8() local
|
| D | neonfma-c8.c | 72 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neonfma_c8() local 103 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neonfma_c8() local 131 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neonfma_c8() local
|
| D | neon-c4.c | 53 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neon_c4() local 71 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neon_c4() local
|
| D | sse-c4.c | 60 const __m128 vd0123 = _mm_sub_ps(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__sse_c4() local 79 const __m128 vd0123 = _mm_sub_ps(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__sse_c4() local
|
| D | neonfma-c4.c | 62 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neonfma_c4() local 89 const float32x4_t vd0123 = vsubq_f32(vb0123, vt0123); in xnn_f32_ibilinear_ukernel__neonfma_c4() local
|