Searched refs:o0c0 (Results 1 – 8 of 8) sorted by relevance
/external/XNNPACK/src/f32-conv-hwc2chw/ |
D | 3x3s2p1c3x4-sse-1x1.c | 60 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() local 61 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 66 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 204 _mm_store_ss(o0c0, voc0123); o0c0++; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 283 _mm_store_ss(o0c0, voc0123); o0c0++; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 290 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1()
|
D | 3x3s2p1c3x4-neonfma-2x2.c | 73 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() local 75 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 83 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 346 vst1_f32(o0c0, vget_low_f32(vo0c01)); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 606 vst1_f32(o0c0, vget_low_f32(vo0c01)); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 618 vst1q_lane_f32(o0c0, vo0x0, 0); o0c0 += 1; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 626 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2()
|
D | 3x3s2p1c3x4-scalar-1x1.c | 58 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() local 59 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 64 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 419 *o0c0++ = voc0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 643 *o0c0++ = voc0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 650 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1()
|
D | 3x3s2p1c3x4-neon-2x2.c | 73 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() local 75 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 83 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 344 vst1_f32(o0c0, vget_low_f32(vo0c0123.val[0])); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 602 vst1_f32(o0c0, vget_low_f32(vo0c0123.val[0])); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 614 vst1q_lane_f32(o0c0, vo0x0, 0); o0c0 += 1; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 622 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2()
|
D | 3x3s2p1c3x4-wasmsimd-2x2.c | 73 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() local 75 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 83 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 345 *((double*) o0c0) = wasm_f64x2_extract_lane(vo0c01, 0); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 605 *((double*) o0c0) = wasm_f64x2_extract_lane(vo0c01, 0); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 616 *o0c0 = wasm_f32x4_extract_lane(vo0x0, 0); o0c0 += 1; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 624 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2()
|
D | 3x3s2p1c3x4-sse-2x2.c | 73 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() local 75 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 83 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 346 _mm_storel_pi((__m64 *)o0c0, vo0c01); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 606 _mm_storel_pi((__m64 *)o0c0, vo0c01); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 618 _mm_store_ss(o0c0, _mm_shuffle_ps(vo0x0, vo0x0, _MM_SHUFFLE(0, 0, 0, 0))); o0c0 += 1; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 626 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2()
|
/external/XNNPACK/src/f16-conv-hwc2chw/ |
D | 3x3s2p1c3x4-neonfp16arith-2x2.c | 73 __fp16* o0c0 = output0; in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() local 75 __fp16* o0c1 = (__fp16*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() 83 o0c1 = o0c0; in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() 346 vst1_lane_u32((void*) o0c0, vreinterpret_u32_f16(vo0c01), 0); o0c0 += 2; in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() 607 vst1_lane_u32((void*) o0c0, vreinterpret_u32_f16(vo0c01), 0); o0c0 += 2; in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() 619 vst1_lane_f16(o0c0, vo0x0, 0); o0c0 += 1; in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() 627 o0c0 = (__fp16*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2()
|
/external/XNNPACK/src/amalgam/ |
D | sse.c | 581 float* o0c0 = output0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() local 583 float* o0c1 = (float*) ((uintptr_t) o0c0 + output_channel_stride); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 591 o0c1 = o0c0; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 854 _mm_storel_pi((__m64 *)o0c0, vo0c01); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 1114 _mm_storel_pi((__m64 *)o0c0, vo0c01); o0c0 += 2; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 1126 _mm_store_ss(o0c0, _mm_shuffle_ps(vo0x0, vo0x0, _MM_SHUFFLE(0, 0, 0, 0))); o0c0 += 1; in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 1134 o0c0 = (float*) ((uintptr_t) o0c0 + output_channel_increment); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2()
|