/external/XNNPACK/src/f32-dwconv-spchw/ |
D | 3x3s2p1-scalar.c | 51 float vi0x0 = 0.0f; in xnn_f32_dwconv_spchw_ukernel_3x3s2p1__scalar() local 64 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2; in xnn_f32_dwconv_spchw_ukernel_3x3s2p1__scalar() 65 vi0x0 = vi0x2; in xnn_f32_dwconv_spchw_ukernel_3x3s2p1__scalar() 84 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1; in xnn_f32_dwconv_spchw_ukernel_3x3s2p1__scalar()
|
D | 3x3p1-scalar.c | 51 float vi0x0 = 0.0f; in xnn_f32_dwconv_spchw_ukernel_3x3p1__scalar() local 64 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2; in xnn_f32_dwconv_spchw_ukernel_3x3p1__scalar() 65 vi0x0 = vi0x1; in xnn_f32_dwconv_spchw_ukernel_3x3p1__scalar() 84 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1; in xnn_f32_dwconv_spchw_ukernel_3x3p1__scalar()
|
D | 5x5p2-scalar.c | 71 float vi0x0 = 0.0f; in xnn_f32_dwconv_spchw_ukernel_5x5p2__scalar() local 108 …const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2 + vw4 * vi0x3 + vw5 * vi0x4; in xnn_f32_dwconv_spchw_ukernel_5x5p2__scalar() 109 vi0x0 = vi0x1; in xnn_f32_dwconv_spchw_ukernel_5x5p2__scalar() 142 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2 + vw4 * vi0x3; in xnn_f32_dwconv_spchw_ukernel_5x5p2__scalar() 143 vi0x0 = vi0x1; in xnn_f32_dwconv_spchw_ukernel_5x5p2__scalar() 173 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2; in xnn_f32_dwconv_spchw_ukernel_5x5p2__scalar()
|
D | 5x5s2p2-scalar.c | 71 float vi0x0 = 0.0f; in xnn_f32_dwconv_spchw_ukernel_5x5s2p2__scalar() local 102 …const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2 + vw4 * vi0x3 + vw5 * vi0x4; in xnn_f32_dwconv_spchw_ukernel_5x5s2p2__scalar() 103 vi0x0 = vi0x2; in xnn_f32_dwconv_spchw_ukernel_5x5s2p2__scalar() 137 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2 + vw4 * vi0x3; in xnn_f32_dwconv_spchw_ukernel_5x5s2p2__scalar() 151 const float vrow0_accum = vw1 * vi0x0 + vw2 * vi0x1 + vw3 * vi0x2; in xnn_f32_dwconv_spchw_ukernel_5x5s2p2__scalar()
|
/external/XNNPACK/src/f32-prelu/gen/ |
D | scalar-2x4.c | 55 const float vi0x0 = i0[0]; in xnn_f32_prelu_ukernel__scalar_2x4() local 66 float vacc0x0 = signbit(vi0x0) ? vi0x0 * vw0 : vi0x0; in xnn_f32_prelu_ukernel__scalar_2x4()
|
D | wasm-2x4.c | 55 const float vi0x0 = i0[0]; in xnn_f32_prelu_ukernel__wasm_2x4() local 66 float vacc0x0 = signbit(vi0x0) ? vi0x0 * vw0 : vi0x0; in xnn_f32_prelu_ukernel__wasm_2x4()
|
/external/XNNPACK/src/f32-dwconv/gen/ |
D | up2x4-scalar.c | 49 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x4__scalar() local 54 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x4__scalar()
|
D | up2x4-wasm.c | 49 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x4__wasm() local 54 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x4__wasm()
|
D | up2x4-wasm-acc2.c | 49 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x4__wasm_acc2() local 54 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x4__wasm_acc2()
|
D | up2x4-scalar-acc2.c | 49 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x4__scalar_acc2() local 54 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x4__scalar_acc2()
|
D | up2x9-wasm.c | 59 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x9__wasm() local 64 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x9__wasm()
|
D | up2x9-scalar.c | 59 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x9__scalar() local 64 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x9__scalar()
|
D | up2x9-scalar-acc2.c | 59 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x9__scalar_acc2() local 64 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x9__scalar_acc2()
|
D | up2x9-wasm-acc2.c | 59 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x9__wasm_acc2() local 64 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x9__wasm_acc2()
|
D | up2x25-scalar.c | 91 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x25__scalar() local 96 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x25__scalar()
|
D | up2x25-scalar-acc2.c | 91 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x25__scalar_acc2() local 96 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x25__scalar_acc2()
|
D | up2x25-wasm-acc2.c | 91 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x25__wasm_acc2() local 96 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x25__wasm_acc2()
|
D | up2x25-wasm.c | 91 const float vi0x0 = i0[0]; in xnn_f32_dwconv_ukernel_up2x25__wasm() local 96 vacc0p0 += vi0x0 * vk0x0; in xnn_f32_dwconv_ukernel_up2x25__wasm()
|
/external/XNNPACK/src/f32-conv-hwc/ |
D | 3x3s2p1c3x8-neonfma-2x2.c | 77 float32x4_t vi0x0 = vmovq_n_f32(0.0f); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() local 104 vo0x0c0123 = vfmaq_laneq_f32(vo0x0c0123, vk00c0x0123, vi0x0, 1); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 106 vo0x0c4567 = vfmaq_laneq_f32(vo0x0c4567, vk00c0x4567, vi0x0, 1); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 150 vo0x0c0123 = vfmaq_laneq_f32(vo0x0c0123, vk00c1x0123, vi0x0, 2); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 152 vo0x0c4567 = vfmaq_laneq_f32(vo0x0c4567, vk00c1x4567, vi0x0, 2); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 189 vo0x0c0123 = vfmaq_laneq_f32(vo0x0c0123, vk00c2x0123, vi0x0, 3); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 191 vo0x0c4567 = vfmaq_laneq_f32(vo0x0c4567, vk00c2x4567, vi0x0, 3); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 466 vi0x0 = vi0x3; in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 567 vo0x0c0123 = vfmaq_laneq_f32(vo0x0c0123, vk00c0x0123, vi0x0, 1); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() 569 vo0x0c4567 = vfmaq_laneq_f32(vo0x0c4567, vk00c0x4567, vi0x0, 1); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() [all …]
|
D | 3x3s2p1c3x4-neonfma-2x2.c | 77 float32x4_t vi0x0 = vmovq_n_f32(0.0f); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() local 99 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c0, vi0x0, 1); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 127 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c1, vi0x0, 2); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 148 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c2, vi0x0, 3); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 300 vi0x0 = vi0x3; in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 371 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c0, vi0x0, 1); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 412 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c1, vi0x0, 2); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 433 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c2, vi0x0, 3); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2()
|
/external/XNNPACK/src/f32-conv-hwc2spchw/ |
D | 3x3s2p1c3x4-neonfma-2x2.c | 96 float32x4_t vi0x0 = vmovq_n_f32(0.0f); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() local 118 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c0, vi0x0, 1); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() 146 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c1, vi0x0, 2); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() 167 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c2, vi0x0, 3); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() 319 vi0x0 = vi0x3; in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() 367 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c0, vi0x0, 1); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() 408 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c1, vi0x0, 2); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2() 429 vo0x0 = vfmaq_laneq_f32(vo0x0, vk00c2, vi0x0, 3); in xnn_f32_conv_hwc2spchw_ukernel_3x3s2p1c3x4__neonfma_2x2()
|