// Copyright 2020 Google LLC // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. $assert BATCH_TILE >= 1 $ABC = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ" $assert OP in ["ABS", "NEG", "SQR"] #include $if OP == "ABS": #include #include #include #include $OP_FUNC = { $ "ABS": lambda x: "fabsf(%s)" % x, $ "NEG": lambda x: "-%s" % x, $ "SQR": lambda x: "%s * %s" % (x, x), $}[OP] $PARAMS = { $ "ABS": "xnn_f32_abs_params", $ "NEG": "xnn_f32_neg_params", $ "SQR": "xnn_f32_default_params", $}[OP] void xnn_f32_v${OP.lower()}_ukernel__scalar_x${BATCH_TILE}( size_t n, const float* x, float* y, const union ${PARAMS} params[restrict XNN_MIN_ELEMENTS(1)]) { assert(n != 0); assert(n % sizeof(float) == 0); assert(x != NULL); assert(y != NULL); $if BATCH_TILE > 1: for (; n >= ${BATCH_TILE} * sizeof(float); n -= ${BATCH_TILE} * sizeof(float)) { $for N in range(BATCH_TILE): const float vx${ABC[N]} = x[${N}]; x += ${BATCH_TILE}; $for N in range(BATCH_TILE): const float vy${ABC[N]} = ${OP_FUNC("vx" + ABC[N])}; $for N in range(BATCH_TILE): y[${N}] = vy${ABC[N]}; y += ${BATCH_TILE}; } if XNN_UNLIKELY(n != 0) { $if BATCH_TILE > 2: do { const float vx = *x++; const float vy = ${OP_FUNC("vx")}; *y++ = vy; n -= sizeof(float); } while (n != 0); $else: const float vx = *x; const float vy = ${OP_FUNC("vx")}; *y = vy; } $else: for (; n >= sizeof(float); n -= sizeof(float)) { const float vx = *x++; const float vy = ${OP_FUNC("vx")}; *y++ = vy; } }