• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Auto-generated file. Do not edit!
2 //   Template: src/f32-clamp/scalar.c.in
3 //   Generator: tools/xngen
4 //
5 // Copyright 2020 Google LLC
6 //
7 // This source code is licensed under the BSD-style license found in the
8 // LICENSE file in the root directory of this source tree.
9 
10 #include <assert.h>
11 
12 #include <xnnpack/clamp.h>
13 #include <xnnpack/common.h>
14 #include <xnnpack/math.h>
15 
16 
xnn_f32_clamp_ukernel__scalar_x4(size_t n,const float * x,float * y,const union xnn_f32_minmax_params params[restrict XNN_MIN_ELEMENTS (1)])17 void xnn_f32_clamp_ukernel__scalar_x4(
18     size_t n,
19     const float* x,
20     float* y,
21     const union xnn_f32_minmax_params params[restrict XNN_MIN_ELEMENTS(1)])
22 {
23   assert(n != 0);
24   assert(n % sizeof(float) == 0);
25   assert(x != NULL);
26   assert(y != NULL);
27 
28   const float vy_min = params->scalar.min;
29   const float vy_max = params->scalar.max;
30 
31   for (; n >= 4 * sizeof(float); n -= 4 * sizeof(float)) {
32     float vacc0 = x[0];
33     float vacc1 = x[1];
34     float vacc2 = x[2];
35     float vacc3 = x[3];
36     x += 4;
37 
38     vacc0 = math_max_f32(vacc0, vy_min);
39     vacc1 = math_max_f32(vacc1, vy_min);
40     vacc2 = math_max_f32(vacc2, vy_min);
41     vacc3 = math_max_f32(vacc3, vy_min);
42 
43     vacc0 = math_min_f32(vacc0, vy_max);
44     vacc1 = math_min_f32(vacc1, vy_max);
45     vacc2 = math_min_f32(vacc2, vy_max);
46     vacc3 = math_min_f32(vacc3, vy_max);
47 
48     y[0] = vacc0;
49     y[1] = vacc1;
50     y[2] = vacc2;
51     y[3] = vacc3;
52     y += 4;
53   }
54   if XNN_UNLIKELY(n != 0) {
55     do {
56       float vacc = *x++;
57       vacc = math_max_f32(vacc, vy_min);
58       vacc = math_min_f32(vacc, vy_max);
59       *y++ = vacc;
60       n -= sizeof(float);
61     } while (n != 0);
62   }
63 }
64