• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /* ----------------------------------------------------------------------
2  * Project:      CMSIS DSP Library
3  * Title:        arm_max_no_idx_f16.c
4  * Description:  Maximum value of a floating-point vector without returning the index
5  *
6  * $Date:        23 April 2021
7  * $Revision:    V1.9.0
8  *
9  * Target Processor: Cortex-M and Cortex-A cores
10  * -------------------------------------------------------------------- */
11 /*
12  * Copyright (C) 2010-2021 ARM Limited or its affiliates. All rights reserved.
13  *
14  * SPDX-License-Identifier: Apache-2.0
15  *
16  * Licensed under the Apache License, Version 2.0 (the License); you may
17  * not use this file except in compliance with the License.
18  * You may obtain a copy of the License at
19  *
20  * www.apache.org/licenses/LICENSE-2.0
21  *
22  * Unless required by applicable law or agreed to in writing, software
23  * distributed under the License is distributed on an AS IS BASIS, WITHOUT
24  * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
25  * See the License for the specific language governing permissions and
26  * limitations under the License.
27  */
28 
29 #include "dsp/statistics_functions_f16.h"
30 
31 #if defined(ARM_FLOAT16_SUPPORTED)
32 
33 #if (defined(ARM_MATH_NEON) || defined(ARM_MATH_MVEF)) && !defined(ARM_MATH_AUTOVECTORIZE)
34 #include <limits.h>
35 #endif
36 
37 /**
38   @ingroup groupStats
39  */
40 
41 
42 /**
43   @addtogroup Max
44   @{
45  */
46 
47 /**
48   @brief         Maximum value of a floating-point vector.
49   @param[in]     pSrc       points to the input vector
50   @param[in]     blockSize  number of samples in input vector
51   @param[out]    pResult    maximum value returned here
52   @return        none
53  */
54 
55 #if defined(ARM_MATH_MVE_FLOAT16) && !defined(ARM_MATH_AUTOVECTORIZE)
56 
arm_max_no_idx_f16(const float16_t * pSrc,uint32_t blockSize,float16_t * pResult)57 void arm_max_no_idx_f16(
58     const float16_t *pSrc,
59     uint32_t   blockSize,
60     float16_t *pResult)
61 {
62    f16x8_t     vecSrc;
63    f16x8_t     curExtremValVec = vdupq_n_f16(F16_MIN);
64    float16_t   maxValue = F16_MIN;
65    float16_t   newVal;
66    uint32_t    blkCnt;
67 
68    /* Loop unrolling: Compute 4 outputs at a time */
69    blkCnt = blockSize >> 3U;
70 
71    while (blkCnt > 0U)
72    {
73 
74         vecSrc = vldrhq_f16(pSrc);
75         /*
76          * update per-lane max.
77          */
78         curExtremValVec = vmaxnmq(vecSrc, curExtremValVec);
79         /*
80          * Decrement the blockSize loop counter
81          * Advance vector source and destination pointers
82          */
83         pSrc += 8;
84         blkCnt --;
85     }
86     /*
87      * Get max value across the vector
88      */
89     maxValue = vmaxnmvq(maxValue, curExtremValVec);
90 
91     blkCnt = blockSize & 7;
92 
93     while (blkCnt > 0U)
94     {
95         newVal = *pSrc++;
96 
97         /* compare for the maximum value */
98         if ((_Float16)maxValue < (_Float16)newVal)
99         {
100             /* Update the maximum value and it's index */
101             maxValue = newVal;
102         }
103 
104         blkCnt --;
105     }
106 
107     *pResult = maxValue;
108 }
109 
110 #else
111 
arm_max_no_idx_f16(const float16_t * pSrc,uint32_t blockSize,float16_t * pResult)112 void arm_max_no_idx_f16(
113     const float16_t *pSrc,
114     uint32_t   blockSize,
115     float16_t *pResult)
116 {
117    float16_t   maxValue = F16_MIN;
118    float16_t   newVal;
119 
120    while (blockSize > 0U)
121    {
122        newVal = *pSrc++;
123 
124        /* compare for the maximum value */
125        if ((_Float16)maxValue < (_Float16)newVal)
126        {
127            /* Update the maximum value and it's index */
128            maxValue = newVal;
129        }
130 
131        blockSize --;
132    }
133 
134    *pResult = maxValue;
135 }
136 
137 #endif /* defined(ARM_MATH_MVEF) && !defined(ARM_MATH_AUTOVECTORIZE) */
138 
139 /**
140   @} end of Max group
141  */
142 
143 #endif /* #if defined(ARM_FLOAT16_SUPPORTED) */
144 
145