/*
 * Copyright (C) 2013 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef ANDROID_AUDIO_RESAMPLER_FIR_OPS_H
#define ANDROID_AUDIO_RESAMPLER_FIR_OPS_H

// Fixed-width integer types used by every helper in this header.
#include <stdint.h>

// ---------------------------------------------------------------------------
// Build configuration.
//
// These macros and system includes are kept outside of namespace android:
// macros are not namespace-scoped, and system headers must not be pulled in
// while a namespace is open (their declarations would end up inside it).
// ---------------------------------------------------------------------------

// Inline assembly is only used for 32-bit ARM in ARM (non-Thumb) mode.
#if defined(__arm__) && !defined(__thumb__)
#define USE_INLINE_ASSEMBLY (true)
#else
#define USE_INLINE_ASSEMBLY (false)
#endif

// On NEON-capable targets USE_NEON defaults to true unless already defined.
#if defined(__aarch64__) || defined(__ARM_NEON__)
#ifndef USE_NEON
#define USE_NEON (true)
#endif
#else
#define USE_NEON (false)
#endif
#if USE_NEON
#include <arm_neon.h>
#endif

#if defined(__AVX2__)     // Should be supported in x86 ABI for both 32 & 64-bit.
#define USE_AVX2 (true)   // Inference AVX2/FMA Intrinsics
#define USE_SSE (true)
#include <immintrin.h>
#elif defined(__SSSE3__)  // Should be supported in x86 ABI for both 32 & 64-bit.
#define USE_SSE (true)    // Inference SSE Intrinsics
#define USE_AVX2 (false)
#include <tmmintrin.h>
#else
#define USE_SSE (false)
// The space before "(false)" matters: without it this would define a
// function-like macro taking a parameter named "false" with an empty body.
#define USE_AVX2 (false)
#endif

namespace android {

/**
 * Compile-time type equality test.
 *
 * The primary template reports false; the partial specialization below is
 * selected when both type arguments are the same type and reports true.
 */
template<typename T, typename U>
struct is_same
{
    static const bool value = false;
};

template<typename T>
struct is_same<T, T> // partial specialization
{
    static const bool value = true;
};

/**
 * Multiplies a 32-bit value by one 16-bit half of a packed 32-bit word.
 *
 * @param left  non-zero selects the low 16 bits of vRL, zero selects the
 *              high 16 bits.
 * @param in    32-bit multiplicand.
 * @param vRL   two signed 16-bit values packed into one 32-bit word.
 * @return      portable path: (in * selected half) >> 16, computed in 64 bits.
 *
 * NOTE(review): the ARM path uses SMULTB/SMULTT, which per the ARM ISA
 * multiply the top halfword of `in` by the selected halfword of vRL, so the
 * low 16 bits of `in` do not take part there. Results may therefore differ
 * slightly between the two paths - confirm this is acceptable to callers.
 */
static inline
int32_t mulRL(int left, int32_t in, uint32_t vRL)
{
#if USE_INLINE_ASSEMBLY
    int32_t out;
    // SMULTx is not commutative in its two source operands (each operand
    // contributes a specific halfword), so no '%' constraint modifier is used.
    if (left) {
        asm( "smultb %[out], %[in], %[vRL] \n"
             : [out]"=r"(out)
             : [in]"r"(in), [vRL]"r"(vRL)
             : );
    } else {
        asm( "smultt %[out], %[in], %[vRL] \n"
             : [out]"=r"(out)
             : [in]"r"(in), [vRL]"r"(vRL)
             : );
    }
    return out;
#else
    int16_t v = left ? static_cast<int16_t>(vRL) : static_cast<int16_t>(vRL>>16);
    return static_cast<int32_t>((static_cast<int64_t>(in) * v) >> 16);
#endif
}

/**
 * Multiply-accumulate of two 16-bit values.
 *
 * @param in  16-bit input.
 * @param v   16-bit multiplier.
 * @param a   32-bit accumulator.
 * @return    a + v * in.
 */
static inline
int32_t mulAdd(int16_t in, int16_t v, int32_t a)
{
#if USE_INLINE_ASSEMBLY
    int32_t out;
    // 16x16 multiply of the two bottom halfwords: operands are interchangeable.
    asm( "smlabb %[out], %[v], %[in], %[a] \n"
         : [out]"=r"(out)
         : [in]"%r"(in), [v]"r"(v), [a]"r"(a)
         : );
    return out;
#else
    return a + v * in;
#endif
}

/**
 * Multiply-accumulate of a 16-bit input with a 32-bit multiplier.
 *
 * @param in  16-bit input.
 * @param v   32-bit multiplier.
 * @param a   32-bit accumulator.
 * @return    a + ((v * in) >> 16), with the product computed in 64 bits.
 */
static inline
int32_t mulAdd(int16_t in, int32_t v, int32_t a)
{
#if USE_INLINE_ASSEMBLY
    int32_t out;
    // SMLAWB treats its first source as 32-bit and the second as a halfword,
    // so the operands must not be swapped: no '%' constraint modifier.
    asm( "smlawb %[out], %[v], %[in], %[a] \n"
         : [out]"=r"(out)
         : [in]"r"(in), [v]"r"(v), [a]"r"(a)
         : );
    return out;
#else
    return a + static_cast<int32_t>((static_cast<int64_t>(v) * in) >> 16);
#endif
}

/**
 * Multiply-accumulate of two 32-bit values, keeping the high word.
 *
 * @param in  32-bit input.
 * @param v   32-bit multiplier.
 * @param a   32-bit accumulator.
 * @return    a + ((v * in) >> 32), with the product computed in 64 bits.
 */
static inline
int32_t mulAdd(int32_t in, int32_t v, int32_t a)
{
#if USE_INLINE_ASSEMBLY
    int32_t out;
    // 32x32 multiply: operands are interchangeable.
    asm( "smmla %[out], %[v], %[in], %[a] \n"
         : [out]"=r"(out)
         : [in]"%r"(in), [v]"r"(v), [a]"r"(a)
         : );
    return out;
#else
    return a + static_cast<int32_t>((static_cast<int64_t>(v) * in) >> 32);
#endif
}

/**
 * Multiply-accumulate of one 16-bit half of a packed word with a 16-bit
 * multiplier.
 *
 * @param left  non-zero selects the low 16 bits of inRL, zero selects the
 *              high 16 bits.
 * @param inRL  two signed 16-bit values packed into one 32-bit word.
 * @param v     16-bit multiplier.
 * @param a     32-bit accumulator.
 * @return      a + v * selected half.
 */
static inline
int32_t mulAddRL(int left, uint32_t inRL, int16_t v, int32_t a)
{
#if 0 // USE_INLINE_ASSEMBLY Seems to fail with Clang b/34110890
    int32_t out;
    if (left) {
        asm( "smlabb %[out], %[v], %[inRL], %[a] \n"
             : [out]"=r"(out)
             : [inRL]"%r"(inRL), [v]"r"(v), [a]"r"(a)
             : );
    } else {
        // Bottom halfword of v times top halfword of inRL: not commutative.
        asm( "smlabt %[out], %[v], %[inRL], %[a] \n"
             : [out]"=r"(out)
             : [inRL]"r"(inRL), [v]"r"(v), [a]"r"(a)
             : );
    }
    return out;
#else
    int16_t s = left ? static_cast<int16_t>(inRL) : static_cast<int16_t>(inRL>>16);
    return a + v * s;
#endif
}

/**
 * Multiply-accumulate of one 16-bit half of a packed word with a 32-bit
 * multiplier.
 *
 * @param left  non-zero selects the low 16 bits of inRL, zero selects the
 *              high 16 bits.
 * @param inRL  two signed 16-bit values packed into one 32-bit word.
 * @param v     32-bit multiplier.
 * @param a     32-bit accumulator.
 * @return      a + ((v * selected half) >> 16), with the product computed in
 *              64 bits.
 */
static inline
int32_t mulAddRL(int left, uint32_t inRL, int32_t v, int32_t a)
{
#if 0 // USE_INLINE_ASSEMBLY Seems to fail with Clang b/34110890
    int32_t out;
    // SMLAWx: 32-bit first source times a halfword of the second; the
    // operands are not interchangeable, so no '%' constraint modifier.
    if (left) {
        asm( "smlawb %[out], %[v], %[inRL], %[a] \n"
             : [out]"=r"(out)
             : [inRL]"r"(inRL), [v]"r"(v), [a]"r"(a)
             : );
    } else {
        asm( "smlawt %[out], %[v], %[inRL], %[a] \n"
             : [out]"=r"(out)
             : [inRL]"r"(inRL), [v]"r"(v), [a]"r"(a)
             : );
    }
    return out;
#else
    int16_t s = left ? static_cast<int16_t>(inRL) : static_cast<int16_t>(inRL>>16);
    return a + static_cast<int32_t>((static_cast<int64_t>(v) * s) >> 16);
#endif
}

} // namespace android

#endif /*ANDROID_AUDIO_RESAMPLER_FIR_OPS_H*/