1 /* 2 * Copyright (c) 2018-2020 Arm Limited. 3 * 4 * SPDX-License-Identifier: MIT 5 * 6 * Permission is hereby granted, free of charge, to any person obtaining a copy 7 * of this software and associated documentation files (the "Software"), to 8 * deal in the Software without restriction, including without limitation the 9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or 10 * sell copies of the Software, and to permit persons to whom the Software is 11 * furnished to do so, subject to the following conditions: 12 * 13 * The above copyright notice and this permission notice shall be included in all 14 * copies or substantial portions of the Software. 15 * 16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 22 * SOFTWARE. 23 */ 24 #ifndef ARM_COMPUTE_WRAPPER_SET_LANE_H 25 #define ARM_COMPUTE_WRAPPER_SET_LANE_H 26 27 #include <arm_neon.h> 28 29 namespace arm_compute 30 { 31 namespace wrapper 32 { 33 #define VSETLANE_IMPL_8(stype, atype, vtype, postfix) \ 34 inline stype vsetlane(const atype value, const vtype vector, const unsigned int lane) \ 35 { \ 36 switch(lane) \ 37 { \ 38 case 0: \ 39 return vset_lane_##postfix(value, vector, 0); \ 40 case 1: \ 41 return vset_lane_##postfix(value, vector, 1); \ 42 case 2: \ 43 return vset_lane_##postfix(value, vector, 2); \ 44 case 3: \ 45 return vset_lane_##postfix(value, vector, 3); \ 46 case 4: \ 47 return vset_lane_##postfix(value, vector, 4); \ 48 case 5: \ 49 return vset_lane_##postfix(value, vector, 5); \ 50 case 6: \ 51 return vset_lane_##postfix(value, vector, 6); \ 52 case 7: \ 53 return vset_lane_##postfix(value, vector, 7); \ 54 default: \ 55 ARM_COMPUTE_ERROR("Invalid lane"); \ 56 } \ 57 } 58 59 #define VSETLANE_IMPL_4(stype, atype, vtype, postfix) \ 60 inline stype vsetlane(const atype value, const vtype vector, const unsigned int lane) \ 61 { \ 62 switch(lane) \ 63 { \ 64 case 0: \ 65 return vset_lane_##postfix(value, vector, 0); \ 66 case 1: \ 67 return vset_lane_##postfix(value, vector, 1); \ 68 case 2: \ 69 return vset_lane_##postfix(value, vector, 2); \ 70 case 3: \ 71 return vset_lane_##postfix(value, vector, 3); \ 72 default: \ 73 ARM_COMPUTE_ERROR("Invalid lane"); \ 74 } \ 75 } 76 77 #define VSETLANE_IMPL_2(stype, atype, vtype, postfix) \ 78 inline stype vsetlane(const atype value, const vtype vector, const unsigned int lane) \ 79 { \ 80 switch(lane) \ 81 { \ 82 case 0: \ 83 return vset_lane_##postfix(value, vector, 0); \ 84 case 1: \ 85 return vset_lane_##postfix(value, vector, 1); \ 86 default: \ 87 ARM_COMPUTE_ERROR("Invalid lane"); \ 88 } \ 89 } 90 91 VSETLANE_IMPL_8(uint8x8_t, uint8_t, uint8x8_t, u8) 92 VSETLANE_IMPL_8(int8x8_t, int8_t, int8x8_t, s8) 93 VSETLANE_IMPL_4(uint16x4_t, uint16_t, uint16x4_t, u16) 94 VSETLANE_IMPL_4(int16x4_t, int16_t, int16x4_t, s16) 95 VSETLANE_IMPL_2(uint32x2_t, uint32_t, uint32x2_t, u32) 96 VSETLANE_IMPL_2(int32x2_t, int32_t, int32x2_t, s32) 97 VSETLANE_IMPL_2(float32x2_t, float, float32x2_t, f32) 98 #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC 99 VSETLANE_IMPL_4(float16x4_t, float16_t, float16x4_t, f16) 100 #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC 101 102 #define VSETQLANE_IMPL_16(stype, atype, vtype, postfix) \ 103 inline stype vsetlane(const atype value, const vtype vector, const unsigned int lane) \ 104 { \ 105 switch(lane) \ 106 { \ 107 case 0: \ 108 return vsetq_lane_##postfix(value, vector, 0); \ 109 case 1: \ 110 return vsetq_lane_##postfix(value, vector, 1); \ 111 case 2: \ 112 return vsetq_lane_##postfix(value, vector, 2); \ 113 case 3: \ 114 return vsetq_lane_##postfix(value, vector, 3); \ 115 case 4: \ 116 return vsetq_lane_##postfix(value, vector, 4); \ 117 case 5: \ 118 return vsetq_lane_##postfix(value, vector, 5); \ 119 case 6: \ 120 return vsetq_lane_##postfix(value, vector, 6); \ 121 case 7: \ 122 return vsetq_lane_##postfix(value, vector, 7); \ 123 case 8: \ 124 return vsetq_lane_##postfix(value, vector, 8); \ 125 case 9: \ 126 return vsetq_lane_##postfix(value, vector, 9); \ 127 case 10: \ 128 return vsetq_lane_##postfix(value, vector, 10); \ 129 case 11: \ 130 return vsetq_lane_##postfix(value, vector, 11); \ 131 case 12: \ 132 return vsetq_lane_##postfix(value, vector, 12); \ 133 case 13: \ 134 return vsetq_lane_##postfix(value, vector, 13); \ 135 case 14: \ 136 return vsetq_lane_##postfix(value, vector, 14); \ 137 case 15: \ 138 return vsetq_lane_##postfix(value, vector, 15); \ 139 default: \ 140 ARM_COMPUTE_ERROR("Invalid lane"); \ 141 } \ 142 } 143 144 #define VSETQLANE_IMPL_8(stype, atype, vtype, postfix) \ 145 inline stype vsetlane(const atype value, const vtype vector, const unsigned int lane) \ 146 { \ 147 switch(lane) \ 148 { \ 149 case 0: \ 150 return vsetq_lane_##postfix(value, vector, 0); \ 151 case 1: \ 152 return vsetq_lane_##postfix(value, vector, 1); \ 153 case 2: \ 154 return vsetq_lane_##postfix(value, vector, 2); \ 155 case 3: \ 156 return vsetq_lane_##postfix(value, vector, 3); \ 157 case 4: \ 158 return vsetq_lane_##postfix(value, vector, 4); \ 159 case 5: \ 160 return vsetq_lane_##postfix(value, vector, 5); \ 161 case 6: \ 162 return vsetq_lane_##postfix(value, vector, 6); \ 163 case 7: \ 164 return vsetq_lane_##postfix(value, vector, 7); \ 165 default: \ 166 ARM_COMPUTE_ERROR("Invalid lane"); \ 167 } \ 168 } 169 170 #define VSETQLANE_IMPL_4(stype, atype, vtype, postfix) \ 171 inline stype vsetlane(const atype value, const vtype vector, const unsigned int lane) \ 172 { \ 173 switch(lane) \ 174 { \ 175 case 0: \ 176 return vsetq_lane_##postfix(value, vector, 0); \ 177 case 1: \ 178 return vsetq_lane_##postfix(value, vector, 1); \ 179 case 2: \ 180 return vsetq_lane_##postfix(value, vector, 2); \ 181 case 3: \ 182 return vsetq_lane_##postfix(value, vector, 3); \ 183 default: \ 184 ARM_COMPUTE_ERROR("Invalid lane"); \ 185 } \ 186 } 187 188 VSETQLANE_IMPL_16(uint8x16_t, uint8_t, uint8x16_t, u8) 189 VSETQLANE_IMPL_16(int8x16_t, int8_t, int8x16_t, s8) 190 VSETQLANE_IMPL_8(uint16x8_t, uint16_t, uint16x8_t, u16) 191 VSETQLANE_IMPL_8(int16x8_t, int16_t, int16x8_t, s16) 192 VSETQLANE_IMPL_4(uint32x4_t, uint32_t, uint32x4_t, u32) 193 VSETQLANE_IMPL_4(int32x4_t, int32_t, int32x4_t, s32) 194 VSETQLANE_IMPL_4(float32x4_t, float, float32x4_t, f32) 195 #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC 196 VSETQLANE_IMPL_8(float16x8_t, float16_t, float16x8_t, f16) 197 #endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC 198 199 #undef VSETLANE_IMPL_8 200 #undef VSETLANE_IMPL_4 201 #undef VSETLANE_IMPL_2 202 203 #undef VSETQLANE_IMPL_16 204 #undef VSETQLANE_IMPL_8 205 #undef VSETQLANE_IMPL_4 206 } // namespace wrapper 207 } // namespace arm_compute 208 #endif /* ARM_COMPUTE_WRAPPER_SET_LANE_H */ 209