/*
 * Copyright (c) 2018 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#ifndef __ARM_COMPUTE_WRAPPER_GET_LANE_H__
25#define __ARM_COMPUTE_WRAPPER_GET_LANE_H__
26
27#include <arm_neon.h>
28
29namespace arm_compute
30{
31namespace wrapper
32{
/** Generate a vgetlane() overload for a vector type with eight lanes.
 *
 * The generated function takes the lane index as a run-time value and maps it,
 * through a switch, onto a call to vget_lane_<postfix> with the matching literal
 * lane number (presumably because the intrinsic expects a constant lane index).
 *
 * @param stype   Scalar type returned by the generated function.
 * @param vtype   Vector type accepted by the generated function.
 * @param postfix Suffix appended to vget_lane_ to select the intrinsic.
 *
 * Generated function: returns lane @p lane (0-7) of @p vector; any other index
 * is reported through ARM_COMPUTE_ERROR("Invalid lane").
 */
#define VGETLANE_IMPL_8(stype, vtype, postfix)                  \
    inline stype vgetlane(const vtype vector, const int lane)   \
    {                                                           \
        switch(lane)                                            \
        {                                                       \
            case 0: return vget_lane_##postfix(vector, 0);      \
            case 1: return vget_lane_##postfix(vector, 1);      \
            case 2: return vget_lane_##postfix(vector, 2);      \
            case 3: return vget_lane_##postfix(vector, 3);      \
            case 4: return vget_lane_##postfix(vector, 4);      \
            case 5: return vget_lane_##postfix(vector, 5);      \
            case 6: return vget_lane_##postfix(vector, 6);      \
            case 7: return vget_lane_##postfix(vector, 7);      \
            default: ARM_COMPUTE_ERROR("Invalid lane");         \
        }                                                       \
    }
58
/** Generate a vgetlane() overload for a vector type with four lanes.
 *
 * The run-time lane index is dispatched through a switch so that every call to
 * vget_lane_<postfix> is made with a literal lane number.
 *
 * @param stype   Scalar type returned by the generated function.
 * @param vtype   Vector type accepted by the generated function.
 * @param postfix Suffix appended to vget_lane_ to select the intrinsic.
 *
 * Generated function: returns lane @p lane (0-3) of @p vector; any other index
 * is reported through ARM_COMPUTE_ERROR("Invalid lane").
 */
#define VGETLANE_IMPL_4(stype, vtype, postfix)                  \
    inline stype vgetlane(const vtype vector, const int lane)   \
    {                                                           \
        switch(lane)                                            \
        {                                                       \
            case 0: return vget_lane_##postfix(vector, 0);      \
            case 1: return vget_lane_##postfix(vector, 1);      \
            case 2: return vget_lane_##postfix(vector, 2);      \
            case 3: return vget_lane_##postfix(vector, 3);      \
            default: ARM_COMPUTE_ERROR("Invalid lane");         \
        }                                                       \
    }
76
/** Generate a vgetlane() overload for a vector type with two lanes.
 *
 * The run-time lane index is dispatched through a switch so that every call to
 * vget_lane_<postfix> is made with a literal lane number.
 *
 * @param stype   Scalar type returned by the generated function.
 * @param vtype   Vector type accepted by the generated function.
 * @param postfix Suffix appended to vget_lane_ to select the intrinsic.
 *
 * Generated function: returns lane @p lane (0 or 1) of @p vector; any other
 * index is reported through ARM_COMPUTE_ERROR("Invalid lane").
 */
#define VGETLANE_IMPL_2(stype, vtype, postfix)                  \
    inline stype vgetlane(const vtype vector, const int lane)   \
    {                                                           \
        switch(lane)                                            \
        {                                                       \
            case 0: return vget_lane_##postfix(vector, 0);      \
            case 1: return vget_lane_##postfix(vector, 1);      \
            default: ARM_COMPUTE_ERROR("Invalid lane");         \
        }                                                       \
    }
90
91VGETLANE_IMPL_8(uint8_t, uint8x8_t, u8)
92VGETLANE_IMPL_8(int8_t, int8x8_t, s8)
93VGETLANE_IMPL_4(uint16_t, uint16x4_t, u16)
94VGETLANE_IMPL_4(int16_t, int16x4_t, s16)
95VGETLANE_IMPL_2(uint32_t, uint32x2_t, u32)
96VGETLANE_IMPL_2(int32_t, int32x2_t, s32)
97VGETLANE_IMPL_2(float, float32x2_t, f32)
98#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
99VGETLANE_IMPL_4(float16_t, float16x4_t, f16)
100#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
101
/** Generate a vgetqlane() overload for a vector type with sixteen lanes.
 *
 * The generated function takes the lane index as a run-time value and maps it,
 * through a switch, onto a call to vgetq_lane_<postfix> with the matching
 * literal lane number (presumably because the intrinsic expects a constant
 * lane index).
 *
 * @param stype   Scalar type returned by the generated function.
 * @param vtype   Vector type accepted by the generated function.
 * @param postfix Suffix appended to vgetq_lane_ to select the intrinsic.
 *
 * Generated function: returns lane @p lane (0-15) of @p vector; any other index
 * is reported through ARM_COMPUTE_ERROR("Invalid lane").
 */
#define VGETQLANE_IMPL_16(stype, vtype, postfix)                \
    inline stype vgetqlane(const vtype vector, const int lane)  \
    {                                                           \
        switch(lane)                                            \
        {                                                       \
            case 0: return vgetq_lane_##postfix(vector, 0);     \
            case 1: return vgetq_lane_##postfix(vector, 1);     \
            case 2: return vgetq_lane_##postfix(vector, 2);     \
            case 3: return vgetq_lane_##postfix(vector, 3);     \
            case 4: return vgetq_lane_##postfix(vector, 4);     \
            case 5: return vgetq_lane_##postfix(vector, 5);     \
            case 6: return vgetq_lane_##postfix(vector, 6);     \
            case 7: return vgetq_lane_##postfix(vector, 7);     \
            case 8: return vgetq_lane_##postfix(vector, 8);     \
            case 9: return vgetq_lane_##postfix(vector, 9);     \
            case 10: return vgetq_lane_##postfix(vector, 10);   \
            case 11: return vgetq_lane_##postfix(vector, 11);   \
            case 12: return vgetq_lane_##postfix(vector, 12);   \
            case 13: return vgetq_lane_##postfix(vector, 13);   \
            case 14: return vgetq_lane_##postfix(vector, 14);   \
            case 15: return vgetq_lane_##postfix(vector, 15);   \
            default: ARM_COMPUTE_ERROR("Invalid lane");         \
        }                                                       \
    }
143
/** Generate a vgetqlane() overload for a vector type with eight lanes.
 *
 * The run-time lane index is dispatched through a switch so that every call to
 * vgetq_lane_<postfix> is made with a literal lane number.
 *
 * @param stype   Scalar type returned by the generated function.
 * @param vtype   Vector type accepted by the generated function.
 * @param postfix Suffix appended to vgetq_lane_ to select the intrinsic.
 *
 * Generated function: returns lane @p lane (0-7) of @p vector; any other index
 * is reported through ARM_COMPUTE_ERROR("Invalid lane").
 */
#define VGETQLANE_IMPL_8(stype, vtype, postfix)                 \
    inline stype vgetqlane(const vtype vector, const int lane)  \
    {                                                           \
        switch(lane)                                            \
        {                                                       \
            case 0: return vgetq_lane_##postfix(vector, 0);     \
            case 1: return vgetq_lane_##postfix(vector, 1);     \
            case 2: return vgetq_lane_##postfix(vector, 2);     \
            case 3: return vgetq_lane_##postfix(vector, 3);     \
            case 4: return vgetq_lane_##postfix(vector, 4);     \
            case 5: return vgetq_lane_##postfix(vector, 5);     \
            case 6: return vgetq_lane_##postfix(vector, 6);     \
            case 7: return vgetq_lane_##postfix(vector, 7);     \
            default: ARM_COMPUTE_ERROR("Invalid lane");         \
        }                                                       \
    }
169
/** Generate a vgetqlane() overload for a vector type with four lanes.
 *
 * The run-time lane index is dispatched through a switch so that every call to
 * vgetq_lane_<postfix> is made with a literal lane number.
 *
 * @param stype   Scalar type returned by the generated function.
 * @param vtype   Vector type accepted by the generated function.
 * @param postfix Suffix appended to vgetq_lane_ to select the intrinsic.
 *
 * Generated function: returns lane @p lane (0-3) of @p vector; any other index
 * is reported through ARM_COMPUTE_ERROR("Invalid lane").
 */
#define VGETQLANE_IMPL_4(stype, vtype, postfix)                 \
    inline stype vgetqlane(const vtype vector, const int lane)  \
    {                                                           \
        switch(lane)                                            \
        {                                                       \
            case 0: return vgetq_lane_##postfix(vector, 0);     \
            case 1: return vgetq_lane_##postfix(vector, 1);     \
            case 2: return vgetq_lane_##postfix(vector, 2);     \
            case 3: return vgetq_lane_##postfix(vector, 3);     \
            default: ARM_COMPUTE_ERROR("Invalid lane");         \
        }                                                       \
    }
187
188VGETQLANE_IMPL_16(uint8_t, uint8x16_t, u8)
189VGETQLANE_IMPL_16(int8_t, int8x16_t, s8)
190VGETQLANE_IMPL_8(uint16_t, uint16x8_t, u16)
191VGETQLANE_IMPL_8(int16_t, int16x8_t, s16)
192VGETQLANE_IMPL_4(uint32_t, uint32x4_t, u32)
193VGETQLANE_IMPL_4(int32_t, int32x4_t, s32)
194VGETQLANE_IMPL_4(float, float32x4_t, f32)
195#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
196VGETQLANE_IMPL_8(float16_t, float16x8_t, f16)
197#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
198
// The generator macros are implementation details of this header: undefine
// every one of them so none leaks into translation units that include it.
#undef VGETLANE_IMPL_8
#undef VGETLANE_IMPL_4
#undef VGETLANE_IMPL_2

// The vgetqlane() generators need the same cleanup as the vgetlane() ones.
#undef VGETQLANE_IMPL_16
#undef VGETQLANE_IMPL_8
#undef VGETQLANE_IMPL_4
202} // namespace wrapper
203} // namespace arm_compute
204#endif /* __ARM_COMPUTE_WRAPPER_GET_LANE_H__ */