blob: ece991a5b0575a300e5db761740c253845b25da8 [file] [log] [blame]
George Worta1e7e282019-01-15 11:00:29 +00001/*
Georgios Pinitasddb93bb2020-10-02 16:38:59 +01002 * Copyright (c) 2019-2020 Arm Limited.
George Worta1e7e282019-01-15 11:00:29 +00003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Michalis Spyrouf4643372019-11-29 16:17:13 +000024#ifndef ARM_COMPUTE_WRAPPER_DIV_H
25#define ARM_COMPUTE_WRAPPER_DIV_H
George Worta1e7e282019-01-15 11:00:29 +000026
Georgios Pinitasddb93bb2020-10-02 16:38:59 +010027#include "src/core/NEON/NEMath.h"
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010028
George Worta1e7e282019-01-15 11:00:29 +000029#include <arm_neon.h>
30
31namespace arm_compute
32{
33namespace wrapper
34{
35#ifdef __aarch64__
36
/** Emit a vdiv() overload that delegates to one two-operand function.
 *
 * The expansion is an inline function `vtype vdiv(const vtype &a, const vtype &b)`
 * that returns the result of calling `<intrinsic>_<suffix>(a, b)`. The callee name is
 * built by token-pasting the last two macro arguments with an underscore between them;
 * the instantiations in this branch pass vdiv / vdivq together with f32 / f16.
 *
 * @param stype     Accepted for signature symmetry; not referenced by the expansion.
 * @param vtype     Vector type of both operands and of the returned value.
 * @param intrinsic Leading part of the callee name.
 * @param suffix    Trailing part of the callee name.
 */
#define VDIV_IMPL(stype, vtype, intrinsic, suffix)         \
    inline vtype vdiv(const vtype &a, const vtype &b)      \
    {                                                      \
        const vtype quotient = intrinsic##_##suffix(a, b); \
        return quotient;                                   \
    }
42VDIV_IMPL(float32x2_t, float32x2_t, vdiv, f32)
43#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
44VDIV_IMPL(float16x4_t, float16x4_t, vdiv, f16)
45#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
46
47VDIV_IMPL(float32x4_t, float32x4_t, vdivq, f32)
48#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
49VDIV_IMPL(float16x8_t, float16x8_t, vdivq, f16)
50#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
51
52#else // __aarch64__
53
/** Emit a vdiv() overload built from a multiply and a helper applied to the divisor.
 *
 * The expansion is an inline function `vtype vdiv(const vtype &a, const vtype &b)`
 * that first calls `<recip_fn>_<suffix>(b)` and then returns
 * `<mul_fn>_<suffix>(a, <that result>)`. Both callee names are formed by token-pasting.
 *
 * NOTE(review): the vinv / vinvq helpers passed by the instantiations in this branch are
 * not declared in this file; presumably they come from NEMath.h and yield a (possibly
 * approximate) reciprocal, so results may differ slightly from a true division - confirm.
 *
 * @param stype    Accepted for signature symmetry; not referenced by the expansion.
 * @param vtype    Vector type of both operands and of the returned value.
 * @param mul_fn   Leading part of the name of the two-operand multiply callee.
 * @param recip_fn Leading part of the name of the one-operand callee applied to @p b.
 * @param suffix   Trailing part shared by both callee names.
 */
#define VDIV_IMPL(stype, vtype, mul_fn, recip_fn, suffix) \
    inline vtype vdiv(const vtype &a, const vtype &b)     \
    {                                                     \
        const vtype b_inverted = recip_fn##_##suffix(b);  \
        return mul_fn##_##suffix(a, b_inverted);          \
    }
59VDIV_IMPL(float32x2_t, float32x2_t, vmul, vinv, f32)
60#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
61VDIV_IMPL(float16x4_t, float16x4_t, vmul, vinv, f16)
62#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
63
64VDIV_IMPL(float32x4_t, float32x4_t, vmulq, vinvq, f32)
65#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
66VDIV_IMPL(float16x8_t, float16x8_t, vmulq, vinvq, f16)
67#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
68
69#endif // __aarch64__
70
71#undef VDIV_IMPL
72} // namespace wrapper
73} // namespace arm_compute
Michalis Spyrouf4643372019-11-29 16:17:13 +000074#endif /* ARM_COMPUTE_WRAPPER_DIV_H */