blob: 7dbbe91ba22ddcdadffd2b3b2bdd71075d9046f1 [file] [log] [blame]
/*
 * Copyright (c) 2017-2019 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
Pablo Telloeb82fd22018-02-23 13:43:50 +000024
Michele Di Giorgio5b6904b2018-01-29 12:24:14 +000025#pragma once
26
Georgios Pinitas7cd26d42019-01-09 18:35:17 +000027#include <cstddef>
Georgios Pinitas421405b2018-10-26 19:05:32 +010028
// Macro for unreachable code (e.g. impossible default cases on switch).
// The `why` argument is documentation only: the expansion discards it and
// emits the compiler builtin __builtin_unreachable().
#define UNREACHABLE(why) __builtin_unreachable()

// Paranoid option for the above with assert
// #define UNREACHABLE(why) assert(0 && why)

// Evaluates `x` and discards the result by casting it to void, for values
// that are intentionally not used. The expansion is fully parenthesized so
// that it always behaves as a single expression.
#define UNUSED(x) ((void)(x))
36
/**
 * Integer ceiling division: the smallest integer not less than a / b.
 *
 * Computed from the truncated quotient and the remainder rather than as
 * (a + b - 1) / b, so the intermediate sum cannot overflow/wrap when `a`
 * is close to the maximum of T, and negative `a` is rounded correctly.
 *
 * @param a Dividend.
 * @param b Divisor; intended to be positive (b == 0 divides by zero).
 * @return  a / b rounded up.
 */
template <typename T>
inline T iceildiv(const T a, const T b) {
    const T quotient  = a / b;
    const T remainder = a % b;

    // Truncating division already rounds up when the remainder is <= 0.
    return (remainder > 0) ? static_cast<T>(quotient + 1) : quotient;
}
Michele Di Giorgio5b6904b2018-01-29 12:24:14 +000041
/**
 * Round `a` up to the nearest multiple of `b`.
 *
 * @param a Value to round.
 * @param b Granularity; intended to be positive (b == 0 divides by zero).
 * @return  The smallest multiple of b that is not less than a.
 */
template <typename T>
inline T roundup(const T a, const T b) {
    const T rem = a % b;

    // rem > 0  : step up by the missing amount; (b - rem) is formed first so
    //            that no intermediate a + b is computed.
    // rem <= 0 : a is already a multiple (rem == 0), or a is negative and
    //            dropping the negative remainder moves it up to the multiple.
    return (rem > 0) ? static_cast<T>(a + (b - rem)) : static_cast<T>(a - rem);
}
David Manselld93991e2018-07-06 14:52:52 +010052
namespace arm_gemm {
namespace utils {

#ifdef __ARM_FEATURE_SVE
// NOTE: these helpers live directly in `utils` rather than in an anonymous
// namespace. This is a header, and get_vector_length<T>() below is an inline
// template with external linkage; calling an internal-linkage helper from it
// would make its definition differ between translation units.

/**
 * Generic fallback: read the vector length with "cntb" (per the Arm SVE ISA,
 * the number of bytes in a vector) and divide by the element size.
 *
 * @tparam sz Element size in bytes.
 * @return    The "cntb" result divided by sz.
 */
template <size_t sz>
inline unsigned long get_vector_length_sz() {
    unsigned long v;

    __asm (
        "cntb %0"
        : "=r" (v)
    );

    return v / sz;
}

// Defines the explicit specialization of get_vector_length_sz<sz> that
// returns the result of the given count instruction directly, with no divide.
#define VEC_LEN_SPEC(sz, opcode) template <> inline unsigned long get_vector_length_sz<sz>() { unsigned long v; __asm ( opcode " %0" : "=r" (v)); return v; }

VEC_LEN_SPEC(8, "cntd")
VEC_LEN_SPEC(4, "cntw")
VEC_LEN_SPEC(2, "cnth")
VEC_LEN_SPEC(1, "cntb")
#endif

/**
 * Number of elements of type T per vector.
 *
 * With __ARM_FEATURE_SVE defined the value is read from the hardware through
 * get_vector_length_sz<sizeof(T)>(); otherwise a fixed 16-byte vector is
 * assumed (presumably 128-bit NEON registers - confirm against callers).
 *
 * @tparam T Element type.
 * @return   Elements of T per vector.
 */
template <typename T>
inline unsigned long get_vector_length() {
#ifdef __ARM_FEATURE_SVE
    return get_vector_length_sz<sizeof(T)>();
#else
    return 16 / sizeof(T);
#endif
}

} // utils namespace
} // arm_gemm namespace

// Kept for backward compatibility: existing code calls these helpers
// unqualified after including this header.
using namespace arm_gemm::utils;