/*
 * Copyright (c) 2017 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

#pragma once

#include <cstddef>

// Marks a code path as unreachable (e.g. an impossible default case in a
// switch).  Expands to the compiler builtin __builtin_unreachable(); the
// `why` argument exists purely as in-source documentation and is discarded by
// this definition.  Actually reaching the statement at runtime is undefined
// behaviour, so only use it where the path genuinely cannot be taken.
#define UNREACHABLE(why) __builtin_unreachable()

// Paranoid alternative to the above, checking with an assert instead
// (enabling it would additionally require <cassert>):
// #define UNREACHABLE(why) assert(0 && why)

// Integer ceiling division: returns a / b rounded up to the next whole
// number, computed as (a + b - 1) / b.
//
// Intended for non-negative `a` and strictly positive `b`.  The intermediate
// sum a + b - 1 is evaluated in type T, so the caller must ensure it does not
// overflow T.
template<typename T>
inline T iceildiv(const T a, const T b) {
    return (a + b - 1) / b;
}

// Rounds `a` up to the next multiple of `b`.
//
// If `a` is already a multiple of `b` (a % b == 0) it is returned unchanged;
// otherwise the distance to the next multiple, b - (a % b), is added.
// `b` must be non-zero since it is used as the divisor of a modulo.
template <typename T>
inline T roundup(const T a, const T b) {
    T rem = a % b;

    if (rem) {
        return a + b - rem;
    } else {
        return a;
    }
}

namespace arm_gemm {
namespace utils {
namespace {

#ifdef __ARM_FEATURE_SVE
// Returns the number of `sz`-byte elements held by one SVE vector.
//
// Generic fallback: queries the element count for byte-sized elements with
// the CNTB instruction and divides it by the element size.  The explicit
// specialisations below cover the element sizes 1, 2, 4 and 8.
template<size_t sz>
inline unsigned long get_vector_length_sz() {
    unsigned long v;

    __asm (
        "cntb %0"
        : "=r" (v)
    );

    return v / sz;
}

// Defines the explicit specialisation get_vector_length_sz<sz>() which
// returns the result of the given SVE count instruction (`opcode`) directly,
// with no division.
#define VEC_LEN_SPEC(sz, opcode) \
    template <> inline unsigned long get_vector_length_sz<sz>() { \
        unsigned long v; \
        __asm ( opcode " %0" : "=r" (v)); \
        return v; \
    }

VEC_LEN_SPEC(8, "cntd")
VEC_LEN_SPEC(4, "cntw")
VEC_LEN_SPEC(2, "cnth")
VEC_LEN_SPEC(1, "cntb")
#endif

} // anonymous namespace

// Returns the number of elements of type T per vector.
//
// When the translation unit is compiled with SVE enabled
// (__ARM_FEATURE_SVE defined) the value is queried from the hardware via
// get_vector_length_sz<sizeof(T)>().  Otherwise a fixed vector size of
// 16 bytes is assumed (presumably the 128-bit NEON register width).
template <typename T>
inline unsigned long get_vector_length() {
#ifdef __ARM_FEATURE_SVE
    return get_vector_length_sz<sizeof(T)>();
#else
    return 16 / sizeof(T);
#endif
}

} // utils namespace
} // arm_gemm namespace

// Makes the helpers above usable without qualification by every file that
// includes this header.
using namespace arm_gemm::utils;