blob: b3efe5c8a0b086beb24306d9ec9cf320da863887 [file] [log] [blame]
/*
 * Copyright (c) 2018-2021 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#include "arm_compute/runtime/CL/functions/CLConvertFullyConnectedWeights.h"
Teresa Charlin91b7f742021-04-12 13:57:00 +010025
26#include "arm_compute/core/CL/CLKernelLibrary.h"
27#include "arm_compute/core/CL/ICLTensor.h"
28#include "arm_compute/core/Types.h"
29#include "arm_compute/core/Validate.h"
30#include "src/core/CL/ICLKernel.h"
Georgios Pinitas7891a732021-08-20 21:39:25 +010031#include "src/gpu/cl/operators/ClConvertFullyConnectedWeights.h"
Giorgio Arena657bdb32018-04-26 18:52:01 +010032
ramelg016d891572021-09-29 10:05:09 +010033#include "src/common/utils/Log.h"
34
Michele Di Giorgiocbbed282019-12-20 13:26:08 +000035namespace arm_compute
36{
Teresa Charlin91b7f742021-04-12 13:57:00 +010037struct CLConvertFullyConnectedWeights::Impl
38{
39 const ICLTensor *src{ nullptr };
40 ICLTensor *dst{ nullptr };
41 std::unique_ptr<opencl::ClConvertFullyConnectedWeights> op{ nullptr };
42};
43CLConvertFullyConnectedWeights::CLConvertFullyConnectedWeights()
44 : _impl(std::make_unique<Impl>())
45{
46}
47CLConvertFullyConnectedWeights::~CLConvertFullyConnectedWeights() = default;
48
Giorgio Arena657bdb32018-04-26 18:52:01 +010049void CLConvertFullyConnectedWeights::configure(const ICLTensor *input, ICLTensor *output, const TensorShape &original_input_shape,
50 DataLayout data_layout)
51{
Manuel Bottini2b84be52020-04-08 10:15:51 +010052 configure(CLKernelLibrary::get().get_compile_context(), input, output, original_input_shape, data_layout);
53}
54
55void CLConvertFullyConnectedWeights::configure(const CLCompileContext &compile_context, const ICLTensor *input, ICLTensor *output, const TensorShape &original_input_shape,
56 DataLayout data_layout)
57{
Teresa Charlin91b7f742021-04-12 13:57:00 +010058 ARM_COMPUTE_ERROR_ON_NULLPTR(input, output);
ramelg016d891572021-09-29 10:05:09 +010059 ARM_COMPUTE_LOG_PARAMS(input, output, original_input_shape, data_layout);
Teresa Charlin91b7f742021-04-12 13:57:00 +010060 _impl->src = input;
61 _impl->dst = output;
62 _impl->op = std::make_unique<opencl::ClConvertFullyConnectedWeights>();
63 _impl->op->configure(compile_context, _impl->src->info(), _impl->dst->info(), original_input_shape, data_layout);
Giorgio Arena657bdb32018-04-26 18:52:01 +010064}
65
66Status CLConvertFullyConnectedWeights::validate(const ITensorInfo *input, const ITensorInfo *output, const TensorShape &original_input_shape,
67 DataLayout data_layout)
68{
Teresa Charlin91b7f742021-04-12 13:57:00 +010069 return opencl::ClConvertFullyConnectedWeights::validate(input, output, original_input_shape, data_layout);
Michele Di Giorgiocbbed282019-12-20 13:26:08 +000070}
Teresa Charlin91b7f742021-04-12 13:57:00 +010071
72void CLConvertFullyConnectedWeights::run()
73{
74 ITensorPack pack;
75 pack.add_tensor(TensorType::ACL_SRC, _impl->src);
76 pack.add_tensor(TensorType::ACL_DST, _impl->dst);
77 _impl->op->run(pack);
78}
79
ramelg016d891572021-09-29 10:05:09 +010080} // namespace arm_compute