/*
* Copyright (c) 2021, 2023-2024 Arm Limited.
*
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to
* deal in the Software without restriction, including without limitation the
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
* sell copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in all
* copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
#ifndef ACL_SRC_CPU_UTILS_CPUAUXTENSORHANDLER_H
#define ACL_SRC_CPU_UTILS_CPUAUXTENSORHANDLER_H
#include "arm_compute/core/ITensorPack.h"
#include "arm_compute/core/TensorInfo.h"
#include "arm_compute/runtime/Tensor.h"
#include "src/common/utils/Log.h"
#include "support/Cast.h"
namespace arm_compute
{
namespace cpu
{
/** Tensor handler to wrap and handle tensor allocations on workspace buffers
*
* @note Important: Despite the impression given by its name, the handler owns, rather than merely points to, the
* underlying tensor memory.
*
* @note About memory handling using bypass_* flags
* The bypass_alloc / bypass_import flags are meant to skip the expensive auxiliary tensor memory allocations or
* imports that are not needed during runtime, e.g. when the handler is not used at all in some branch of execution.
*
 * If misused, these two flags can lead to performance issues (failing to bypass when we should) or to memory
 * bugs (bypassing when we should not).
*
* Make sure:
*
* 1. The aux tensor handlers must always be declared at the root level, or the same level as the run/prepare
* methods that potentially use them.
*
* Once the handler is destroyed (e.g. when going out of scope), the memory it owns (returned by the get()
* method) will also be destroyed.
*
 * Thus it's important to ensure the handler is always in scope while it is being used by an operator / kernel.
*
 * 2. The handler's bypass_alloc and bypass_import flags should always be the inverse of whether the handler is
 * used in its surrounding scope by run/prepare. (This usually means being added to some tensor pack.)
 *
 * This ensures we bypass if and only if the aux tensor is not used by the op / kernel later.
 *
* So the general usage pattern goes like this:
*
 * bool use_aux_tensor = some_condition_about_when_to_use_the_aux_tensor;
 *
 * CpuAuxTensorHandler aux_handler {..., !use_aux_tensor}; // !use_aux_tensor passed as bypass_alloc / bypass_import
*
* if (use_aux_tensor)
* {
* tensor_pack.add_tensor(aux_handler.get());
* }
* op.run(tensor_pack);
*/
class CpuAuxTensorHandler
{
public:
    /** Create a temporary tensor handle, by either importing an existing tensor from a tensor pack, or allocating a
* new one.
*
* @param[in] slot_id Slot id of the tensor to be retrieved in the tensor pack
* If no such tensor exists in the tensor pack, a new tensor will be allocated.
     * @param[in] info Tensor info containing the requested size of the new tensor.
     * If the requested size is larger than that of the tensor retrieved from the
     * tensor pack, a new tensor will be allocated.
* @param[in,out] pack Tensor pack to retrieve the old tensor. When @p pack_inject is true, the new
* tensor will also be added here.
* @param[in] pack_inject In case of a newly allocated tensor, whether to add this tensor back to the
* @p pack
* @param[in] bypass_alloc Bypass allocation in case of a new tensor
* This is to prevent unnecessary memory operations when the handler object is not
* used
* @param[in] bypass_import Bypass importation in case of a retrieved tensor
* This is to prevent unnecessary memory operations when the handler object is not
* used
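     *
     * A minimal usage sketch, assuming the slot id ACL_INT_0 and the pack names below; they are illustrative,
     * not taken from any particular operator:
     *
     *    TensorInfo aux_info(TensorShape(32U, 32U), 1, DataType::F32);
     *
     *    // Reuses the memory of a tensor already present in slot ACL_INT_0 of workspace_pack if it is large
     *    // enough; otherwise allocates a new tensor of aux_info's size.
     *    CpuAuxTensorHandler aux(ACL_INT_0, aux_info, workspace_pack);
     *    run_pack.add_tensor(ACL_INT_0, aux.get());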
*/
CpuAuxTensorHandler(int slot_id,
TensorInfo &info,
ITensorPack &pack,
bool pack_inject = false,
bool bypass_alloc = false,
bool bypass_import = false)
: _tensor()
{
if (info.total_size() == 0)
{
return;
}
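        // Initialise the handler's tensor with the requested metadata; soft_init does not allocate any
        // backing memory yet.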
_tensor.allocator()->soft_init(info);
ITensor *packed_tensor = utils::cast::polymorphic_downcast<ITensor *>(pack.get_tensor(slot_id));
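        // Allocate fresh memory if the pack holds no tensor for this slot, or the packed tensor is too small to reuse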
if ((packed_tensor == nullptr) || (info.total_size() > packed_tensor->info()->total_size()))
{
if (!bypass_alloc)
{
_tensor.allocator()->allocate();
ARM_COMPUTE_LOG_INFO_WITH_FUNCNAME_ACL("Allocating auxiliary tensor");
}
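            // Expose the new tensor through the pack and remember the slot, so the destructor can remove it again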
if (pack_inject)
{
pack.add_tensor(slot_id, &_tensor);
_injected_tensor_pack = &pack;
_injected_slot_id = slot_id;
}
}
else
{
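            // A large-enough tensor already exists in the pack: reuse its memory by importing the buffer (no copy)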
if (!bypass_import)
{
_tensor.allocator()->import_memory(packed_tensor->buffer());
}
}
}
    /** Create a temporary handle to the original tensor with a new @ref TensorInfo
     * This is useful if we want to change how a tensor's memory is interpreted at run time without modifying the
     * original tensor.
*
* @param[in] info New tensor info to "assign" to @p tensor
* @param[in] tensor Tensor to be assigned a new @ref TensorInfo
* @param[in] bypass_import Bypass importing @p tensor's memory into the handler.
* This is to prevent unnecessary memory operations when the handler object is not used
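     *
     * A minimal usage sketch, reinterpreting an existing tensor src as a flat 1D tensor; the names below are
     * illustrative:
     *
     *    TensorInfo flat_info(TensorShape(src.info()->tensor_shape().total_size()), 1, src.info()->data_type());
     *    CpuAuxTensorHandler flat_view(flat_info, src); // imports src's memory, viewed through flat_info
     *    run_pack.add_tensor(ACL_SRC, flat_view.get());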
*/
CpuAuxTensorHandler(TensorInfo &info, const ITensor &tensor, bool bypass_import = false) : _tensor()
{
_tensor.allocator()->soft_init(info);
if (!bypass_import)
{
ARM_COMPUTE_ERROR_ON(tensor.info() == nullptr);
if (info.total_size() <= tensor.info()->total_size())
{
_tensor.allocator()->import_memory(tensor.buffer());
}
}
}
CpuAuxTensorHandler(const CpuAuxTensorHandler &) = delete;
    CpuAuxTensorHandler &operator=(const CpuAuxTensorHandler &) = delete;
~CpuAuxTensorHandler()
{
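        // If we injected our tensor into a pack, remove it so the pack is not left holding a dangling pointer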
if (_injected_tensor_pack)
{
_injected_tensor_pack->remove_tensor(_injected_slot_id);
}
}
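    /** Get a pointer to the tensor owned by this handler */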
ITensor *get()
{
return &_tensor;
}
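    /** Shorthand for get() */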
ITensor *operator()()
{
return &_tensor;
}
private:
    Tensor       _tensor{};                                  // Tensor owned by the handler; backing memory is either allocated or imported
    ITensorPack *_injected_tensor_pack{nullptr};             // Tensor pack that _tensor was injected into, if any
    int          _injected_slot_id{TensorType::ACL_UNKNOWN}; // Slot id under which _tensor was injected
};
} // namespace cpu
} // namespace arm_compute
#endif // ACL_SRC_CPU_UTILS_CPUAUXTENSORHANDLER_H