// Source blob: b756485e003233dde63cc6c8590698e648e3b003
//
// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#pragma once

#include <armnn/QuantizedLstmParams.hpp>
#include "NeonBaseWorkload.hpp"
#include <armnn/backends/WorkloadData.hpp>

#include <arm_compute/graph/Tensor.h>
#include <arm_compute/runtime/NEON/functions/NELSTMLayerQuantized.h>

#include <memory>

15namespace armnn
16{
17
Teresa Charlin588cbdf2022-01-19 15:55:37 +000018class NeonQuantizedLstmWorkload : public NeonBaseWorkload<QuantizedLstmQueueDescriptor>
Francis Murtagh4fc3c482019-08-02 13:20:54 +010019{
20public:
Francis Murtaghb3fc2522019-08-09 13:20:50 +010021 using BaseWorkload<QuantizedLstmQueueDescriptor>::m_Data;
Francis Murtagh4fc3c482019-08-02 13:20:54 +010022 NeonQuantizedLstmWorkload(const QuantizedLstmQueueDescriptor& descriptor, const WorkloadInfo& info);
23 virtual void Execute() const override;
24
25private:
26 mutable arm_compute::NELSTMLayerQuantized m_QuantizedLstmLayer;
27
28 std::unique_ptr<arm_compute::Tensor> m_InputToInputWeightsTensor;
29 std::unique_ptr<arm_compute::Tensor> m_InputToForgetWeightsTensor;
30 std::unique_ptr<arm_compute::Tensor> m_InputToCellWeightsTensor;
31 std::unique_ptr<arm_compute::Tensor> m_InputToOutputWeightsTensor;
32 std::unique_ptr<arm_compute::Tensor> m_RecurrentToInputWeightsTensor;
33 std::unique_ptr<arm_compute::Tensor> m_RecurrentToForgetWeightsTensor;
34 std::unique_ptr<arm_compute::Tensor> m_RecurrentToCellWeightsTensor;
35 std::unique_ptr<arm_compute::Tensor> m_RecurrentToOutputWeightsTensor;
36 std::unique_ptr<arm_compute::Tensor> m_InputGateBiasTensor;
37 std::unique_ptr<arm_compute::Tensor> m_ForgetGateBiasTensor;
38 std::unique_ptr<arm_compute::Tensor> m_CellBiasTensor;
39 std::unique_ptr<arm_compute::Tensor> m_OutputGateBiasTensor;
40 std::unique_ptr<arm_compute::Tensor> m_CellStateInTensor;
41 std::unique_ptr<arm_compute::Tensor> m_OutputStateInTensor;
42 std::unique_ptr<arm_compute::Tensor> m_CellStateOutTensor;
43
44 void FreeUnusedTensors();
45};
46
47arm_compute::Status NeonQuantizedLstmWorkloadValidate(const TensorInfo& input,
48 const TensorInfo& outputStateIn,
49 const TensorInfo& cellStateIn,
50 const TensorInfo& outputStateOut,
51 const TensorInfo& cellStateOut,
52 const QuantizedLstmInputParamsInfo& paramsInfo);
53
54} //namespace armnn