blob: 740cb4a316f4b5f3727b9d138fb6c605df89dc49 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
5
6#pragma once
7
#include <armnn/QuantizedLstmParams.hpp>
#include <backendsCommon/Workload.hpp>
#include <backendsCommon/WorkloadData.hpp>

#include <arm_compute/graph/Tensor.h>
#include <arm_compute/runtime/NEON/functions/NELSTMLayerQuantized.h>

#include <memory>
14
15namespace armnn
16{
17
18class NeonQuantizedLstmWorkload : public BaseWorkload<QuantizedLstmQueueDescriptor>
19{
20public:
Francis Murtaghb3fc2522019-08-09 13:20:50 +010021 using BaseWorkload<QuantizedLstmQueueDescriptor>::m_Data;
Francis Murtagh4fc3c482019-08-02 13:20:54 +010022 NeonQuantizedLstmWorkload(const QuantizedLstmQueueDescriptor& descriptor, const WorkloadInfo& info);
23 virtual void Execute() const override;
24
25private:
26 mutable arm_compute::NELSTMLayerQuantized m_QuantizedLstmLayer;
27
28 std::unique_ptr<arm_compute::Tensor> m_InputToInputWeightsTensor;
29 std::unique_ptr<arm_compute::Tensor> m_InputToForgetWeightsTensor;
30 std::unique_ptr<arm_compute::Tensor> m_InputToCellWeightsTensor;
31 std::unique_ptr<arm_compute::Tensor> m_InputToOutputWeightsTensor;
32 std::unique_ptr<arm_compute::Tensor> m_RecurrentToInputWeightsTensor;
33 std::unique_ptr<arm_compute::Tensor> m_RecurrentToForgetWeightsTensor;
34 std::unique_ptr<arm_compute::Tensor> m_RecurrentToCellWeightsTensor;
35 std::unique_ptr<arm_compute::Tensor> m_RecurrentToOutputWeightsTensor;
36 std::unique_ptr<arm_compute::Tensor> m_InputGateBiasTensor;
37 std::unique_ptr<arm_compute::Tensor> m_ForgetGateBiasTensor;
38 std::unique_ptr<arm_compute::Tensor> m_CellBiasTensor;
39 std::unique_ptr<arm_compute::Tensor> m_OutputGateBiasTensor;
40 std::unique_ptr<arm_compute::Tensor> m_CellStateInTensor;
41 std::unique_ptr<arm_compute::Tensor> m_OutputStateInTensor;
42 std::unique_ptr<arm_compute::Tensor> m_CellStateOutTensor;
43
44 void FreeUnusedTensors();
45};
46
47arm_compute::Status NeonQuantizedLstmWorkloadValidate(const TensorInfo& input,
48 const TensorInfo& outputStateIn,
49 const TensorInfo& cellStateIn,
50 const TensorInfo& outputStateOut,
51 const TensorInfo& cellStateOut,
52 const QuantizedLstmInputParamsInfo& paramsInfo);
53
54} //namespace armnn