Blame - ArmnnPreparedModel.cpp - ml/android-nn-driver

blob: 2cd560d76d9592893d18a45ca1c27d444b7d7db8 [file] [log] [blame]

telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	1	//
				2	// Copyright © 2017 Arm Ltd. All rights reserved.
David Beck	93e4898	2018-09-05 13:05:09 +0100	[diff] [blame]	3	// SPDX-License-Identifier: MIT
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	4	//
				5
				6	#define LOG_TAG "ArmnnDriver"
				7
				8	#include "ArmnnPreparedModel.hpp"
				9	#include "Utils.hpp"
				10
				11	#include <boost/format.hpp>
				12	#include <log/log.h>
				13	#include <OperationsUtils.h>
surmeh01	deb3bdb	2018-07-05 12:06:04 +0100	[diff] [blame]	14	#include <ValidateHal.h>
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	15
surmeh01	deb3bdb	2018-07-05 12:06:04 +0100	[diff] [blame]	16
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	17	#include <cassert>
				18	#include <cinttypes>
				19
				20	using namespace android;
				21
				22	namespace
				23	{
				24	using namespace armnn_driver;
				25
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	26	void NotifyCallbackAndCheck(const ::android::sp<V1_0::IExecutionCallback>& callback, V1_0::ErrorStatus errorStatus,
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	27	std::string callingFunction)
				28	{
				29	Return<void> returned = callback->notify(errorStatus);
				30	// This check is required, if the callback fails and it isn't checked it will bring down the service
				31	if (!returned.isOk())
				32	{
				33	ALOGE("ArmnnDriver::%s: hidl callback failed to return properly: %s",
				34	callingFunction.c_str(), returned.description().c_str());
				35	}
				36	}
				37
				38	bool ValidateRequestArgument(const RequestArgument& requestArg, const armnn::TensorInfo& tensorInfo)
				39	{
				40	if (requestArg.dimensions.size() != 0)
				41	{
				42	if (requestArg.dimensions.size() != tensorInfo.GetNumDimensions())
				43	{
				44	ALOGE("Mismatched dimensions (request argument: %zu, expected: %u)",
				45	requestArg.dimensions.size(), tensorInfo.GetNumDimensions());
				46	return false;
				47	}
				48
				49	for (unsigned int d = 0; d < tensorInfo.GetNumDimensions(); ++d)
				50	{
				51	if (requestArg.dimensions[d] != tensorInfo.GetShape()[d])
				52	{
				53	ALOGE("Mismatched size for dimension %d (request argument: %u, expected %u)",
				54	d, requestArg.dimensions[d], tensorInfo.GetShape()[d]);
				55	return false;
				56	}
				57	}
				58	}
				59
				60	return true;
				61	}
				62
				63	armnn::Tensor GetTensorForRequestArgument(const RequestArgument& requestArg,
				64	const armnn::TensorInfo& tensorInfo,
				65	const std::vector<::android::nn::RunTimePoolInfo>& requestPools)
				66	{
				67	if (!ValidateRequestArgument(requestArg, tensorInfo))
				68	{
				69	return armnn::Tensor();
				70	}
				71
				72	return armnn::Tensor(tensorInfo, GetMemoryFromPool(requestArg.location, requestPools));
				73	}
				74
				75	inline std::string BuildTensorName(const char* tensorNamePrefix, std::size_t index)
				76	{
				77	return tensorNamePrefix + std::to_string(index);
				78	}
				79
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	80	} // anonymous namespace
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	81
telsoa01	ce3e84a	2018-08-31 09:31:35 +0100	[diff] [blame]	82	using namespace android::hardware;
				83
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	84	namespace armnn_driver
				85	{
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	86	template<typename HalVersion>
Mike Kelly	65c42dc	2019-07-22 14:06:00 +0100	[diff] [blame]	87	RequestThread<ArmnnPreparedModel, HalVersion, ArmnnCallback_1_0> ArmnnPreparedModel<HalVersion>::m_RequestThread;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	88
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	89	template<typename HalVersion>
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	90	template <typename TensorBindingCollection>
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	91	void ArmnnPreparedModel<HalVersion>::DumpTensorsIfRequired(char const* tensorNamePrefix,
				92	const TensorBindingCollection& tensorBindings)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	93	{
				94	if (!m_RequestInputsAndOutputsDumpDir.empty())
				95	{
				96	const std::string requestName = boost::str(boost::format("%1%_%2%.dump") % m_NetworkId % m_RequestCount);
				97	for (std::size_t i = 0u; i < tensorBindings.size(); ++i)
				98	{
				99	DumpTensor(m_RequestInputsAndOutputsDumpDir,
				100	requestName,
				101	BuildTensorName(tensorNamePrefix, i),
				102	tensorBindings[i].second);
				103	}
				104	}
				105	}
				106
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	107	template<typename HalVersion>
				108	ArmnnPreparedModel<HalVersion>::ArmnnPreparedModel(armnn::NetworkId networkId,
				109	armnn::IRuntime* runtime,
				110	const HalModel& model,
				111	const std::string& requestInputsAndOutputsDumpDir,
				112	const bool gpuProfilingEnabled)
telsoa01	ce3e84a	2018-08-31 09:31:35 +0100	[diff] [blame]	113	: m_NetworkId(networkId)
				114	, m_Runtime(runtime)
				115	, m_Model(model)
				116	, m_RequestCount(0)
				117	, m_RequestInputsAndOutputsDumpDir(requestInputsAndOutputsDumpDir)
				118	, m_GpuProfilingEnabled(gpuProfilingEnabled)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	119	{
telsoa01	ce3e84a	2018-08-31 09:31:35 +0100	[diff] [blame]	120	// Enable profiling if required.
				121	m_Runtime->GetProfiler(m_NetworkId)->EnableProfiling(m_GpuProfilingEnabled);
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	122	}
				123
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	124	template<typename HalVersion>
				125	ArmnnPreparedModel<HalVersion>::~ArmnnPreparedModel()
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	126	{
telsoa01	ce3e84a	2018-08-31 09:31:35 +0100	[diff] [blame]	127	// Get a hold of the profiler used by this model.
				128	std::shared_ptr<armnn::IProfiler> profiler = m_Runtime->GetProfiler(m_NetworkId);
				129
				130	// Unload the network associated with this model.
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	131	m_Runtime->UnloadNetwork(m_NetworkId);
telsoa01	ce3e84a	2018-08-31 09:31:35 +0100	[diff] [blame]	132
				133	// Dump the profiling info to a file if required.
				134	DumpJsonProfilingIfRequired(m_GpuProfilingEnabled, m_RequestInputsAndOutputsDumpDir, m_NetworkId, profiler.get());
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	135	}
				136
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	137	template<typename HalVersion>
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	138	Return<V1_0::ErrorStatus> ArmnnPreparedModel<HalVersion>::execute(
				139	const V1_0::Request& request,
				140	const ::android::sp<V1_0::IExecutionCallback>& callback)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	141	{
				142	ALOGV("ArmnnPreparedModel::execute(): %s", GetModelSummary(m_Model).c_str());
				143	m_RequestCount++;
				144
				145	if (callback.get() == nullptr) {
				146	ALOGE("ArmnnPreparedModel::execute invalid callback passed");
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	147	return V1_0::ErrorStatus::INVALID_ARGUMENT;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	148	}
				149
				150	if (!android::nn::validateRequest(request, m_Model))
				151	{
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	152	NotifyCallbackAndCheck(callback, V1_0::ErrorStatus::INVALID_ARGUMENT, "ArmnnPreparedModel::execute");
				153	return V1_0::ErrorStatus::INVALID_ARGUMENT;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	154	}
				155
				156	if (!m_RequestInputsAndOutputsDumpDir.empty())
				157	{
				158	ALOGD("Dumping inputs and outputs for request %" PRIuPTR, reinterpret_cast<std::uintptr_t>(callback.get()));
				159	}
				160
				161	// allocate the tensors on the heap, as they are passed to the request thread
				162	auto pInputTensors = std::make_shared<armnn::InputTensors>();
				163	auto pOutputTensors = std::make_shared<armnn::OutputTensors>();
				164
				165	// map the memory pool into shared pointers
				166	// use a shared memory pools vector on the heap, as it is passed to the request thread
				167	auto pMemPools = std::make_shared<std::vector<android::nn::RunTimePoolInfo>>();
				168	if (!setRunTimePoolInfosFromHidlMemories(pMemPools.get(), request.pools))
				169	{
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	170	NotifyCallbackAndCheck(callback, V1_0::ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::execute");
				171	return V1_0::ErrorStatus::GENERAL_FAILURE;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	172	}
				173
				174	// add the inputs and outputs with their data
				175	try
				176	{
				177	pInputTensors->reserve(request.inputs.size());
				178	for (unsigned int i = 0; i < request.inputs.size(); i++)
				179	{
				180	const auto& inputArg = request.inputs[i];
				181
				182	const armnn::TensorInfo inputTensorInfo = m_Runtime->GetInputTensorInfo(m_NetworkId, i);
				183	const armnn::Tensor inputTensor = GetTensorForRequestArgument(inputArg, inputTensorInfo, *pMemPools);
				184	if (inputTensor.GetMemoryArea() == nullptr)
				185	{
				186	ALOGE("Cannot execute request. Error converting request input %u to tensor", i);
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	187	return V1_0::ErrorStatus::GENERAL_FAILURE;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	188	}
				189
				190	pInputTensors->emplace_back(i, inputTensor);
				191	}
				192
				193	pOutputTensors->reserve(request.outputs.size());
				194	for (unsigned int i = 0; i < request.outputs.size(); i++)
				195	{
				196	const auto& outputArg = request.outputs[i];
				197
				198	const armnn::TensorInfo outputTensorInfo = m_Runtime->GetOutputTensorInfo(m_NetworkId, i);
				199	const armnn::Tensor outputTensor = GetTensorForRequestArgument(outputArg, outputTensorInfo, *pMemPools);
				200	if (outputTensor.GetMemoryArea() == nullptr)
				201	{
				202	ALOGE("Cannot execute request. Error converting request output %u to tensor", i);
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	203	return V1_0::ErrorStatus::GENERAL_FAILURE;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	204	}
				205
				206	pOutputTensors->emplace_back(i, outputTensor);
				207	}
				208	}
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	209	catch (armnn::Exception& e)
				210	{
				211	ALOGW("armnn::Exception caught while preparing for EnqueueWorkload: %s", e.what());
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	212	NotifyCallbackAndCheck(callback, V1_0::ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::execute");
				213	return V1_0::ErrorStatus::GENERAL_FAILURE;
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	214	}
Derek Lamberti	b9cb844	2019-11-28 13:34:48 +0000	[diff] [blame]	215	catch (std::exception& e)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	216	{
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	217	ALOGE("std::exception caught while preparing for EnqueueWorkload: %s", e.what());
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	218	NotifyCallbackAndCheck(callback, V1_0::ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::execute");
				219	return V1_0::ErrorStatus::GENERAL_FAILURE;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	220	}
				221
				222	ALOGV("ArmnnPreparedModel::execute(...) before PostMsg");
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	223
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	224	auto cb = [callback](V1_0::ErrorStatus errorStatus, std::string callingFunction)
Mike Kelly	65c42dc	2019-07-22 14:06:00 +0100	[diff] [blame]	225	{
				226	NotifyCallbackAndCheck(callback, errorStatus, callingFunction);
				227	};
				228
				229	ArmnnCallback_1_0 armnnCb;
				230	armnnCb.callback = cb;
				231	// post the request for asynchronous execution
				232	m_RequestThread.PostMsg(this, pMemPools, pInputTensors, pOutputTensors, armnnCb);
				233	ALOGV("ArmnnPreparedModel::execute(...) after PostMsg");
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	234	return V1_0::ErrorStatus::NONE; // successfully queued
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	235	}
				236
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	237	template<typename HalVersion>
				238	void ArmnnPreparedModel<HalVersion>::ExecuteGraph(
				239	std::shared_ptr<std::vector<::android::nn::RunTimePoolInfo>>& pMemPools,
				240	std::shared_ptr<armnn::InputTensors>& pInputTensors,
				241	std::shared_ptr<armnn::OutputTensors>& pOutputTensors,
Mike Kelly	65c42dc	2019-07-22 14:06:00 +0100	[diff] [blame]	242	ArmnnCallback_1_0 cb)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	243	{
				244	ALOGV("ArmnnPreparedModel::ExecuteGraph(...)");
				245
				246	DumpTensorsIfRequired("Input", *pInputTensors);
				247
				248	// run it
				249	try
				250	{
Matthew Bentham	16196e2	2019-04-01 17:17:58 +0100	[diff] [blame]	251	armnn::Status status = m_Runtime->EnqueueWorkload(m_NetworkId, pInputTensors, pOutputTensors);
				252	if (status != armnn::Status::Success)
				253	{
				254	ALOGW("EnqueueWorkload failed");
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	255	cb.callback(V1_0::ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::ExecuteGraph");
Matthew Bentham	16196e2	2019-04-01 17:17:58 +0100	[diff] [blame]	256	return;
				257	}
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	258	}
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	259	catch (armnn::Exception& e)
				260	{
				261	ALOGW("armnn::Exception caught from EnqueueWorkload: %s", e.what());
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	262	cb.callback(V1_0::ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::ExecuteGraph");
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	263	return;
				264	}
Derek Lamberti	b9cb844	2019-11-28 13:34:48 +0000	[diff] [blame]	265	catch (std::exception& e)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	266	{
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	267	ALOGE("std::exception caught from EnqueueWorkload: %s", e.what());
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	268	cb.callback(V1_0::ErrorStatus::GENERAL_FAILURE, "ArmnnPreparedModel::ExecuteGraph");
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	269	return;
				270	}
				271
				272	DumpTensorsIfRequired("Output", *pOutputTensors);
				273
				274	// Commit output buffers.
				275	// Note that we update all pools, even if they aren't actually used as outputs -
				276	// this is simpler and is what the CpuExecutor does.
				277	for (android::nn::RunTimePoolInfo& pool : *pMemPools)
				278	{
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	279	// Type android::nn::RunTimePoolInfo has changed between Android P & Q and Android R, where
				280	// update() has been removed and flush() added.
				281	#if defined(ARMNN_ANDROID_R) // Use the new Android implementation.
				282	pool.flush();
				283	#else
				284	pool.update();
				285	#endif
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	286	}
				287
Kevin May	ec1e5b8	2020-02-26 17:00:39 +0000	[diff] [blame^]	288	cb.callback(V1_0::ErrorStatus::NONE, "ExecuteGraph");
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	289	}
				290
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	291	template<typename HalVersion>
Matthew Bentham	16196e2	2019-04-01 17:17:58 +0100	[diff] [blame]	292	bool ArmnnPreparedModel<HalVersion>::ExecuteWithDummyInputs()
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	293	{
				294	std::vector<std::vector<char>> storage;
				295	armnn::InputTensors inputTensors;
				296	for (unsigned int i = 0; i < m_Model.inputIndexes.size(); i++)
				297	{
				298	const armnn::TensorInfo inputTensorInfo = m_Runtime->GetInputTensorInfo(m_NetworkId, i);
				299	storage.emplace_back(inputTensorInfo.GetNumBytes());
				300	const armnn::ConstTensor inputTensor(inputTensorInfo, storage.back().data());
				301
				302	inputTensors.emplace_back(i, inputTensor);
				303	}
				304
				305	armnn::OutputTensors outputTensors;
				306	for (unsigned int i = 0; i < m_Model.outputIndexes.size(); i++)
				307	{
				308	const armnn::TensorInfo outputTensorInfo = m_Runtime->GetOutputTensorInfo(m_NetworkId, i);
				309	storage.emplace_back(outputTensorInfo.GetNumBytes());
				310	const armnn::Tensor outputTensor(outputTensorInfo, storage.back().data());
				311
				312	outputTensors.emplace_back(i, outputTensor);
				313	}
				314
				315	try
				316	{
Matthew Bentham	16196e2	2019-04-01 17:17:58 +0100	[diff] [blame]	317	armnn::Status status = m_Runtime->EnqueueWorkload(m_NetworkId, inputTensors, outputTensors);
				318	if (status != armnn::Status::Success)
				319	{
				320	ALOGW("ExecuteWithDummyInputs: EnqueueWorkload failed");
				321	return false;
				322	}
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	323	}
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	324	catch (armnn::Exception& e)
				325	{
				326	ALOGW("ExecuteWithDummyInputs: armnn::Exception caught from EnqueueWorkload: %s", e.what());
				327	return false;
				328	}
Derek Lamberti	b9cb844	2019-11-28 13:34:48 +0000	[diff] [blame]	329	catch (std::exception& e)
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	330	{
Kevin May	7bdaac5	2020-02-10 12:10:07 +0000	[diff] [blame]	331	ALOGE("ExecuteWithDummyInputs: std::exception caught from EnqueueWorkload: %s", e.what());
Matthew Bentham	16196e2	2019-04-01 17:17:58 +0100	[diff] [blame]	332	return false;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	333	}
Matthew Bentham	16196e2	2019-04-01 17:17:58 +0100	[diff] [blame]	334	return true;
telsoa01	5307bc1	2018-03-09 13:51:08 +0000	[diff] [blame]	335	}
				336
arovir01	b0717b5	2018-09-05 17:03:25 +0100	[diff] [blame]	337	///
				338	/// Class template specializations
				339	///
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	340
arovir01	b0717b5	2018-09-05 17:03:25 +0100	[diff] [blame]	341	template class ArmnnPreparedModel<hal_1_0::HalPolicy>;
				342
Matteo Martincigh	8b287c2	2018-09-07 09:25:10 +0100	[diff] [blame]	343	#ifdef ARMNN_ANDROID_NN_V1_1
arovir01	b0717b5	2018-09-05 17:03:25 +0100	[diff] [blame]	344	template class ArmnnPreparedModel<hal_1_1::HalPolicy>;
Matteo Martincigh	e48bdff	2018-09-03 13:50:50 +0100	[diff] [blame]	345	#endif
				346
Mike Kelly	b5fdf38	2019-06-11 16:35:25 +0100	[diff] [blame]	347	#ifdef ARMNN_ANDROID_NN_V1_2
				348	template class ArmnnPreparedModel<hal_1_1::HalPolicy>;
				349	template class ArmnnPreparedModel<hal_1_2::HalPolicy>;
				350	#endif
Nikhil Raj	7760582	2018-09-03 11:25:56 +0100	[diff] [blame]	351	} // namespace armnn_driver