Blame - src/backends/backendsCommon/test/EndToEndTestImpl.hpp - ml/armnn

blob: a5fe8c6a625e1b9c3c32a2684807c2bcd1334b42 [file] [log] [blame]

Aron Virginas-Tar	7010400	2018-10-24 15:33:28 +0100	[diff] [blame]	1	//
				2	// Copyright © 2017 Arm Ltd. All rights reserved.
				3	// SPDX-License-Identifier: MIT
				4	//
				5	#pragma once
				6
Mike Kelly	386ff1a	2021-03-29 15:04:50 +0100	[diff] [blame]	7	#include "CommonTestUtils.hpp"
				8
Matthew Bentham	246bd46	2020-01-20 16:16:06 +0000	[diff] [blame]	9	#include <armnn/Descriptors.hpp>
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	10	#include <armnn/INetwork.hpp>
Matthew Bentham	246bd46	2020-01-20 16:16:06 +0000	[diff] [blame]	11	#include <armnn/IRuntime.hpp>
Aron Virginas-Tar	7010400	2018-10-24 15:33:28 +0100	[diff] [blame]	12
Aron Virginas-Tar	48623a0	2019-10-22 10:00:28 +0100	[diff] [blame]	13	#include <Profiling.hpp>
				14	#include <QuantizeHelper.hpp>
				15	#include <ResolveType.hpp>
Aron Virginas-Tar	7010400	2018-10-24 15:33:28 +0100	[diff] [blame]	16
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	17	#include <boost/test/unit_test.hpp>
				18
Aron Virginas-Tar	7010400	2018-10-24 15:33:28 +0100	[diff] [blame]	19	#include <vector>
				20
				21	namespace
				22	{
				23
				24	using namespace armnn;
				25
				26	template<typename T>
				27	bool ConstantUsageTest(const std::vector<BackendId>& computeDevice,
				28	const TensorInfo& commonTensorInfo,
				29	const std::vector<T>& inputData,
				30	const std::vector<T>& constantData,
				31	const std::vector<T>& expectedOutputData)
				32	{
				33	// Create runtime in which test will run
				34	IRuntime::CreationOptions options;
				35	IRuntimePtr runtime(IRuntime::Create(options));
				36
				37	// Builds up the structure of the network.
				38	INetworkPtr net(INetwork::Create());
				39
				40	IConnectableLayer* input = net->AddInputLayer(0);
				41	IConnectableLayer* constant = net->AddConstantLayer(ConstTensor(commonTensorInfo, constantData));
				42	IConnectableLayer* add = net->AddAdditionLayer();
				43	IConnectableLayer* output = net->AddOutputLayer(0);
				44
				45	input->GetOutputSlot(0).Connect(add->GetInputSlot(0));
				46	constant->GetOutputSlot(0).Connect(add->GetInputSlot(1));
				47	add->GetOutputSlot(0).Connect(output->GetInputSlot(0));
				48
				49	// Sets the tensors in the network.
				50	input->GetOutputSlot(0).SetTensorInfo(commonTensorInfo);
				51	constant->GetOutputSlot(0).SetTensorInfo(commonTensorInfo);
				52	add->GetOutputSlot(0).SetTensorInfo(commonTensorInfo);
				53
				54	// optimize the network
				55	IOptimizedNetworkPtr optNet = Optimize(*net, computeDevice, runtime->GetDeviceSpec());
				56
				57	// Loads it into the runtime.
				58	NetworkId netId;
				59	runtime->LoadNetwork(netId, std::move(optNet));
				60
				61	// Creates structures for input & output.
				62	std::vector<T> outputData(inputData.size());
				63
				64	InputTensors inputTensors
				65	{
				66	{0, ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())}
				67	};
				68	OutputTensors outputTensors
				69	{
				70	{0, Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData.data())}
				71	};
				72
				73	// Does the inference.
				74	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				75
				76	// Checks the results.
				77	return outputData == expectedOutputData;
				78	}
				79
				80	inline bool ConstantUsageFloat32Test(const std::vector<BackendId>& backends)
				81	{
				82	const TensorInfo commonTensorInfo({ 2, 3 }, DataType::Float32);
				83
				84	return ConstantUsageTest(backends,
				85	commonTensorInfo,
				86	std::vector<float>{ 1.f, 2.f, 3.f, 4.f, 5.f, 6.f }, // Input.
				87	std::vector<float>{ 6.f, 5.f, 4.f, 3.f, 2.f, 1.f }, // Const input.
				88	std::vector<float>{ 7.f, 7.f, 7.f, 7.f, 7.f, 7.f } // Expected output.
				89	);
				90	}
				91
				92	inline bool ConstantUsageUint8Test(const std::vector<BackendId>& backends)
				93	{
Derek Lamberti	f90c56d	2020-01-10 17:14:08 +0000	[diff] [blame]	94	TensorInfo commonTensorInfo({ 2, 3 }, DataType::QAsymmU8);
Aron Virginas-Tar	7010400	2018-10-24 15:33:28 +0100	[diff] [blame]	95
				96	const float scale = 0.023529f;
				97	const int8_t offset = -43;
				98
				99	commonTensorInfo.SetQuantizationScale(scale);
				100	commonTensorInfo.SetQuantizationOffset(offset);
				101
				102	return ConstantUsageTest(backends,
				103	commonTensorInfo,
Aron Virginas-Tar	48623a0	2019-10-22 10:00:28 +0100	[diff] [blame]	104	armnnUtils::QuantizedVector<uint8_t>({ 1.f, 2.f, 3.f, 4.f, 5.f, 6.f }, scale, offset), // Input.
				105	armnnUtils::QuantizedVector<uint8_t>({ 6.f, 5.f, 4.f, 3.f, 2.f, 1.f }, scale, offset), // Const input.
				106	armnnUtils::QuantizedVector<uint8_t>({ 7.f, 7.f, 7.f, 7.f, 7.f, 7.f }, scale, offset) // Expected output.
Aron Virginas-Tar	7010400	2018-10-24 15:33:28 +0100	[diff] [blame]	107	);
				108	}
				109
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	110	// Utility function to find the number of instances of a substring within a string.
				111	int SubStringCounter(std::string& string, std::string&& substring)
				112	{
				113	std::size_t found = 0;
				114	int count = 0;
				115	// Look for the substring starting from where we last found the substring
				116	while((found = string.find(substring, found)) != std::string::npos)
				117	{
				118	count++;
				119	// Offset by substring length to avoid finding the same substring twice
				120	found += substring.length();
				121	}
				122	return count;
				123	}
				124
Nattapat Chaimanowong	1fcb4ff	2019-01-24 15:25:26 +0000	[diff] [blame]	125	template<DataType ArmnnIType, DataType ArmnnOType,
				126	typename TInput = ResolveType<ArmnnIType>, typename TOutput = ResolveType<ArmnnOType>>
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	127	void EndToEndLayerTestImpl(INetworkPtr network,
kevmay01	2b4d88e	2019-01-24 14:05:09 +0000	[diff] [blame]	128	const std::map<int, std::vector<TInput>>& inputTensorData,
				129	const std::map<int, std::vector<TOutput>>& expectedOutputData,
Jan Eilers	bca73e1	2020-03-11 12:52:46 +0000	[diff] [blame]	130	std::vector<BackendId> backends,
				131	float tolerance = 0.000001f)
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	132	{
				133	// Create runtime in which test will run
				134	IRuntime::CreationOptions options;
				135	IRuntimePtr runtime(IRuntime::Create(options));
				136
				137	// optimize the network
				138	IOptimizedNetworkPtr optNet = Optimize(*network, backends, runtime->GetDeviceSpec());
				139
				140	// Loads it into the runtime.
				141	NetworkId netId;
				142	runtime->LoadNetwork(netId, std::move(optNet));
				143
				144	InputTensors inputTensors;
				145	inputTensors.reserve(inputTensorData.size());
				146	for (auto&& it : inputTensorData)
				147	{
				148	inputTensors.push_back({it.first,
				149	ConstTensor(runtime->GetInputTensorInfo(netId, it.first), it.second.data())});
				150	}
				151	OutputTensors outputTensors;
				152	outputTensors.reserve(expectedOutputData.size());
kevmay01	2b4d88e	2019-01-24 14:05:09 +0000	[diff] [blame]	153	std::map<int, std::vector<TOutput>> outputStorage;
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	154	for (auto&& it : expectedOutputData)
				155	{
kevmay01	2b4d88e	2019-01-24 14:05:09 +0000	[diff] [blame]	156	std::vector<TOutput> out(it.second.size());
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	157	outputStorage.emplace(it.first, out);
				158	outputTensors.push_back({it.first,
				159	Tensor(runtime->GetOutputTensorInfo(netId, it.first),
				160	outputStorage.at(it.first).data())});
				161	}
				162
				163	// Does the inference.
				164	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				165
				166	// Checks the results.
				167	for (auto&& it : expectedOutputData)
				168	{
kevmay01	2b4d88e	2019-01-24 14:05:09 +0000	[diff] [blame]	169	std::vector<TOutput> out = outputStorage.at(it.first);
Aron Virginas-Tar	f97f6da	2019-10-01 18:35:44 +0100	[diff] [blame]	170	for (unsigned int i = 0; i < out.size(); ++i)
Nattapat Chaimanowong	1fcb4ff	2019-01-24 15:25:26 +0000	[diff] [blame]	171	{
Teresa Charlin	2e3f4d2	2020-07-29 14:29:20 +0100	[diff] [blame]	172	BOOST_CHECK_MESSAGE(Compare<ArmnnOType>(it.second[i], out[i], tolerance) == true,
				173	"Actual output: " << out[i] << ". Expected output:" << it.second[i]);
				174
Nattapat Chaimanowong	1fcb4ff	2019-01-24 15:25:26 +0000	[diff] [blame]	175	}
narpra01	b9546cf	2018-11-20 15:21:28 +0000	[diff] [blame]	176	}
				177	}
				178
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	179	inline void ImportNonAlignedInputPointerTest(std::vector<BackendId> backends)
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	180	{
				181	using namespace armnn;
				182
				183	// Create runtime in which test will run
				184	IRuntime::CreationOptions options;
				185	IRuntimePtr runtime(armnn::IRuntime::Create(options));
				186
				187	// build up the structure of the network
				188	INetworkPtr net(INetwork::Create());
				189
				190	IConnectableLayer* input = net->AddInputLayer(0);
				191
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	192	ActivationDescriptor descriptor;
				193	descriptor.m_Function = ActivationFunction::Square;
				194	IConnectableLayer* pooling = net->AddActivationLayer(descriptor);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	195
				196	IConnectableLayer* output = net->AddOutputLayer(0);
				197
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	198	input->GetOutputSlot(0).Connect(pooling->GetInputSlot(0));
				199	pooling->GetOutputSlot(0).Connect(output->GetInputSlot(0));
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	200
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	201	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				202	pooling->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	203
				204	// Optimize the network
				205	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	206	BOOST_CHECK(optNet);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	207
				208	// Loads it into the runtime.
				209	NetworkId netId;
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	210	std::string ignoredErrorMessage;
				211	// Enable Importing
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	212	INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Undefined);
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	213	runtime->LoadNetwork(netId, std::move(optNet), ignoredErrorMessage, networkProperties);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	214
				215	// Creates structures for input & output
				216	std::vector<float> inputData
				217	{
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	218	1.0f, 2.0f, 3.0f, 4.0f
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	219	};
				220
				221	// Misaligned input
Aron Virginas-Tar	d9f7c8b	2019-09-13 13:37:03 +0100	[diff] [blame]	222	float* misalignedInputData = reinterpret_cast<float>(reinterpret_cast<char>(inputData.data()) + 1);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	223
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	224	std::vector<float> outputData(4);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	225
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	226	// Aligned output
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	227	float* alignedOutputData = outputData.data();
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	228
				229	InputTensors inputTensors
				230	{
				231	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), misalignedInputData)},
				232	};
				233	OutputTensors outputTensors
				234	{
				235	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), alignedOutputData)}
				236	};
				237
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	238	runtime->GetProfiler(netId)->EnableProfiling(true);
				239
				240	// Do the inference and expect it to fail with a ImportMemoryException
				241	BOOST_CHECK_THROW(runtime->EnqueueWorkload(netId, inputTensors, outputTensors), MemoryImportException);
				242	}
				243
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	244	inline void ExportNonAlignedOutputPointerTest(std::vector<BackendId> backends)
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	245	{
				246	using namespace armnn;
				247
				248	// Create runtime in which test will run
				249	IRuntime::CreationOptions options;
				250	IRuntimePtr runtime(armnn::IRuntime::Create(options));
				251
				252	// build up the structure of the network
				253	INetworkPtr net(INetwork::Create());
				254
				255	IConnectableLayer* input = net->AddInputLayer(0);
				256
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	257	ActivationDescriptor descriptor;
				258	descriptor.m_Function = ActivationFunction::Square;
				259	IConnectableLayer* pooling = net->AddActivationLayer(descriptor);
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	260
				261	IConnectableLayer* output = net->AddOutputLayer(0);
				262
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	263	input->GetOutputSlot(0).Connect(pooling->GetInputSlot(0));
				264	pooling->GetOutputSlot(0).Connect(output->GetInputSlot(0));
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	265
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	266	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				267	pooling->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	268
				269	// Optimize the network
				270	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	271	BOOST_CHECK(optNet);
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	272
				273	// Loads it into the runtime.
				274	NetworkId netId;
				275	std::string ignoredErrorMessage;
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	276	// Enable Importing and Exporting
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	277	INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Malloc);
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	278	runtime->LoadNetwork(netId, std::move(optNet), ignoredErrorMessage, networkProperties);
				279
				280	// Creates structures for input & output
				281	std::vector<float> inputData
				282	{
				283	1.0f, 2.0f, 3.0f, 4.0f, 5.0f
				284	};
				285
				286	// Aligned input
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	287	float* alignedInputData = inputData.data();
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	288
				289	std::vector<float> outputData(5);
				290
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	291	// Misaligned output
Aron Virginas-Tar	d9f7c8b	2019-09-13 13:37:03 +0100	[diff] [blame]	292	float* misalignedOutputData = reinterpret_cast<float>(reinterpret_cast<char>(outputData.data()) + 1);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	293
				294	InputTensors inputTensors
				295	{
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	296	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), alignedInputData)},
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	297	};
				298	OutputTensors outputTensors
				299	{
				300	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), misalignedOutputData)}
				301	};
				302
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	303	// Do the inference and expect it to fail with a ExportMemoryException
				304	if (backends[0] == Compute::CpuAcc)
				305	{
				306	// For CpuAcc the NeonTensorHandle will throw its own exception on misaligned memory
				307	BOOST_CHECK_THROW(runtime->EnqueueWorkload(netId, inputTensors, outputTensors), MemoryImportException);
				308	}
				309	else
				310	{
				311	BOOST_CHECK_THROW(runtime->EnqueueWorkload(netId, inputTensors, outputTensors), MemoryExportException);
				312	}
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	313	}
				314
				315	inline void ImportAlignedPointerTest(std::vector<BackendId> backends)
				316	{
				317	using namespace armnn;
				318
				319	// Create runtime in which test will run
				320	IRuntime::CreationOptions options;
				321	IRuntimePtr runtime(armnn::IRuntime::Create(options));
				322
				323	// build up the structure of the network
				324	INetworkPtr net(INetwork::Create());
				325
				326	IConnectableLayer* input = net->AddInputLayer(0);
				327
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	328	ActivationDescriptor descriptor;
				329	descriptor.m_Function = ActivationFunction::Square;
				330	IConnectableLayer* pooling = net->AddActivationLayer(descriptor);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	331
				332	IConnectableLayer* output = net->AddOutputLayer(0);
				333
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	334	input->GetOutputSlot(0).Connect(pooling->GetInputSlot(0));
				335	pooling->GetOutputSlot(0).Connect(output->GetInputSlot(0));
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	336
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	337	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				338	pooling->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	339
				340	// Optimize the network
				341	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	342	BOOST_CHECK(optNet);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	343
				344	// Loads it into the runtime.
				345	NetworkId netId;
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	346	std::string ignoredErrorMessage;
				347	// Enable Importing
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	348	INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Malloc);
David Monahan	4f1e8e4	2019-09-04 09:22:10 +0100	[diff] [blame]	349	runtime->LoadNetwork(netId, std::move(optNet), ignoredErrorMessage, networkProperties);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	350
				351	// Creates structures for input & output
				352	std::vector<float> inputData
				353	{
				354	1.0f, 2.0f, 3.0f, 4.0f
				355	};
				356
				357	std::vector<float> outputData(4);
				358
James Conroy	57d10b7	2019-10-25 09:44:14 +0100	[diff] [blame]	359	std::vector<float> expectedOutput
				360	{
				361	1.0f, 4.0f, 9.0f, 16.0f
				362	};
				363
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	364	InputTensors inputTensors
				365	{
				366	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())},
				367	};
				368	OutputTensors outputTensors
				369	{
				370	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData.data())}
				371	};
				372
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	373	runtime->GetProfiler(netId)->EnableProfiling(true);
				374
				375	// Do the inference
				376	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				377
				378	// Retrieve the Profiler.Print() output to get the workload execution
				379	ProfilerManager& profilerManager = armnn::ProfilerManager::GetInstance();
				380	std::stringstream ss;
				381	profilerManager.GetProfiler()->Print(ss);;
				382	std::string dump = ss.str();
				383
David Monahan	3fb7e10	2019-08-20 11:25:29 +0100	[diff] [blame]	384	// Contains ActivationWorkload
				385	std::size_t found = dump.find("ActivationWorkload");
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	386	BOOST_TEST(found != std::string::npos);
James Conroy	57d10b7	2019-10-25 09:44:14 +0100	[diff] [blame]	387
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	388	// Contains SyncMemGeneric
				389	found = dump.find("SyncMemGeneric");
				390	BOOST_TEST(found != std::string::npos);
James Conroy	57d10b7	2019-10-25 09:44:14 +0100	[diff] [blame]	391
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	392	// Does not contain CopyMemGeneric
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	393	found = dump.find("CopyMemGeneric");
				394	BOOST_TEST(found == std::string::npos);
James Conroy	57d10b7	2019-10-25 09:44:14 +0100	[diff] [blame]	395
				396	// Check output is as expected
				397	BOOST_TEST(outputData == expectedOutput);
Ferran Balaguer	dcaa610	2019-08-21 13:28:38 +0100	[diff] [blame]	398	}
				399
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	400	inline void ImportOnlyWorkload(std::vector<BackendId> backends)
				401	{
				402	using namespace armnn;
				403
				404	IRuntime::CreationOptions options;
				405	IRuntimePtr runtime(IRuntime::Create(options));
				406
				407	// Builds up the structure of the network.
				408	INetworkPtr net(INetwork::Create());
				409
				410	IConnectableLayer* input = net->AddInputLayer(0);
				411
				412	ActivationDescriptor descriptor;
				413	descriptor.m_Function = ActivationFunction::Square;
				414	IConnectableLayer* pooling = net->AddActivationLayer(descriptor);
				415
				416	IConnectableLayer* output = net->AddOutputLayer(0);
				417
				418	input->GetOutputSlot(0).Connect(pooling->GetInputSlot(0));
				419	pooling->GetOutputSlot(0).Connect(output->GetInputSlot(0));
				420
				421	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				422	pooling->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				423
				424	// optimize the network
				425	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
				426
				427	BOOST_TEST_CHECKPOINT("Load Network");
				428	// Load it into the runtime. It should pass.
				429	NetworkId netId;
				430	std::string ignoredErrorMessage;
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	431
				432	INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Undefined);
				433
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	434	BOOST_TEST(runtime->LoadNetwork(netId, std::move(optNet),ignoredErrorMessage, networkProperties)
				435	== Status::Success);
				436
				437	BOOST_TEST_CHECKPOINT("Generate Data");
				438	// Creates structures for input & output
				439	std::vector<float> inputData
				440	{
				441	1.0f, 2.0f, 3.0f, 4.0f
				442	};
				443
				444	std::vector<float> outputData(4);
				445
				446	std::vector<float> expectedOutput
				447	{
				448	1.0f, 4.0f, 9.0f, 16.0f
				449	};
				450
				451	BOOST_TEST_CHECKPOINT("Create Network");
				452	InputTensors inputTensors
				453	{
				454	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())},
				455	};
				456	OutputTensors outputTensors
				457	{
				458	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData.data())}
				459	};
				460
				461	BOOST_TEST_CHECKPOINT("Get Profiler");
				462
				463	runtime->GetProfiler(netId)->EnableProfiling(true);
				464
				465	BOOST_TEST_CHECKPOINT("Run Inference");
				466	// Do the inference
				467	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				468
				469	BOOST_TEST_CHECKPOINT("Print Profiler");
				470	// Retrieve the Profiler.Print() output to get the workload execution
				471	ProfilerManager& profilerManager = armnn::ProfilerManager::GetInstance();
				472	std::stringstream ss;
				473	profilerManager.GetProfiler()->Print(ss);;
				474	std::string dump = ss.str();
				475
				476	// Check there are no SyncMemGeneric workloads as we didn't export
				477	BOOST_TEST_CHECKPOINT("Find SyncMemGeneric");
				478	int count = SubStringCounter(dump, "SyncMemGeneric");
				479	BOOST_TEST(count == 0);
				480
				481	// Should only be 1 CopyMemGeneric for the output as we imported
				482	BOOST_TEST_CHECKPOINT("Find CopyMemGeneric");
				483	count = SubStringCounter(dump, "CopyMemGeneric");
				484	BOOST_TEST(count == 1);
				485
				486	// Check the output is correct
				487	BOOST_CHECK_EQUAL_COLLECTIONS(outputData.begin(), outputData.end(), expectedOutput.begin(), expectedOutput.end());
				488	}
				489
				490	inline void ExportOnlyWorkload(std::vector<BackendId> backends)
				491	{
				492	using namespace armnn;
				493
				494	IRuntime::CreationOptions options;
				495	IRuntimePtr runtime(IRuntime::Create(options));
				496
				497	// Builds up the structure of the network.
				498	INetworkPtr net(INetwork::Create());
				499
				500	IConnectableLayer* input = net->AddInputLayer(0);
				501
				502	ActivationDescriptor descriptor;
				503	descriptor.m_Function = ActivationFunction::Square;
				504	IConnectableLayer* pooling = net->AddActivationLayer(descriptor);
				505
				506	IConnectableLayer* output = net->AddOutputLayer(0);
				507
				508	input->GetOutputSlot(0).Connect(pooling->GetInputSlot(0));
				509	pooling->GetOutputSlot(0).Connect(output->GetInputSlot(0));
				510
				511	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				512	pooling->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				513
				514	// optimize the network
				515	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
				516
				517	BOOST_TEST_CHECKPOINT("Load Network");
				518	// Load it into the runtime. It should pass.
				519	NetworkId netId;
				520	std::string ignoredErrorMessage;
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	521	INetworkProperties networkProperties(false, MemorySource::Undefined, MemorySource::Malloc);
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	522	BOOST_TEST(runtime->LoadNetwork(netId, std::move(optNet),ignoredErrorMessage, networkProperties)
				523	== Status::Success);
				524
				525	BOOST_TEST_CHECKPOINT("Generate Data");
				526	// Creates structures for input & output
				527	std::vector<float> inputData
				528	{
				529	1.0f, 2.0f, 3.0f, 4.0f
				530	};
				531
				532	std::vector<float> outputData(4);
				533
				534	std::vector<float> expectedOutput
				535	{
				536	1.0f, 4.0f, 9.0f, 16.0f
				537	};
				538
				539	BOOST_TEST_CHECKPOINT("Create Network");
				540	InputTensors inputTensors
				541	{
				542	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())},
				543	};
				544	OutputTensors outputTensors
				545	{
				546	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData.data())}
				547	};
				548
				549	BOOST_TEST_CHECKPOINT("Get Profiler");
				550
				551	runtime->GetProfiler(netId)->EnableProfiling(true);
				552
				553	BOOST_TEST_CHECKPOINT("Run Inference");
				554	// Do the inference
				555	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				556
				557	BOOST_TEST_CHECKPOINT("Print Profiler");
				558	// Retrieve the Profiler.Print() output to get the workload execution
				559	ProfilerManager& profilerManager = armnn::ProfilerManager::GetInstance();
				560	std::stringstream ss;
				561	profilerManager.GetProfiler()->Print(ss);;
				562	std::string dump = ss.str();
				563
				564	// Check there is a SyncMemGeneric workload as we exported
				565	BOOST_TEST_CHECKPOINT("Find SyncMemGeneric");
				566	int count = SubStringCounter(dump, "SyncMemGeneric");
				567	BOOST_TEST(count == 1);
				568
				569	// Should be 1 CopyMemGeneric for the output as we did not import
				570	BOOST_TEST_CHECKPOINT("Find CopyMemGeneric");
				571	count = SubStringCounter(dump, "CopyMemGeneric");
				572	BOOST_TEST(count == 1);
				573
				574	// Check the output is correct
				575	BOOST_CHECK_EQUAL_COLLECTIONS(outputData.begin(), outputData.end(), expectedOutput.begin(), expectedOutput.end());
				576	}
				577
				578	inline void ImportAndExportWorkload(std::vector<BackendId> backends)
				579	{
				580	using namespace armnn;
				581
				582	IRuntime::CreationOptions options;
				583	IRuntimePtr runtime(IRuntime::Create(options));
				584
				585	// Builds up the structure of the network.
				586	INetworkPtr net(INetwork::Create());
				587
				588	IConnectableLayer* input = net->AddInputLayer(0);
				589
				590	ActivationDescriptor descriptor;
				591	descriptor.m_Function = ActivationFunction::Square;
				592	IConnectableLayer* pooling = net->AddActivationLayer(descriptor);
				593
				594	IConnectableLayer* output = net->AddOutputLayer(0);
				595
				596	input->GetOutputSlot(0).Connect(pooling->GetInputSlot(0));
				597	pooling->GetOutputSlot(0).Connect(output->GetInputSlot(0));
				598
				599	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				600	pooling->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 1, 4 }, DataType::Float32));
				601
				602	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
				603
				604	BOOST_TEST_CHECKPOINT("Load Network");
				605	// Load it into the runtime. It should pass.
				606	NetworkId netId;
				607	std::string ignoredErrorMessage;
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	608
				609	INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Malloc);
				610
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	611	BOOST_TEST(runtime->LoadNetwork(netId, std::move(optNet),ignoredErrorMessage, networkProperties)
				612	== Status::Success);
				613
				614	BOOST_TEST_CHECKPOINT("Generate Data");
				615	// Creates structures for input & output
				616	std::vector<float> inputData
				617	{
				618	1.0f, 2.0f, 3.0f, 4.0f
				619	};
				620
				621	std::vector<float> outputData(4);
				622
				623	std::vector<float> expectedOutput
				624	{
				625	1.0f, 4.0f, 9.0f, 16.0f
				626	};
				627
				628	BOOST_TEST_CHECKPOINT("Create Network");
				629	InputTensors inputTensors
				630	{
				631	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())},
				632	};
				633	OutputTensors outputTensors
				634	{
				635	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData.data())}
				636	};
				637
				638	BOOST_TEST_CHECKPOINT("Get Profiler");
				639
				640	runtime->GetProfiler(netId)->EnableProfiling(true);
				641
				642	BOOST_TEST_CHECKPOINT("Run Inference");
				643	// Do the inference
				644	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				645
				646	BOOST_TEST_CHECKPOINT("Print Profiler");
				647	// Retrieve the Profiler.Print() output to get the workload execution
				648	ProfilerManager& profilerManager = armnn::ProfilerManager::GetInstance();
				649	std::stringstream ss;
				650	profilerManager.GetProfiler()->Print(ss);;
				651	std::string dump = ss.str();
				652
				653	// Check there is a SyncMemGeneric workload as we exported
				654	BOOST_TEST_CHECKPOINT("Find SyncMemGeneric");
				655	int count = SubStringCounter(dump, "SyncMemGeneric");
				656	BOOST_TEST(count == 1);
				657
				658	// Shouldn't be any CopyMemGeneric workloads
				659	BOOST_TEST_CHECKPOINT("Find CopyMemGeneric");
				660	count = SubStringCounter(dump, "CopyMemGeneric");
				661	BOOST_TEST(count == 0);
				662
				663	// Check the output is correct
				664	BOOST_CHECK_EQUAL_COLLECTIONS(outputData.begin(), outputData.end(), expectedOutput.begin(), expectedOutput.end());
				665	}
				666
				667	inline void ExportOutputWithSeveralOutputSlotConnectionsTest(std::vector<BackendId> backends)
				668	{
				669	using namespace armnn;
				670
				671	// Create runtime in which test will run
				672	IRuntime::CreationOptions options;
				673	IRuntimePtr runtime(armnn::IRuntime::Create(options));
				674
				675	// build up the structure of the network
				676	INetworkPtr net(INetwork::Create());
				677
				678	IConnectableLayer* input = net->AddInputLayer(0);
				679
				680	ActivationDescriptor descriptor;
				681	descriptor.m_Function = ActivationFunction::Square;
				682	IConnectableLayer* activation = net->AddActivationLayer(descriptor);
				683
				684	IConnectableLayer* output0 = net->AddOutputLayer(0);
				685	IConnectableLayer* output1 = net->AddOutputLayer(1);
				686
				687	input->GetOutputSlot(0).Connect(activation->GetInputSlot(0));
				688	activation->GetOutputSlot(0).Connect(output0->GetInputSlot(0));
				689	activation->GetOutputSlot(0).Connect(output1->GetInputSlot(0));
				690
				691	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 4, 1 }, DataType::Float32));
				692	activation->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 1, 1, 4, 1 }, DataType::Float32));
				693
				694	// Optimize the network
				695	IOptimizedNetworkPtr optNet = Optimize(*net, backends, runtime->GetDeviceSpec());
				696
				697	// Loads it into the runtime.
				698	NetworkId netId;
				699	std::string ignoredErrorMessage;
				700	// Enable Importing
Francis Murtagh	73d3e2e	2021-04-29 14:23:04 +0100	[diff] [blame^]	701	INetworkProperties networkProperties(false, MemorySource::Malloc, MemorySource::Malloc);
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	702	runtime->LoadNetwork(netId, std::move(optNet), ignoredErrorMessage, networkProperties);
				703
				704	// Creates structures for input & output
				705	std::vector<float> inputData
				706	{
				707	1.0f, 2.0f, 3.0f, 4.0f
				708	};
				709
				710	std::vector<float> outputData0(4);
				711	std::vector<float> outputData1(4);
				712
Narumol Prangnawarat	3b90af6	2020-06-26 11:00:21 +0100	[diff] [blame]	713	std::vector<float> expectedOutput
				714	{
				715	1.0f, 4.0f, 9.0f, 16.0f
				716	};
				717
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	718	InputTensors inputTensors
				719	{
				720	{0,armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())},
				721	};
				722	OutputTensors outputTensors
				723	{
				724	{0,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData0.data())},
				725	{1,armnn::Tensor(runtime->GetOutputTensorInfo(netId, 1), outputData1.data())}
				726	};
				727
				728	// The result of the inference is not important, just the fact that there
				729	// should not be CopyMemGeneric workloads.
				730	runtime->GetProfiler(netId)->EnableProfiling(true);
				731
				732	// Do the inference
				733	runtime->EnqueueWorkload(netId, inputTensors, outputTensors);
				734
				735	// Retrieve the Profiler.Print() output to get the workload execution
				736	ProfilerManager& profilerManager = armnn::ProfilerManager::GetInstance();
				737	std::stringstream ss;
				738	profilerManager.GetProfiler()->Print(ss);
				739	std::string dump = ss.str();
				740
				741	std::size_t found = std::string::npos;
				742
				743	if (backends[0] == Compute::CpuRef)
				744	{
				745	found = dump.find("RefActivationWorkload");
				746	}
				747	else if (backends[0] == Compute::CpuAcc)
				748	{
				749	found = dump.find("NeonActivationWorkload");
				750	}
				751	else if (backends[0] == Compute::GpuAcc)
				752	{
				753	found = dump.find("ClActivationWorkload");
				754	}
				755
				756	BOOST_TEST(found != std::string::npos);
				757	// No contains SyncMemGeneric
				758	found = dump.find("SyncMemGeneric");
				759	BOOST_TEST(found == std::string::npos);
				760	// Contains CopyMemGeneric
				761	found = dump.find("CopyMemGeneric");
				762	BOOST_TEST(found != std::string::npos);
Narumol Prangnawarat	3b90af6	2020-06-26 11:00:21 +0100	[diff] [blame]	763
				764	// Check that the outputs are correct
				765	BOOST_CHECK_EQUAL_COLLECTIONS(outputData0.begin(), outputData0.end(),
				766	expectedOutput.begin(), expectedOutput.end());
				767	BOOST_CHECK_EQUAL_COLLECTIONS(outputData1.begin(), outputData1.end(),
				768	expectedOutput.begin(), expectedOutput.end());
Ferran Balaguer	83239f9	2019-09-19 11:49:25 +0100	[diff] [blame]	769	}
				770
David Monahan	0a99a14	2020-03-13 07:52:54 +0000	[diff] [blame]	771	inline void StridedSliceInvalidSliceEndToEndTest(std::vector<BackendId> backends)
				772	{
				773	using namespace armnn;
				774
				775	// Create runtime in which test will run
				776	IRuntime::CreationOptions options;
				777	IRuntimePtr runtime(armnn::IRuntime::Create(options));
				778
				779	// build up the structure of the network
				780	INetworkPtr net(INetwork::Create());
				781
				782	IConnectableLayer* input = net->AddInputLayer(0);
				783
				784	// Configure a strided slice with a stride the same size as the input but with a ShrinkAxisMask on the first
				785	// dim of the output to make it too small to hold the specified slice.
				786	StridedSliceDescriptor descriptor;
				787	descriptor.m_Begin = {0, 0};
				788	descriptor.m_End = {2, 3};
				789	descriptor.m_Stride = {1, 1};
				790	descriptor.m_BeginMask = 0;
				791	descriptor.m_EndMask = 0;
				792	descriptor.m_ShrinkAxisMask = 1;
				793	IConnectableLayer* stridedSlice = net->AddStridedSliceLayer(descriptor);
				794
				795	IConnectableLayer* output0 = net->AddOutputLayer(0);
				796
				797	input->GetOutputSlot(0).Connect(stridedSlice->GetInputSlot(0));
				798	stridedSlice->GetOutputSlot(0).Connect(output0->GetInputSlot(0));
				799
				800	input->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 2, 3 }, DataType::Float32));
				801	stridedSlice->GetOutputSlot(0).SetTensorInfo(TensorInfo({ 3 }, DataType::Float32));
				802
				803	// Attempt to optimize the network and check that the correct exception is thrown
				804	BOOST_CHECK_THROW(Optimize(*net, backends, runtime->GetDeviceSpec()), armnn::LayerValidationException);
				805	}
				806
Nattapat Chaimanowong	1fcb4ff	2019-01-24 15:25:26 +0000	[diff] [blame]	807	} // anonymous namespace