Blame - examples/cl_cache.cpp - ml/ComputeLibrary

blob: 7d8a5154242b8a200b7b301e041976a0e83f0f4a [file] [log] [blame]

Pablo Tello	f6f23ea	2019-07-05 14:00:30 +0100	[diff] [blame]	1	/*
				2	* Copyright (c) 2019 ARM Limited.
				3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
				24	#include "arm_compute/runtime/CL/CLFunctions.h"
				25
				26	#include "arm_compute/core/Types.h"
				27	#include "arm_compute/runtime/CL/CLHelpers.h"
				28	#include "arm_compute/runtime/CL/CLScheduler.h"
				29	#include "utils/Utils.h"
				30
Pablo Tello	f6f23ea	2019-07-05 14:00:30 +0100	[diff] [blame]	31	using namespace arm_compute;
				32	using namespace utils;
				33
				34	namespace
				35	{
Pablo Tello	f6f23ea	2019-07-05 14:00:30 +0100	[diff] [blame]	36	} // namespace
				37
				38	class CLCacheExample : public Example
				39	{
				40	public:
				41	CLCacheExample() = default;
				42
				43	bool do_setup(int argc, char **argv) override
				44	{
				45	std::cout << "Once the program has run and created the file cache.bin, rerun with --restore_cache." << std::endl;
				46	CLScheduler::get().default_init();
Gian Marco Iodice	f3622be	2019-07-29 14:27:16 +0100	[diff] [blame]	47
Pablo Tello	f6f23ea	2019-07-05 14:00:30 +0100	[diff] [blame]	48	if(argc > 1)
				49	{
				50	std::string argv1 = argv[1];
				51	std::transform(argv1.begin(), argv1.end(), argv1.begin(), ::tolower);
				52	if(argv1 == "--restore_cache")
				53	{
				54	// Load the precompiled kernels from a file into the kernel library, in this way the next time they are needed
				55	// compilation won't be required.
				56	restore_program_cache_from_file();
				57	}
				58	else
				59	{
				60	std::cout << "Unkown option " << argv1 << std::endl;
				61	}
				62	}
				63
				64	// Initialise shapes
				65	init_tensor(TensorShape(8U, 4U, 2U), tensor_nchw, DataType::U8, DataLayout::NCHW);
				66	init_tensor(TensorShape(2U, 8U, 4U), tensor_nhwc, DataType::U8, DataLayout::NHWC);
				67	init_tensor(TensorShape(8U, 4U, 2U), tensor_nchw_result, DataType::U8, DataLayout::NCHW);
				68
				69	// Create the permutation vector to turn a NCHW tensor to NHWC.
				70	// The input tensor is NCHW, which means that the fastest changing coordinate is W=8U.
				71	// For permutation vectors the fastest changing coordinate is the one on the left too.
				72	// Each element in the permutation vector specifies a mapping from the source tensor to the destination one, thus if we
				73	// use 2U in the permutation vector's first element we are telling the function to move the channels to the fastest
				74	// changing coordinate in the destination tensor.
				75
				76	const PermutationVector vector_nchw_to_nhwc(2U, 0U, 1U);
				77	permute_nhwc.configure(&tensor_nchw, &tensor_nhwc, vector_nchw_to_nhwc);
				78
				79	// Allocate and fill tensors
				80	tensor_nhwc.allocator()->allocate();
				81	tensor_nchw.allocator()->allocate();
				82	fill_tensor(tensor_nchw);
				83
				84	// Demostrate autoconfigure for the output tensor
				85	const PermutationVector vector_nhwc_to_nchw(1U, 2U, 0U);
				86	permute_nchw.configure(&tensor_nhwc, &tensor_nchw_result, vector_nhwc_to_nchw);
				87	tensor_nchw_result.allocator()->allocate();
				88
Pablo Tello	f6f23ea	2019-07-05 14:00:30 +0100	[diff] [blame]	89	// Save the opencl kernels to a file
				90	save_program_cache_to_file();
				91
				92	return true;
				93	}
				94	void do_run() override
				95	{
				96	permute_nhwc.run();
				97	permute_nchw.run();
				98	}
				99	void do_teardown() override
				100	{
				101	}
				102
				103	private:
				104	void validate_result(CLTensor &reference, CLTensor &result)
				105	{
				106	reference.map();
				107	result.map();
				108	Window window;
				109	window.use_tensor_dimensions(reference.info()->tensor_shape());
				110	Iterator it_ref(&reference, window);
				111	Iterator it_res(&result, window);
				112	execute_window_loop(window, [&](const Coordinates &)
				113	{
				114	assert(reinterpret_cast<unsigned char >(it_ref.ptr()) == reinterpret_cast<unsigned char >(it_res.ptr()));
				115	},
				116	it_ref, it_res);
				117	reference.unmap();
				118	result.unmap();
				119	}
				120
				121	void fill_tensor(CLTensor &tensor)
				122	{
				123	tensor.map();
				124	Window window;
				125	window.use_tensor_dimensions(tensor.info()->tensor_shape());
				126	Iterator it_tensor(&tensor, window);
				127	unsigned char val(0);
				128	execute_window_loop(window, [&](const Coordinates &)
				129	{
				130	reinterpret_cast<unsigned char >(it_tensor.ptr()) = val++;
				131	},
				132	it_tensor);
				133	tensor.unmap();
				134	}
				135	void init_tensor(const TensorShape shape, CLTensor &tensor, DataType type, DataLayout layout)
				136	{
				137	tensor.allocator()->init(TensorInfo(shape, 1, type).set_data_layout(layout));
				138	}
				139
				140	CLTensor tensor_nchw{};
				141	CLTensor tensor_nhwc{};
				142	CLTensor tensor_nchw_result{};
				143	CLPermute permute_nhwc{};
				144	CLPermute permute_nchw{};
				145	};
				146
				147	/** Main program creating an example that demostrates how to load precompiled kernels from a file.
				148	*
				149	* @param[in] argc Number of arguments
				150	* @param[in] argv Arguments
				151	*/
				152	int main(int argc, char **argv)
				153	{
				154	return utils::run_example<CLCacheExample>(argc, argv);
				155	}