/*
* Copyright (c) 2018-2020 ARM Limited.
*
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to
* deal in the Software without restriction, including without limitation the
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
* sell copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in all
* copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
#include "arm_compute/graph/detail/ExecutionHelpers.h"
#include "arm_compute/graph/Graph.h"
#include "arm_compute/graph/GraphContext.h"
#include "arm_compute/graph/GraphManager.h"
#include "arm_compute/graph/Tensor.h"
#include "arm_compute/graph/Utils.h"
#include "arm_compute/graph/backends/BackendRegistry.h"
namespace arm_compute
{
namespace graph
{
namespace detail
{
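/** Validates all nodes of a graph against their assigned backends.
 *
 * @param[in] g Graph to validate
 */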
void validate_all_nodes(Graph &g)
{
auto &nodes = g.nodes();
// Create tasks
for(auto &node : nodes)
{
if(node != nullptr)
{
Target assigned_target = node->assigned_target();
backends::IDeviceBackend &backend = backends::BackendRegistry::get().get_backend(assigned_target);
Status status = backend.validate_node(*node);
ARM_COMPUTE_ERROR_ON_MSG(!bool(status), status.error_description().c_str());
}
}
}
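
/** Creates a backend tensor handle for every graph tensor that does not have one yet.
 *
 * @param[in] g Graph whose tensors are configured
 */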
void configure_all_tensors(Graph &g)
{
auto &tensors = g.tensors();
for(auto &tensor : tensors)
{
if(tensor && tensor->handle() == nullptr)
{
Target target = tensor->desc().target;
backends::IDeviceBackend &backend = backends::BackendRegistry::get().get_backend(target);
std::unique_ptr<ITensorHandle> handle = backend.create_tensor(*tensor);
ARM_COMPUTE_ERROR_ON_MSG(!handle, "Couldn't create backend handle!");
tensor->set_handle(std::move(handle));
}
}
}
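
/** Allocates every input tensor of a node that is driven by at least one edge.
 *
 * @param[in] node Node whose inputs are allocated
 */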
void allocate_all_input_tensors(INode &node)
{
    for(unsigned int i = 0; i < node.num_inputs(); ++i)
    {
        Tensor *tensor = node.input(i);
        if(tensor != nullptr && !tensor->bound_edges().empty())
        {
            ARM_COMPUTE_ERROR_ON_MSG(!tensor->handle(), "Tensor handle is not configured!");
            tensor->handle()->allocate();
        }
    }
}
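
/** Allocates every output tensor of a node that drives at least one edge.
 *
 * @param[in] node Node whose outputs are allocated
 */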
void allocate_all_output_tensors(INode &node)
{
    for(unsigned int i = 0; i < node.num_outputs(); ++i)
    {
        Tensor *tensor = node.output(i);
        if(tensor != nullptr && !tensor->bound_edges().empty())
        {
            ARM_COMPUTE_ERROR_ON_MSG(!tensor->handle(), "Tensor handle is not configured!");
            tensor->handle()->allocate();
        }
    }
}
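
/** Allocates the tensors surrounding the Const, Input and Output nodes of a graph.
 *
 * @param[in] g Graph whose const tensors are allocated
 */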
void allocate_const_tensors(Graph &g)
{
    for(auto &node : g.nodes())
    {
        if(node != nullptr)
        {
            switch(node->type())
            {
                case NodeType::Const:
                case NodeType::Input:
                    allocate_all_output_tensors(*node);
                    break;
                case NodeType::Output:
                    allocate_all_input_tensors(*node);
                    break;
                default:
                    break;
            }
        }
    }
}
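
/** Allocates every remaining used, resizable tensor of a graph.
 *
 * @param[in] g Graph whose tensors are allocated
 */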
void allocate_all_tensors(Graph &g)
{
    auto &tensors = g.tensors();

    for(auto &tensor : tensors)
    {
        if(tensor && !tensor->bound_edges().empty() && tensor->handle() != nullptr && tensor->handle()->tensor().info()->is_resizable() && tensor->handle()->tensor().is_used())
        {
            tensor->handle()->allocate();
        }
    }
}
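
/** Builds the execution workload: configures a backend function for every node, in the given order.
 *
 * @param[in] g          Graph to configure
 * @param[in] ctx        Graph context
 * @param[in] node_order Topologically sorted order in which to configure the nodes
 *
 * @return The resulting execution workload
 */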
ExecutionWorkload configure_all_nodes(Graph &g, GraphContext &ctx, const std::vector<NodeID> &node_order)
{
    ExecutionWorkload workload;
    workload.graph = &g;
    workload.ctx = &ctx;

    // Reserve memory for tasks
    workload.tasks.reserve(node_order.size());

    // Create tasks
    for(auto &node_id : node_order)
    {
        auto node = g.node(node_id);
        if(node != nullptr)
        {
            Target assigned_target = node->assigned_target();
            backends::IDeviceBackend &backend = backends::BackendRegistry::get().get_backend(assigned_target);
            std::unique_ptr<IFunction> func = backend.configure_node(*node, ctx);
            if(func != nullptr || is_utility_node(node))
            {
                workload.tasks.emplace_back(ExecutionTask(std::move(func), node));
            }
        }
    }

    // Add inputs and outputs
    for(auto &node : g.nodes())
    {
        if(node != nullptr && node->type() == NodeType::Input)
        {
            workload.inputs.push_back(node->output(0));
        }
        else if(node != nullptr && node->type() == NodeType::Output)
        {
            workload.outputs.push_back(node->input(0));
        }
    }

    return workload;
}
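
/** Releases the memory of every tensor handle that is no longer referenced.
 *
 * @param[in] g Graph whose unused tensors are released
 */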
void release_unused_tensors(Graph &g)
{
    for(auto &tensor : g.tensors())
    {
        if(tensor != nullptr && tensor->handle() != nullptr)
        {
            tensor->handle()->release_if_unused();
        }
    }
}
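
/** Calls the accessor of a single tensor; the tensor must not be null.
 *
 * @param[in] tensor Tensor to call the accessor on
 */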
void call_tensor_accessor(Tensor *tensor)
{
    ARM_COMPUTE_ERROR_ON(!tensor);
    tensor->call_accessor();
}
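
/** Calls the accessor of the output tensor of every Const node.
 *
 * @param[in] g Graph whose const nodes are visited
 */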
void call_all_const_node_accessors(Graph &g)
{
    auto &nodes = g.nodes();

    for(auto &node : nodes)
    {
        if(node != nullptr && node->type() == NodeType::Const)
        {
            call_tensor_accessor(node->output(0));
        }
    }
}
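
/** Calls the accessor of every input tensor of the workload.
 *
 * @param[in] workload Workload whose inputs are visited
 *
 * @return True if all input accessors returned successfully
 */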
bool call_all_input_node_accessors(ExecutionWorkload &workload)
{
    bool is_valid = true;
    // Deliberately visit every input (no short-circuit) so that each accessor runs
    std::for_each(std::begin(workload.inputs), std::end(workload.inputs), [&](Tensor *input_tensor)
    {
        bool valid_input = (input_tensor != nullptr) && input_tensor->call_accessor();
        is_valid = is_valid && valid_input;
    });
    return is_valid;
}
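
/** Prepares all tasks of a workload, releasing tensors that become unused along the way.
 *
 * @param[in] workload Workload to prepare
 */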
void prepare_all_tasks(ExecutionWorkload &workload)
{
    ARM_COMPUTE_ERROR_ON(workload.graph == nullptr);
    for(auto &task : workload.tasks)
    {
        task.prepare();
        // Release tensors that are no longer needed once this task has been prepared
        release_unused_tensors(*workload.graph);
    }
}
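
/** Executes all tasks of a workload, acquiring and releasing the transition buffers around the run.
 *
 * @param[in] workload Workload to execute
 */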
void call_all_tasks(ExecutionWorkload &workload)
{
    ARM_COMPUTE_ERROR_ON(workload.ctx == nullptr);

    // Acquire memory for the transition buffers
    for(auto &mm_ctx : workload.ctx->memory_managers())
    {
        if(mm_ctx.second.cross_group != nullptr)
        {
            mm_ctx.second.cross_group->acquire();
        }
    }

    // Execute tasks
    for(auto &task : workload.tasks)
    {
        task();
    }

    // Release memory for the transition buffers
    for(auto &mm_ctx : workload.ctx->memory_managers())
    {
        if(mm_ctx.second.cross_group != nullptr)
        {
            mm_ctx.second.cross_group->release();
        }
    }
}
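
/** Calls the accessor of every output tensor of the workload.
 *
 * @param[in] workload Workload whose outputs are visited
 *
 * @return True if all output accessors returned successfully
 */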
bool call_all_output_node_accessors(ExecutionWorkload &workload)
{
    bool is_valid = true;
    // Deliberately visit every output (no short-circuit) so that each accessor runs
    std::for_each(std::begin(workload.outputs), std::end(workload.outputs), [&](Tensor *output_tensor)
    {
        bool valid_output = (output_tensor != nullptr) && output_tensor->call_accessor();
        is_valid = is_valid && valid_output;
    });
    return is_valid;
}
} // namespace detail
} // namespace graph
} // namespace arm_compute