//
// Copyright © 2017 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "LoadedNetwork.hpp"
#include "Layer.hpp"
#include "Graph.hpp"
#include <Processes.hpp>
#include "Profiling.hpp"
#include "HeapProfiling.hpp"
#include "WorkingMemHandle.hpp"

#include <armnn/BackendRegistry.hpp>
#include <armnn/Logging.hpp>
#include <armnn/utility/Assert.hpp>

#include <armnn/backends/TensorHandle.hpp>
#include <armnn/backends/IMemoryManager.hpp>
#include <armnn/backends/MemCopyWorkload.hpp>
#include <backendsCommon/MemSyncWorkload.hpp>
#include <armnn/BackendHelper.hpp>

#include <fmt/format.h>

namespace armnn
{

using namespace std;
using namespace arm::pipe;

namespace
{

template <typename ExceptionType>
std::string ToErrorMessage(const char* prefix, const ExceptionType& error)
{
    std::stringstream ss;
    ss << prefix << " " << error.what();
    return ss.str();
}

void AddLayerStructure(std::unique_ptr<TimelineUtilityMethods>& timelineUtils,
                       const Layer& layer,
                       ProfilingGuid networkGuid)
{
    // Add layer to the post-optimisation network structure
    std::string layerName = layer.GetNameStr().empty() ? "<Unnamed>" : layer.GetNameStr();
    timelineUtils->CreateNamedTypedChildEntity(layer.GetGuid(),
                                               networkGuid,
                                               layerName,
                                               LabelsAndEventClasses::LAYER_GUID);
    for (auto&& input : layer.GetInputSlots())
    {
        const IOutputSlot* source = input.GetConnectedOutputSlot();
        ARMNN_ASSERT(source != nullptr);
        timelineUtils->CreateConnectionRelationship(ProfilingRelationshipType::RetentionLink,
                                                    source->GetOwningLayerGuid(),
                                                    layer.GetGuid());
    }
}

void AddWorkloadStructure(std::unique_ptr<TimelineUtilityMethods>& timelineUtils,
                          std::unique_ptr<IWorkload>& workload,
                          const Layer& layer)
{
    // Add workload to the post-optimisation network structure
    timelineUtils->CreateTypedEntity(workload->GetGuid(), LabelsAndEventClasses::WORKLOAD_GUID);
    timelineUtils->MarkEntityWithLabel(workload->GetGuid(),
                                       layer.GetBackendId().Get(),
                                       LabelsAndEventClasses::BACKENDID_GUID);

    // Link the workload to the layer
    timelineUtils->CreateRelationship(ProfilingRelationshipType::RetentionLink,
                                      layer.GetGuid(),
                                      workload->GetGuid(),
                                      LabelsAndEventClasses::CHILD_GUID);
}

} // anonymous namespace

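// MakeLoadedNetwork is the factory entry point used by the runtime: it wraps the LoadedNetwork
// constructor, translates any exception into errorMessage and returns a null pointer on failure.
// A minimal usage sketch (illustrative only; the INetworkProperties constructor form and the
// origin of optNet / profilingService are assumptions, not code from this file):
//
//     std::string errorMessage;
//     INetworkProperties properties(/*asyncEnabled=*/false,
//                                   MemorySource::Undefined,   // input source
//                                   MemorySource::Undefined);  // output source
//     std::unique_ptr<LoadedNetwork> network = LoadedNetwork::MakeLoadedNetwork(
//         std::move(optNet), errorMessage, properties, profilingService);
//     if (!network)
//     {
//         ARMNN_LOG(error) << errorMessage; // reason the workloads could not be prepared
//     }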
std::unique_ptr<LoadedNetwork> LoadedNetwork::MakeLoadedNetwork(std::unique_ptr<IOptimizedNetwork> net,
                                                                std::string& errorMessage,
                                                                const INetworkProperties& networkProperties,
                                                                ProfilingService& profilingService)
{
    std::unique_ptr<LoadedNetwork> loadedNetwork;

    auto Fail = [&](const std::exception& error) -> std::unique_ptr<LoadedNetwork>
    {
        errorMessage = ToErrorMessage("An error occurred when preparing the network workloads: ", error);
        ARMNN_LOG(error) << errorMessage;

        return std::unique_ptr<LoadedNetwork>();
    };

    try
    {
        loadedNetwork.reset(new LoadedNetwork(std::move(net), networkProperties, profilingService));
    }
    catch (const armnn::RuntimeException& error)
    {
        return Fail(error);
    }
    catch (const armnn::Exception& error)
    {
        return Fail(error);
    }
    catch (const std::runtime_error& error)
    {
        return Fail(error);
    }

    return loadedNetwork;
}

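// The constructor below performs the full load sequence. In outline (derived from the code that follows):
//   1. Create each backend once, plus a workload factory per backend, validating the
//      AsyncExecution / ExternallyManagedMemory capabilities up front.
//   2. For synchronous networks, create tensor handles for every layer, disabling internal
//      memory management wherever import/export or an external memory manager owns the buffers.
//   3. Emit the post-optimisation network structure to the profiling timeline.
//   4. Create one workload per layer (constants are held separately when the network is
//      async or externally managed).
//   5. Pre-create importable input/output tensor handles where every connected workload
//      supports tensor handle replacement.
//   6. Build memory profiles, then allocate and execute the constant workloads.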
LoadedNetwork::LoadedNetwork(std::unique_ptr<IOptimizedNetwork> net,
                             const INetworkProperties& networkProperties,
                             ProfilingService& profilingService) :
                             m_OptimizedNetwork(std::move(net)),
                             m_NetworkProperties(networkProperties),
                             m_TensorHandleFactoryRegistry(),
                             m_ProfilingService(profilingService)
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "LoadedNetwork");
    // Get the profiler and register it for the current thread.
    const std::shared_ptr<IProfiler>& profiler = m_OptimizedNetwork->GetProfiler();
    ProfilerManager::GetInstance().RegisterProfiler(profiler.get());

    profiler->EnableProfiling(networkProperties.m_ProfilingEnabled);

    profiler->EnableNetworkDetailsToStdOut(networkProperties.m_OutputNetworkDetailsMethod);

    // First create tensor handlers, backends and workload factories.
    // Handlers are created before workloads because workload creation can modify
    // some of the handlers (for example the splitter and concat layers).

    bool useExternalMemoryManager = false;
    bool useInternalMemoryManager = false;
    Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();

    if (!networkProperties.m_AsyncEnabled)
    {
        m_IsInputImported = std::vector<bool>(order.GetNumInputs(), false);
        m_IsOutputImported = std::vector<bool>(order.GetNumOutputs(), false);
    }

    for (auto&& layer : order)
    {
        auto const& backendId = layer->GetBackendId();
        if (m_Backends.count(backendId) == 0)
        {
            auto createBackend = BackendRegistryInstance().GetFactory(backendId);
            auto it = m_Backends.emplace(std::make_pair(backendId, createBackend()));

            IBackendInternal* backend = it.first->second.get();

            if (networkProperties.m_AsyncEnabled &&
                !HasCapability(BackendOptions::BackendOption{"AsyncExecution", true}, backend->GetCapabilities()))
            {
                std::string er = backend->GetId();
                er += " does not support AsyncExecution";
                throw BackendCapabilityException(er);
            }

            if (networkProperties.m_AsyncEnabled &&
                !HasCapability(BackendOptions::BackendOption{"ExternallyManagedMemory", true},
                               backend->GetCapabilities()))
            {
                std::string er = backend->GetId();
                er += " does not support ExternallyManagedMemory\n";
                er += "AsyncEnabled networks require all backends to support ExternallyManagedMemory";
                throw BackendCapabilityException(er);
            }

            if (HasCapability(BackendOptions::BackendOption{"ExternallyManagedMemory", true},
                              backend->GetCapabilities()) &&
                (m_NetworkProperties.m_ExternalMemoryManagementEnabled || m_NetworkProperties.m_AsyncEnabled))
            {
                m_SupportsExternallyManagedMemory[backend->GetId()] = true;
                useExternalMemoryManager = true;
            }
            else
            {
                m_SupportsExternallyManagedMemory[backend->GetId()] = false;
                useInternalMemoryManager = true;
            }

            IBackendInternal::IWorkloadFactoryPtr workloadFactory;
            if (backend->SupportsTensorAllocatorAPI())
            {
                workloadFactory = backend->CreateWorkloadFactory(
                    m_TensorHandleFactoryRegistry,
                    m_OptimizedNetwork->pOptimizedNetworkImpl->GetModelOptions(),
                    static_cast<MemorySourceFlags>(m_NetworkProperties.m_InputSource),
                    static_cast<MemorySourceFlags>(m_NetworkProperties.m_OutputSource));
            }
            else
            {
                m_BackendMemoryMangers.emplace_back(backend->CreateMemoryManager());
                workloadFactory = backend->CreateWorkloadFactory(
                    m_BackendMemoryMangers.back(), m_OptimizedNetwork->pOptimizedNetworkImpl->GetModelOptions());
            }
            m_WorkloadFactories[backendId] = std::move(workloadFactory);
        }
    }

    if (!networkProperties.m_AsyncEnabled)
    {
        for (auto&& layer : order)
        {
            auto& workloadFactory = GetWorkloadFactory(*layer);
            bool supportsExternalManager = m_SupportsExternallyManagedMemory[layer->GetBackendId()];

            switch (layer->GetType())
            {
                case LayerType::Input:
                case LayerType::MemImport:
                {
                    // If IsImportEnabled is true then we need to set IsMemoryManaged
                    // to false when creating TensorHandles
                    layer->CreateTensorHandles(m_TensorHandleFactoryRegistry,
                                               workloadFactory,
                                               !supportsExternalManager && !m_NetworkProperties.m_ImportEnabled);
                    break;
                }
                case LayerType::Constant:
                {
                    layer->CreateTensorHandles(m_TensorHandleFactoryRegistry, workloadFactory, true);
                    break;
                }
                default:
                {
                    // Look for a layer with 1 OutputSlot which has 1 connection and that connection is an Output layer.
                    // If Export is enabled disable memory management so we can export, otherwise we do a copy.
                    if ((layer->GetNumOutputSlots() == 1) &&
                        (layer->GetOutputSlots()[0].GetNumConnections() == 1) &&
                        (layer->GetOutputSlots()[0].GetConnection(0)->GetOwningLayer().GetType() == LayerType::Output))
                    {
                        layer->CreateTensorHandles(m_TensorHandleFactoryRegistry,
                                                   workloadFactory,
                                                   !supportsExternalManager && !m_NetworkProperties.m_ExportEnabled);
                    }
                    else
                    {
                        layer->CreateTensorHandles(m_TensorHandleFactoryRegistry,
                                                   workloadFactory,
                                                   !supportsExternalManager);
                    }
                }
            }
        }
    }

    ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();
    std::unique_ptr<TimelineUtilityMethods> timelineUtils =
        TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
    if (timelineUtils)
    {
        timelineUtils->CreateTypedEntity(networkGuid, LabelsAndEventClasses::NETWORK_GUID);
        // Mark the network with a start of life event
        timelineUtils->RecordEvent(networkGuid, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS);
        // and with the process ID
        int processID = armnnUtils::Processes::GetCurrentId();
        std::stringstream ss;
        ss << processID;
        timelineUtils->MarkEntityWithLabel(networkGuid, ss.str(), LabelsAndEventClasses::PROCESS_ID_GUID);
    }

    // Then create workloads.
    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "LoadNetwork_CreateWorkloads");
        for (auto&& layer : order)
        {
            if (timelineUtils)
            {
                // Add layer to the post-optimisation network structure
                AddLayerStructure(timelineUtils, *layer, networkGuid);
            }

            const IWorkloadFactory& workloadFactory = GetWorkloadFactory(*layer);

            switch (layer->GetType())
            {
                case LayerType::Input:
                case LayerType::Output:
                {
                    // Inputs and outputs are treated in a special way - see EnqueueInput() and EnqueueOutput().
                    break;
                }
                default:
                {
                    auto workload = layer->CreateWorkload(workloadFactory);

                    if (!workload)
                    {
                        const char* const layerName =
                            layer->GetNameStr().length() != 0 ? layer->GetName() : "<Unnamed>";
                        throw InvalidArgumentException(
                            fmt::format("No workload created for layer (name: '{0}' type: '{1}') (compute '{2}')",
                                        layerName, static_cast<int>(layer->GetType()), layer->GetBackendId().Get()
                            ));
                    }

                    if (timelineUtils)
                    {
                        // Add workload to the post-optimisation network structure
                        AddWorkloadStructure(timelineUtils, workload, *layer);
                    }

                    // For async networks ConstantWorkloads are managed exclusively by LoadedNetwork
                    // and are separated out from the other workloads
                    if ((networkProperties.m_AsyncEnabled || useExternalMemoryManager) &&
                        layer->GetType() == LayerType::Constant)
                    {
                        m_ConstantTensorHandles[layer->GetGuid()] =
                            layer->GetOutputSlot(0).GetOutputHandler().GetData();
                        m_ConstantWorkloads[layer->GetGuid()] = std::move(workload);
                    }
                    else
                    {
                        m_WorkloadQueue.push_back(std::move(workload));
                    }

                    // Release the constant data in the layer.
                    layer->ReleaseConstantData();
                    break;
                }
            }
        }
    }

    // Gather information about workloads for inputs & outputs
    if (!networkProperties.m_AsyncEnabled && m_WorkloadQueue.size() != 0)
    {
        const int noOfInputs = armnn::numeric_cast<int>(order.GetNumInputs());

        // Get indices of all workloads connected to each input and
        // check if they support tensor handle replacement
        for (const BindableLayer* layer : order.GetInputLayers())
        {
            const auto bindingId = layer->GetBindingId();

            bool supportsReplacement = true;

            for (const auto inputSlot : layer->GetOutputSlot(0).GetConnections())
            {
                auto workloadIndex = std::distance(order.begin(), order.GetPosInGraph(inputSlot->GetOwningLayer()));
                workloadIndex -= noOfInputs;

                m_InputWorkloadSlotPairs[bindingId].emplace_back(WorkloadIndices{
                    armnn::numeric_cast<unsigned int>(workloadIndex), inputSlot->GetSlotIndex()});

                auto workload = m_WorkloadQueue[m_InputWorkloadSlotPairs[bindingId].back().m_WorkloadIndex].get();
                supportsReplacement &= workload->SupportsTensorHandleReplacement();
            }

            ITensorHandleFactory::FactoryId factoryId = layer->GetOutputSlot(0).GetTensorHandleFactoryId();
            // Get matching import factory Id
            ITensorHandleFactory::FactoryId importFactoryId =
                m_TensorHandleFactoryRegistry.GetMatchingImportFactoryId(factoryId);

            ITensorHandleFactory* importFactory = m_TensorHandleFactoryRegistry.GetFactory(importFactoryId);

            if (supportsReplacement && importFactory)
            {
                m_PreImportedInputHandles.emplace_back(
                    bindingId, importFactory->CreateTensorHandle(layer->GetOutputSlot(0).GetTensorInfo(), false));
            }
            else
            {
                m_PreImportedInputHandles.emplace_back(bindingId, nullptr);
            }
        }

        // Get indices of all workloads connected to each output and
        // check if they support tensor handle replacement
        for (const BindableLayer* layer : order.GetOutputLayers())
        {
            const auto bindingId = layer->GetBindingId();

            const auto outputSlot = layer->GetInputSlot(0).GetConnectedOutputSlot();
            auto& indices = m_OutputWorkloadSlotPairs[bindingId];

            auto workloadIndex = std::distance(order.begin(), order.GetPosInGraph(outputSlot->GetOwningLayer()));
            workloadIndex -= noOfInputs;

            indices.m_OutputSlotIndices = WorkloadIndices{numeric_cast<unsigned int>(workloadIndex),
                                                          outputSlot->CalculateIndexOnOwner()};

            bool supportsReplacement = true;
            auto outputWorkload = m_WorkloadQueue[indices.m_OutputSlotIndices.m_WorkloadIndex].get();
            supportsReplacement &= outputWorkload->SupportsTensorHandleReplacement();

            for (auto& inputSlot : outputSlot->GetConnections())
            {
                if (inputSlot->GetOwningLayer().GetType() != LayerType::Output)
                {
                    auto inWorkloadIndex = std::distance(order.begin(),
                                                         order.GetPosInGraph(inputSlot->GetOwningLayer()));
                    inWorkloadIndex -= noOfInputs;
                    indices.m_InputSlotIndices.emplace_back(
                        WorkloadIndices{numeric_cast<unsigned int>(inWorkloadIndex), inputSlot->GetSlotIndex()});
                    auto inputWorkload = m_WorkloadQueue[indices.m_InputSlotIndices.back().m_WorkloadIndex].get();
                    supportsReplacement &= inputWorkload->SupportsTensorHandleReplacement();
                }
            }

            ITensorHandleFactory::FactoryId factoryId = outputSlot->GetTensorHandleFactoryId();
            // Get matching import factory Id
            ITensorHandleFactory::FactoryId importFactoryId =
                m_TensorHandleFactoryRegistry.GetMatchingImportFactoryId(factoryId);
            ITensorHandleFactory* importFactory = m_TensorHandleFactoryRegistry.GetFactory(importFactoryId);

            if (supportsReplacement && importFactory)
            {
                m_PreImportedOutputHandles.emplace_back(
                    bindingId, importFactory->CreateTensorHandle(outputSlot->GetTensorInfo(), false));
            }
            else
            {
                m_PreImportedOutputHandles.emplace_back(bindingId, nullptr);
            }
        }
    }

    for (auto&& workloadFactory : m_WorkloadFactories)
    {
        workloadFactory.second->AfterWorkloadsCreated();
    }

    if (timelineUtils)
    {
        // Commit to send the post-optimisation network structure
        timelineUtils->Commit();
    }

    if (useExternalMemoryManager)
    {
        if (networkProperties.m_AsyncEnabled)
        {
            CreateMemoryProfileAsync();
        }
        else
        {
            CreateMemoryProfile();
        }

        auto backendStrategyMap = BackendRegistryInstance().GetMemoryOptimizerStrategies();
        for (auto& backendMemoryProfile : m_MemBlockMap)
        {
            const BackendId& backendId = backendMemoryProfile.first;
            if (backendStrategyMap.find(backendId) != backendStrategyMap.end())
            {
                m_MemBinMap[backendId] = backendStrategyMap[backendId]->Optimize(backendMemoryProfile.second);
            }
            else
            {
                m_MemBinMap[backendId] = m_ConstantStrategy->Optimize(backendMemoryProfile.second);
            }
        }

        if (!networkProperties.m_AsyncEnabled)
        {
            m_ExternalMemoryManager = CreateExternalMemoryManger(m_TensorMemory);

            // Sort m_TensorMemory so its order matches m_Tensorhandles
            std::sort(m_TensorMemory.begin(), m_TensorMemory.end(),
                      [](const std::pair<std::shared_ptr<TensorMemory>, MemorySource>& lhs,
                         const std::pair<std::shared_ptr<TensorMemory>, MemorySource>& rhs)
                      {
                          return lhs.first->m_OutputSlotId < rhs.first->m_OutputSlotId;
                      });
        }
    }

    // Now that the intermediate tensor memory has been set up,
    // do any post allocation configuration for each workload.
    if (!networkProperties.m_AsyncEnabled)
    {
        if (useInternalMemoryManager)
        {
            // Set up memory.
            m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().AllocateDynamicBuffers();
        }

        for (auto& workload : m_WorkloadQueue)
        {
            workload->PostAllocationConfigure();
        }
    }

    if (useExternalMemoryManager)
    {
        if (!networkProperties.m_AsyncEnabled)
        {
            AllocateAndExecuteConstantWorkloads();
        }
        else
        {
            AllocateAndExecuteConstantWorkloadsAsync();
        }
    }
}

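// Constant layers back the weights and biases of the network. When memory is externally
// managed, their handles are allocated here and each constant workload is executed once
// up front so the data is resident before any inference runs.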
void LoadedNetwork::AllocateAndExecuteConstantWorkloads()
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "LoadNetwork_AllocateAndExecuteConstants");
    for (auto& pair : m_ConstantWorkloads)
    {
        auto tensorHandle = m_ConstantTensorHandles[pair.first];
        tensorHandle->Allocate();
        pair.second->Execute();
    }
}

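// Async variant: constant tensor handles are created on demand from the graph (the legacy
// factory is never expected here, as the assert below enforces), and each constant workload
// is executed once through the ExecuteAsync path with a WorkingMemDescriptor that carries
// only the output handle.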
void LoadedNetwork::AllocateAndExecuteConstantWorkloadsAsync()
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "LoadNetwork_AllocateAndExecuteConstants");
    Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();
    for (auto&& layer : order)
    {
        if (layer->GetType() == LayerType::Constant)
        {
            const auto& outSlot = layer->GetOutputSlots()[0];
            const auto factoryId = outSlot.GetTensorHandleFactoryId();
            ARMNN_ASSERT(factoryId != ITensorHandleFactory::LegacyFactoryId);
            auto& workloadFactory = GetWorkloadFactory(*layer);

            layer->CreateTensorHandles(m_TensorHandleFactoryRegistry, workloadFactory);
            ITensorHandle* tensorHandle = outSlot.GetOutputHandler().GetData();

            m_ConstantTensorHandles[layer->GetGuid()] = tensorHandle;
            tensorHandle->Allocate();

            WorkingMemDescriptor memDesc;
            memDesc.m_Outputs.push_back(tensorHandle);
            m_ConstantWorkloads[layer->GetGuid()]->ExecuteAsync(memDesc);
        }
    }
}

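// Re-emits the post-optimisation network structure (network entity, layers and workloads)
// to the profiling timeline, so the structure can still be reported if profiling is
// enabled after the network has already been loaded.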
void LoadedNetwork::SendNetworkStructure()
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "LoadNetwork_SendNetworkStructure");
    Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();
    ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();

    std::unique_ptr<TimelineUtilityMethods> timelineUtils =
        TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);

    timelineUtils->CreateTypedEntity(networkGuid, LabelsAndEventClasses::NETWORK_GUID);

    for (auto&& layer : order)
    {
        // Add layer to the post-optimisation network structure
        AddLayerStructure(timelineUtils, *layer, networkGuid);
        switch (layer->GetType())
        {
            case LayerType::Input:
            case LayerType::Output:
            {
                // Inputs and outputs are treated in a special way - see EnqueueInput() and EnqueueOutput().
                break;
            }
            default:
            {
                for (auto& workload : m_WorkloadQueue)
                {
                    // Add workload to the post-optimisation network structure
                    AddWorkloadStructure(timelineUtils, workload, *layer);
                }
                break;
            }
        }
    }
    // Commit to send the post-optimisation network structure
    timelineUtils->Commit();
}

ProfilingGuid LoadedNetwork::GetNetworkGuid()
{
    return m_OptimizedNetwork->GetGuid();
}

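// The two lookups below resolve a user-facing LayerBindingId to the TensorInfo of the bound
// input or output layer, throwing if no layer carries that id. Illustrative use (the binding
// id 0 is hypothetical):
//
//     TensorInfo inputInfo  = loadedNetwork->GetInputTensorInfo(0);
//     TensorInfo outputInfo = loadedNetwork->GetOutputTensorInfo(0);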
TensorInfo LoadedNetwork::GetInputTensorInfo(LayerBindingId layerId) const
{
    for (auto&& inputLayer : m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().GetInputLayers())
    {
        ARMNN_ASSERT_MSG(inputLayer->GetNumOutputSlots() == 1, "Input layer should have exactly 1 output slot");
        if (inputLayer->GetBindingId() == layerId)
        {
            return inputLayer->GetOutputSlot(0).GetTensorInfo();
        }
    }

    throw InvalidArgumentException(fmt::format("No input layer is associated with id {}", layerId));
}

TensorInfo LoadedNetwork::GetOutputTensorInfo(LayerBindingId layerId) const
{
    for (auto&& outputLayer : m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().GetOutputLayers())
    {
        ARMNN_ASSERT_MSG(outputLayer->GetNumInputSlots() == 1, "Output layer should have exactly 1 input slot");
        ARMNN_ASSERT_MSG(outputLayer->GetInputSlot(0).GetConnection(), "Input slot on Output layer must be connected");
        if (outputLayer->GetBindingId() == layerId)
        {
            return outputLayer->GetInputSlot(0).GetConnection()->GetTensorInfo();
        }
    }

    throw InvalidArgumentException(fmt::format("No output layer is associated with id {}", layerId));
}

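// Looks up the workload factory registered for the layer's backend. A factory must exist
// (one is created per backend in the constructor) and the layer must be supported by it;
// both conditions are enforced below.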
const IWorkloadFactory& LoadedNetwork::GetWorkloadFactory(const Layer& layer) const
{
    const IWorkloadFactory* workloadFactory = nullptr;

    auto it = m_WorkloadFactories.find(layer.GetBackendId());
    if (it == m_WorkloadFactories.end())
    {
        throw RuntimeException(fmt::format("No workload factory for {0} to be used for layer: {1}",
                                           layer.GetBackendId().Get(),
                                           layer.GetNameStr()),
                               CHECK_LOCATION());
    }

    workloadFactory = it->second.get();

    ARMNN_ASSERT_MSG(workloadFactory, "No workload factory");

    std::string reasonIfUnsupported;
    ARMNN_ASSERT_MSG(IWorkloadFactory::IsLayerSupported(layer,
                                                        {},
                                                        reasonIfUnsupported,
                                                        m_OptimizedNetwork->pOptimizedNetworkImpl->GetModelOptions()),
                     "Factory does not support layer");
    IgnoreUnused(reasonIfUnsupported);
    return *workloadFactory;
}

namespace
{

// Non-copyable class owning accelerator-specific tensor data.
class TensorPin
{
public:
    TensorPin(std::unique_ptr<ITensorHandle> handle, const TensorInfo& info, LayerBindingId id)
        : m_TensorHandle(std::move(handle))
        , m_TensorInfo(info)
        , m_Id(id)
    {
    }

    ITensorHandle* GetTensorHandle() const { return m_TensorHandle.get(); }
    const TensorInfo& GetTensorInfo() const { return m_TensorInfo; }
    LayerBindingId GetBindingId() const { return m_Id; }

private:
    std::unique_ptr<ITensorHandle> m_TensorHandle;
    TensorInfo m_TensorInfo;
    LayerBindingId m_Id;
};

static const TensorPin& GetTensorPin(LayerBindingId id,
                                     const std::vector<TensorPin>& pins,
                                     char const* bindingPointDesc)
{
    auto it = std::find_if(pins.begin(), pins.end(),
                           [id](const TensorPin& pin)
                           {
                               return pin.GetBindingId() == id;
                           });

    if (it != pins.end())
    {
        return *it;
    }
    else
    {
        throw InvalidArgumentException(fmt::format("No tensor supplied for {0} {1}", bindingPointDesc, id));
    }
}

// Stores data that needs to be kept accessible for the entire execution of a workload.
class WorkloadData
{
public:
    WorkloadData(const InputTensors& inputTensors, const OutputTensors& outputTensors)
    {
        m_InputTensorPins.reserve(inputTensors.size());
        m_OutputTensorPins.reserve(outputTensors.size());

        for (auto inputTensorPair : inputTensors)
        {
            auto inputTensor = inputTensorPair.second;

            std::unique_ptr<ITensorHandle> tensorHandle =
                std::make_unique<ConstPassthroughTensorHandle>(inputTensor.GetInfo(), inputTensor.GetMemoryArea());
            LayerBindingId layerId = inputTensorPair.first;

            m_InputTensorPins.emplace_back(std::move(tensorHandle), inputTensor.GetInfo(), layerId);
        }

        for (auto outputTensorPair : outputTensors)
        {
            auto outputTensor = outputTensorPair.second;

            std::unique_ptr<ITensorHandle> tensorHandle =
                std::make_unique<PassthroughTensorHandle>(outputTensor.GetInfo(), outputTensor.GetMemoryArea());
            LayerBindingId layerId = outputTensorPair.first;

            m_OutputTensorPins.emplace_back(std::move(tensorHandle), outputTensor.GetInfo(), layerId);
        }
    }

    const TensorPin& GetInputTensorPin(LayerBindingId id) const
    {
        return GetTensorPin(id, m_InputTensorPins, "input");
    }

    const TensorPin& GetOutputTensorPin(LayerBindingId id) const
    {
        return GetTensorPin(id, m_OutputTensorPins, "output");
    }

private:

    std::vector<TensorPin> m_InputTensorPins;
    std::vector<TensorPin> m_OutputTensorPins;
};

} // anonymous namespace

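// EnqueueWorkload drives one synchronous inference: it binds the user's buffers, swaps in any
// pre-imported tensor handles, and then runs the input, workload and output queues. A minimal
// calling sketch (illustrative only; the binding ids, buffer sizes and data vectors are
// hypothetical, and the two pre-imported id lists are passed empty):
//
//     std::vector<float> inputData(inputSize);
//     std::vector<float> outputData(outputSize);
//     InputTensors  inputs{{0, ConstTensor(loadedNetwork->GetInputTensorInfo(0), inputData.data())}};
//     OutputTensors outputs{{0, Tensor(loadedNetwork->GetOutputTensorInfo(0), outputData.data())}};
//     Status status = loadedNetwork->EnqueueWorkload(inputs, outputs, {}, {});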
Status LoadedNetwork::EnqueueWorkload(const InputTensors& inputTensors,
                                      const OutputTensors& outputTensors,
                                      std::vector<ImportedInputId> preImportedInputIds,
                                      std::vector<ImportedOutputId> preImportedOutputIds)
{
    const Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();

    // Walk graph to determine the order of execution.
    if (graph.GetNumLayers() < 2)
    {
        ARMNN_LOG(warning) << "IRuntime::EnqueueWorkload()::Less than two nodes in graph";
        return Status::Failure;
    }

    // Data that must be kept alive for the entire execution of the workload.
    WorkloadData workloadData(inputTensors, outputTensors);

    if (graph.GetNumInputs() != inputTensors.size())
    {
        throw InvalidArgumentException("Number of inputs provided does not match network.");
    }

    // For each input to the network, call EnqueueInput with the data passed by the user.
    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareInputs");
        m_InputQueue.clear();
        m_InputQueue.reserve(graph.GetNumInputs());

        if (preImportedInputIds.size() > graph.GetNumInputs())
        {
            throw InvalidArgumentException("Invalid number of preImportedInputIds");
        }

        unsigned int inputIndex = 0;
        unsigned int importedInputIdIndex = 0;
        std::sort(preImportedInputIds.begin(), preImportedInputIds.end());
        for (const BindableLayer* inputLayer : graph.GetInputLayers())
        {
            if (importedInputIdIndex < preImportedInputIds.size() &&
                inputIndex == preImportedInputIds[importedInputIdIndex])
            {
                // Only replace tensor handles if they have not already been replaced
                if (!m_IsInputImported[inputIndex])
                {
                    auto outputTensorHandle = m_PreImportedInputHandles[inputIndex].m_TensorHandle.get();

                    for (const auto& workloadInfo : m_InputWorkloadSlotPairs[inputLayer->GetBindingId()])
                    {
                        auto workload = m_WorkloadQueue[workloadInfo.m_WorkloadIndex].get();
                        workload->ReplaceInputTensorHandle(outputTensorHandle, workloadInfo.m_SlotIndex);
                    }
                    m_IsInputImported[inputIndex] = true;
                }
                importedInputIdIndex++;
            }
            else
            {
                if (m_IsInputImported[inputIndex])
                {
                    OutputHandler& handler = const_cast<OutputHandler&>(inputLayer->GetOutputHandler(0));

                    for (const auto& workloadInfo : m_InputWorkloadSlotPairs[inputLayer->GetBindingId()])
                    {
                        auto workload = m_WorkloadQueue[workloadInfo.m_WorkloadIndex].get();
                        workload->ReplaceInputTensorHandle(handler.GetData(), workloadInfo.m_SlotIndex);
                    }

                    m_IsInputImported[inputIndex] = false;
                }

                // InputTensorHandle is not imported yet, so enqueue the input normally
                const TensorPin& pin = workloadData.GetInputTensorPin(inputLayer->GetBindingId());
                EnqueueInput(*inputLayer, pin.GetTensorHandle(), pin.GetTensorInfo());
            }
            inputIndex++;
        }
    }
    // For each output to the network, call EnqueueOutput with the data passed by the user.
    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareOutputs");
        m_OutputQueue.clear();
        m_OutputQueue.reserve(graph.GetNumOutputs());

        if (preImportedOutputIds.size() > graph.GetNumOutputs())
        {
            throw InvalidArgumentException("Invalid number of preImportedOutputIds");
        }

        unsigned int outputIndex = 0;
        unsigned int importedOutputIdIndex = 0;
        std::sort(preImportedOutputIds.begin(), preImportedOutputIds.end());
        for (const BindableLayer* outputLayer : graph.GetOutputLayers())
        {
            if (importedOutputIdIndex < preImportedOutputIds.size() &&
                outputIndex == preImportedOutputIds[importedOutputIdIndex])
            {
                // Only replace tensor handles if they have not already been replaced
                ITensorHandle* inputTensorHandle = m_PreImportedOutputHandles[outputIndex].m_TensorHandle.get();

                if (!m_IsOutputImported[outputIndex])
                {
                    const auto bindingId = outputLayer->GetBindingId();
                    const auto& indices = m_OutputWorkloadSlotPairs[bindingId];

                    auto outputWorkload = m_WorkloadQueue[indices.m_OutputSlotIndices.m_WorkloadIndex].get();

                    outputWorkload->ReplaceOutputTensorHandle(inputTensorHandle,
                                                              indices.m_OutputSlotIndices.m_SlotIndex);

                    for (const auto& workloadInfo : indices.m_InputSlotIndices)
                    {
                        auto inputWorkload = m_WorkloadQueue[workloadInfo.m_WorkloadIndex].get();
                        inputWorkload->ReplaceInputTensorHandle(inputTensorHandle, workloadInfo.m_SlotIndex);
                    }
                    m_IsOutputImported[outputIndex] = true;
                }

                ARMNN_ASSERT_MSG(inputTensorHandle != nullptr, "Data should have been allocated.");
                MemSyncQueueDescriptor syncDesc;
                syncDesc.m_Inputs.push_back(inputTensorHandle);
                WorkloadInfo info;
                info.m_InputTensorInfos.push_back(
                    outputLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetTensorInfo());
                auto syncWorkload = std::make_unique<SyncMemGenericWorkload>(syncDesc, info);
                ARMNN_ASSERT_MSG(syncWorkload, "No sync workload created");
                m_OutputQueue.push_back(move(syncWorkload));
                importedOutputIdIndex++;
            }
            else
            {
                if (m_IsOutputImported[outputIndex])
                {
                    const auto bindingId = outputLayer->GetBindingId();
                    const auto& indices = m_OutputWorkloadSlotPairs[bindingId];

                    auto outputWorkload = m_WorkloadQueue[indices.m_OutputSlotIndices.m_WorkloadIndex].get();
                    const OutputHandler& outputHandler =
                        outputLayer->GetInputSlot(0).GetConnectedOutputSlot()->GetOutputHandler();

                    outputWorkload->ReplaceOutputTensorHandle(
                        outputHandler.GetData(), indices.m_OutputSlotIndices.m_SlotIndex);

                    for (const auto& workloadInfo : indices.m_InputSlotIndices)
                    {
                        auto inputWorkload = m_WorkloadQueue[workloadInfo.m_WorkloadIndex].get();
                        inputWorkload->ReplaceInputTensorHandle(outputHandler.GetData(), workloadInfo.m_SlotIndex);
                    }
                    m_IsOutputImported[outputIndex] = false;
                }

                const TensorPin& pin = workloadData.GetOutputTensorPin(outputLayer->GetBindingId());
                // OutputTensorHandle is not imported yet, so enqueue the output normally
                EnqueueOutput(*outputLayer, pin.GetTensorHandle(), pin.GetTensorInfo());
            }
            outputIndex++;
        }
    }

    std::unique_ptr<TimelineUtilityMethods> timelineUtils =
        TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
    ProfilingGuid inferenceGuid = m_ProfilingService.GetNextGuid();
    if (timelineUtils)
    {
        // Add inference timeline trace if profiling is enabled.
        ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();
        timelineUtils->CreateTypedEntity(inferenceGuid, LabelsAndEventClasses::INFERENCE_GUID);
        timelineUtils->CreateRelationship(ProfilingRelationshipType::RetentionLink,
                                          networkGuid,
                                          inferenceGuid,
                                          LabelsAndEventClasses::EXECUTION_OF_GUID);
        timelineUtils->RecordEvent(inferenceGuid, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS);
    }

    bool executionSucceeded = true;

    {
        if (m_ProfilingService.IsProfilingEnabled())
        {
            m_ProfilingService.IncrementCounterValue(INFERENCES_RUN);
        }
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "Execute");
        ARMNN_SCOPED_HEAP_PROFILING("Executing");
        executionSucceeded = Execute(timelineUtils, inferenceGuid);
    }

    if (timelineUtils)
    {
        // Add end of life of the inference timeline if profiling is enabled.
        timelineUtils->RecordEvent(inferenceGuid, LabelsAndEventClasses::ARMNN_PROFILING_EOL_EVENT_CLASS);
        timelineUtils->Commit();
    }

    return executionSucceeded ? Status::Success : Status::Failure;
}

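// Queues the handling of one network input. If import is enabled and the backend handle
// accepts the configured input memory source, the user buffer is mapped and imported
// (zero copy); otherwise a CopyMemGenericWorkload is queued to copy the data in.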
void LoadedNetwork::EnqueueInput(const BindableLayer& layer, ITensorHandle* tensorHandle, const TensorInfo& tensorInfo)
{
    if (layer.GetType() != LayerType::Input)
    {
        throw InvalidArgumentException("EnqueueInput: given layer not an InputLayer");
    }

    if (tensorHandle == nullptr)
    {
        throw InvalidArgumentException("EnqueueInput: tensorHandle must not be NULL");
    }

    InputQueueDescriptor inputQueueDescriptor;
    WorkloadInfo info;

    inputQueueDescriptor.m_Inputs.push_back(tensorHandle);
    info.m_InputTensorInfos.push_back(tensorInfo);

    ARMNN_ASSERT_MSG(layer.GetNumOutputSlots() == 1, "Can only handle Input Layer with one output");
    const OutputHandler& handler = layer.GetOutputHandler();
    const TensorInfo& outputTensorInfo = handler.GetTensorInfo();
    ITensorHandle* outputTensorHandle = handler.GetData();
    ARMNN_ASSERT_MSG(outputTensorHandle != nullptr,
                     "Data should have been allocated.");
    inputQueueDescriptor.m_Outputs.push_back(outputTensorHandle);
    info.m_OutputTensorInfos.push_back(outputTensorInfo);

    MemorySourceFlags importFlags = outputTensorHandle->GetImportFlags();
    bool needMemCopy = true;
    if (m_NetworkProperties.m_ImportEnabled) // Try to import the input tensor
    {
        if (CheckFlag(importFlags, m_NetworkProperties.m_InputSource))
        {
            needMemCopy = false;
            // This assumes a CPU Tensor handle
            void* mem = tensorHandle->Map(false);
            if (outputTensorHandle->Import(mem, m_NetworkProperties.m_InputSource))
            {
                tensorHandle->Unmap();
                return; // No need for a workload since the import has been done.
            }
            tensorHandle->Unmap();
            throw MemoryImportException("EnqueueInput: Memory Import failed");
        }
    }
    if (needMemCopy)
    {
        // Create a mem copy workload for input since we did not import
        std::unique_ptr<IWorkload> inputWorkload = std::make_unique<CopyMemGenericWorkload>(inputQueueDescriptor, info);

        ARMNN_ASSERT_MSG(inputWorkload, "No input workload created");

        std::unique_ptr<TimelineUtilityMethods> timelineUtils =
            TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
        if (timelineUtils)
        {
            // Add Input Workload to the post-optimisation network structure
            AddWorkloadStructure(timelineUtils, inputWorkload, layer);
            timelineUtils->Commit();
        }

        m_InputQueue.push_back(move(inputWorkload));
    }
}

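// Queues the handling of one network output. Export is attempted only when all of the
// conditions (a)-(e) listed inside hold; a successful export then needs just a
// SyncMemGenericWorkload to make the result visible, while any other case falls back to a
// CopyMemGenericWorkload that copies the result into the user buffer.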
void LoadedNetwork::EnqueueOutput(const BindableLayer& layer, ITensorHandle* tensorHandle, const TensorInfo& tensorInfo)
{
    if (layer.GetType() != LayerType::Output)
    {
        throw InvalidArgumentException("EnqueueOutput: given layer not an OutputLayer");
    }

    if (tensorHandle == nullptr)
    {
        throw InvalidArgumentException("EnqueueOutput: tensorHandle must not be NULL");
    }

    OutputQueueDescriptor outputQueueDescriptor;
    WorkloadInfo info;

    outputQueueDescriptor.m_Outputs.push_back(tensorHandle);
    info.m_OutputTensorInfos.push_back(tensorInfo);

    ARMNN_ASSERT_MSG(layer.GetNumInputSlots() == 1, "Output Layer should have exactly one input.");

    // Gets the output handler from the previous node.
    const OutputHandler& outputHandler = layer.GetInputSlots()[0].GetConnectedOutputSlot()->GetOutputHandler();

    const TensorInfo& inputTensorInfo = outputHandler.GetTensorInfo();
    ITensorHandle* inputTensorHandle = outputHandler.GetData();
    ARMNN_ASSERT_MSG(inputTensorHandle != nullptr, "Data should have been allocated.");

    // Try to import the output tensor.
    // Note: We can only import the output pointer if all of the following hold true:
    // a) The imported pointer is aligned sufficiently
    // b) The tensor has zero padding
    // c) There is only one connection to the OutputSlot and it is to an OutputLayer.
    // d) The output pointer is allocated via malloc. (Other types will be supported in a later release)
    // e) m_ExportEnabled must be set to true
    bool needMemCopy = true;
    if (m_NetworkProperties.m_ExportEnabled &&
        (layer.GetInputSlots()[0].GetConnectedOutputSlot()->GetNumConnections() == 1))
    {
        if (layer.GetInputSlots()[0].GetConnectedOutputSlot()->GetOwningLayer().GetType() != LayerType::Input)
        {
            MemorySourceFlags importFlags = inputTensorHandle->GetImportFlags();
            if (CheckFlag(importFlags, m_NetworkProperties.m_OutputSource))
            {
                needMemCopy = false;
                void* mem = tensorHandle->Map(false);
                bool importOk = inputTensorHandle->Import(mem, m_NetworkProperties.m_OutputSource);
                tensorHandle->Unmap();

                if (importOk)
                {
                    // Insert synchronization workload
                    MemSyncQueueDescriptor syncDesc;
                    syncDesc.m_Inputs.push_back(inputTensorHandle);
                    info.m_InputTensorInfos.push_back(inputTensorInfo);
                    auto syncWorkload = std::make_unique<SyncMemGenericWorkload>(syncDesc, info);
                    ARMNN_ASSERT_MSG(syncWorkload, "No sync workload created");
                    m_OutputQueue.push_back(move(syncWorkload));
                }
                else
                {
                    throw MemoryExportException("EnqueueOutput: Memory Export failed");
                }
            }
        }
    }
    if (needMemCopy)
    {
        // If we got here then we didn't export the memory, so add an output workload which performs a memcopy.
        outputQueueDescriptor.m_Inputs.push_back(inputTensorHandle);
        info.m_InputTensorInfos.push_back(inputTensorInfo);

        std::unique_ptr<IWorkload> outputWorkload =
            std::make_unique<CopyMemGenericWorkload>(outputQueueDescriptor, info);
        ARMNN_ASSERT_MSG(outputWorkload, "No output workload created");

        std::unique_ptr<TimelineUtilityMethods> timelineUtils =
            TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
        if (timelineUtils)
        {
            // Add Output Workload to the post-optimisation network structure
            AddWorkloadStructure(timelineUtils, outputWorkload, layer);
            timelineUtils->Commit();
        }

        m_OutputQueue.push_back(move(outputWorkload));
    }
}

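// Acquires all inter-layer working memory. The lock_guard parameter is deliberately unused:
// it forces every caller to prove that m_WorkingMemMutex is already held, as Execute() does:
//
//     std::lock_guard<std::mutex> lockGuard(m_WorkingMemMutex);
//     AllocateWorkingMemory(lockGuard);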
void LoadedNetwork::AllocateWorkingMemory(std::lock_guard<std::mutex>& lock)
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "Working Memory Allocation");

    // This unused parameter makes sure we can only call this function with a valid lock
    IgnoreUnused(lock);

    if (m_IsWorkingMemAllocated)
    {
        return;
    }

    if (m_ExternalMemoryManager)
    {
        m_ExternalMemoryManager->Allocate();

        for (unsigned int i = 0; i < m_TensorMemory.size(); ++i)
        {
            m_Tensorhandles[i]->Import(m_TensorMemory[i].first->m_Data, m_TensorMemory[i].second);
        }
    }

    for (auto&& memoryManager : m_BackendMemoryMangers)
    {
        if (memoryManager)
        {
            memoryManager->Acquire();
        }
    }
    m_TensorHandleFactoryRegistry.AquireMemory();
    m_IsWorkingMemAllocated = true;
}

void LoadedNetwork::FreeWorkingMemory()
{
    std::lock_guard<std::mutex> lockGuard(m_WorkingMemMutex);

    if (!m_IsWorkingMemAllocated)
    {
        return;
    }

    if (m_ExternalMemoryManager)
    {
        m_ExternalMemoryManager->Deallocate();
    }

    // Informs the memory managers to release memory in their respective memory groups
    for (auto&& memoryManager : m_BackendMemoryMangers)
    {
        if (memoryManager)
        {
            memoryManager->Release();
        }
    }
    m_TensorHandleFactoryRegistry.ReleaseMemory();
    m_IsWorkingMemAllocated = false;
}

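// Runs one synchronous inference under m_WorkingMemMutex: working memory is acquired lazily,
// then the input, workload and output queues execute in order. When profiling is active each
// workload gets its own inference-scoped start/end of life events. Exceptions are logged and
// converted into a false return value.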
David Monahan6198fe02019-12-02 08:35:43 +00001144bool LoadedNetwork::Execute(std::unique_ptr<TimelineUtilityMethods>& timelineUtils,
Cathal Corbett5aa9fd72022-02-25 15:33:28 +00001145 ProfilingGuid inferenceGuid)
telsoa014fcda012018-03-09 14:13:49 +00001146{
1147 bool success = true;
1148
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +01001149 auto Fail = [&](const std::exception& error)
1150 {
Derek Lamberti08446972019-11-26 16:38:31 +00001151 ARMNN_LOG(error) << "An error occurred attempting to execute a workload: " << error.what();
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +01001152 success = false;
1153 };
1154
telsoa014fcda012018-03-09 14:13:49 +00001155 try
1156 {
Matthew Bentham2a326b52019-03-19 10:11:01 +00001157 std::lock_guard<std::mutex> lockGuard(m_WorkingMemMutex);
Derek Lambertia08d29b2020-06-19 14:33:05 +01001158 AllocateWorkingMemory(lockGuard);
Derek Lamberti03614f62018-10-02 15:52:46 +01001159
David Monahan6198fe02019-12-02 08:35:43 +00001160 ProfilingDynamicGuid workloadInferenceID(0);
Derek Lambertia08d29b2020-06-19 14:33:05 +01001161 auto ExecuteQueue = [&timelineUtils, &workloadInferenceID, &inferenceGuid](WorkloadQueue& queue)
telsoa014fcda012018-03-09 14:13:49 +00001162 {
Derek Lambertia08d29b2020-06-19 14:33:05 +01001163 for (auto& workload : queue)
David Monahan6198fe02019-12-02 08:35:43 +00001164 {
Derek Lambertia08d29b2020-06-19 14:33:05 +01001165 if(timelineUtils)
1166 {
1167 workloadInferenceID = timelineUtils->RecordWorkloadInferenceAndStartOfLifeEvent(workload->GetGuid(),
1168 inferenceGuid);
1169 }
1170 workload->Execute();
1171 if(timelineUtils)
1172 {
1173 timelineUtils->RecordEndOfLifeEvent(workloadInferenceID);
1174 }
David Monahan6198fe02019-12-02 08:35:43 +00001175 }
Derek Lambertia08d29b2020-06-19 14:33:05 +01001176 };
Derek Lamberti03614f62018-10-02 15:52:46 +01001177
Derek Lambertia08d29b2020-06-19 14:33:05 +01001178 ExecuteQueue(m_InputQueue);
1179 ExecuteQueue(m_WorkloadQueue);
1180 ExecuteQueue(m_OutputQueue);
telsoa014fcda012018-03-09 14:13:49 +00001181 }
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +01001182 catch (const RuntimeException& error)
telsoa014fcda012018-03-09 14:13:49 +00001183 {
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +01001184 Fail(error);
telsoa014fcda012018-03-09 14:13:49 +00001185 }
telsoa014fcda012018-03-09 14:13:49 +00001186 catch (const std::runtime_error& error)
1187 {
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +01001188 Fail(error);
telsoa014fcda012018-03-09 14:13:49 +00001189 }
1190
telsoa014fcda012018-03-09 14:13:49 +00001191 return success;
1192}
1193
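// Execute() above is driven by the public IRuntime::EnqueueWorkload call. A hedged usage
// sketch of that flow (assumes an optimized network 'optNet' and pre-sized data vectors;
// binding ids and names are illustrative, not taken from this file):
//
//     armnn::IRuntime::CreationOptions options;
//     armnn::IRuntimePtr runtime = armnn::IRuntime::Create(options);
//     armnn::NetworkId netId;
//     runtime->LoadNetwork(netId, std::move(optNet));
//
//     armnn::InputTensors inputs
//     {
//         {0, armnn::ConstTensor(runtime->GetInputTensorInfo(netId, 0), inputData.data())}
//     };
//     armnn::OutputTensors outputs
//     {
//         {0, armnn::Tensor(runtime->GetOutputTensorInfo(netId, 0), outputData.data())}
//     };
//     runtime->EnqueueWorkload(netId, inputs, outputs);
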
void LoadedNetwork::EnqueueInput(const ConstTensor& inputTensor, ITensorHandle* inputTensorHandle)
{
    if (m_NetworkProperties.m_ImportEnabled) // Try to import the input tensor
    {
        MemorySourceFlags importFlags = inputTensorHandle->GetImportFlags();
        if (CheckFlag(importFlags, m_NetworkProperties.m_InputSource))
        {
            std::unique_ptr<ITensorHandle> tensorHandle =
                std::make_unique<ConstPassthroughTensorHandle>(inputTensor.GetInfo(),
                                                               inputTensor.GetMemoryArea());
            void* mem = tensorHandle->Map(false);

            if (inputTensorHandle->Import(mem, m_NetworkProperties.m_InputSource))
            {
                tensorHandle->Unmap();
                return;
            }
            tensorHandle->Unmap();
            throw MemoryImportException("EnqueueInput: Memory Import failed");
        }
        else
        {
            throw MemoryImportException("EnqueueInput: Memory Import failed, backend does not support Import");
        }
    }
    else
    {
        std::unique_ptr<ITensorHandle> tensorHandle =
            std::make_unique<ConstPassthroughTensorHandle>(inputTensor.GetInfo(), inputTensor.GetMemoryArea());

        auto copyFunc = [](void* dst, const void* src, size_t size)
        {
            memcpy(dst, src, size);
        };

        CopyTensorContentsGeneric(tensorHandle.get(), inputTensorHandle, copyFunc);
    }
}
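
// Whether EnqueueInput imports or copies is decided by the INetworkProperties that the
// network was loaded with. A hedged sketch of opting in to zero-copy input import
// (constructor arguments vary between ArmNN versions; 'runtime' and 'optNet' as in the
// earlier sketch):
//
//     armnn::INetworkProperties props(/*asyncEnabled=*/false,
//                                     /*inputSource=*/armnn::MemorySource::Malloc,
//                                     /*outputSource=*/armnn::MemorySource::Undefined);
//     std::string errorMessage;
//     runtime->LoadNetwork(netId, std::move(optNet), errorMessage, props);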

// Note: We can only import the output pointer if all of the following hold true:
// a) The imported pointer is aligned sufficiently
// b) The tensor has zero padding
// c) There is only one connection to the OutputSlot and it is to an OutputLayer.
// d) The output pointer is allocated via malloc. (Other types will be supported in a later release)
// e) m_IsExportEnabled must be set to true
void LoadedNetwork::ImportOutputTensor(const Tensor& outputTensor, ITensorHandle* outputTensorHandle)
{
    ARMNN_ASSERT_MSG(outputTensorHandle != nullptr, "Data should have been allocated.");
    MemorySourceFlags importFlags = outputTensorHandle->GetImportFlags();
    if (CheckFlag(importFlags, m_NetworkProperties.m_OutputSource))
    {
        std::unique_ptr<ITensorHandle> tensorHandle =
            std::make_unique<PassthroughTensorHandle>(outputTensor.GetInfo(),
                                                      outputTensor.GetMemoryArea());

        void* mem = tensorHandle->Map(false);
        bool importOk = outputTensorHandle->Import(mem, m_NetworkProperties.m_OutputSource);
        tensorHandle->Unmap();

        if (!importOk)
        {
            throw MemoryExportException("ImportOutputTensor: Memory Export failed");
        }
    }
    else
    {
        throw MemoryExportException("ImportOutputTensor: Memory Export failed, backend does not support Export");
    }
}
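
// A hedged sketch of an output buffer that satisfies the conditions listed above:
// heap-allocated and sized from the bound output's TensorInfo, so the backend can write
// results into it directly instead of copying (names are illustrative):
//
//     armnn::TensorInfo outInfo = runtime->GetOutputTensorInfo(netId, 0);
//     std::vector<float> outBuffer(outInfo.GetNumElements()); // malloc-backed, float-aligned
//     armnn::OutputTensors outputs{ {0, armnn::Tensor(outInfo, outBuffer.data())} };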

void CopyToOutputTensor(const Tensor& outputTensor, ITensorHandle* outputTensorHandle)
{
    auto copyFunc = [](void* dst, const void* src, size_t size)
    {
        memcpy(dst, src, size);
    };

    std::unique_ptr<ITensorHandle> tensorHandle =
        std::make_unique<PassthroughTensorHandle>(outputTensor.GetInfo(),
                                                  outputTensor.GetMemoryArea());

    CopyTensorContentsGeneric(outputTensorHandle, tensorHandle.get(), copyFunc);
}

const armnn::ConstTensor GetInputTensor(const LayerBindingId layerId, const InputTensors& inputTensors)
{
    for (const auto& inputTensorPair : inputTensors)
    {
        LayerBindingId id = inputTensorPair.first;
        if (id == layerId)
        {
            return inputTensorPair.second;
        }
    }
    throw InvalidArgumentException("Input does not exist.");
}

const armnn::Tensor GetOutputTensor(const LayerBindingId layerId, const OutputTensors& outputTensors)
{
    for (const auto& outputTensorPair : outputTensors)
    {
        LayerBindingId id = outputTensorPair.first;
        if (id == layerId)
        {
            return outputTensorPair.second;
        }
    }
    throw InvalidArgumentException("Output does not exist.");
}

std::vector<ImportedInputId> LoadedNetwork::ImportInputs(const InputTensors& inputTensors,
                                                         MemorySource forceImportMemorySource)
{
    if (!m_NetworkProperties.m_AsyncEnabled)
    {
        // Cannot import if import is not enabled and forceImportMemorySource is undefined
        if (forceImportMemorySource == MemorySource::Undefined)
        {
            throw MemoryImportException("ImportInputs: Memory Import failed, forceImportMemorySource is "
                                        "undefined and the network was not loaded with import enabled");
        }
        if (inputTensors.size() != m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().GetNumInputs())
        {
            throw MemoryImportException("ImportInputs: Force Import failed, incorrect number of tensors");
        }

        std::vector<ImportedInputId> importedInputs;
        Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();
        unsigned int inputIndex = 0;
        for (const BindableLayer* inputLayer : graph.GetInputLayers())
        {
            auto outputTensorHandle = m_PreImportedInputHandles[inputIndex].m_TensorHandle.get();

            if (!outputTensorHandle)
            {
                inputIndex++;
                continue;
            }

            auto layerBindingId = inputLayer->GetBindingId();
            auto it = std::find_if(inputTensors.begin(), inputTensors.end(), [=](const auto& inputTensor)
            {
                return inputTensor.first == layerBindingId;
            });

            if (it == inputTensors.end())
            {
                inputIndex++;
                continue;
            }

            const auto& inputTensor = *it;
            std::unique_ptr<ITensorHandle> passThroughTensorHandle =
                std::make_unique<ConstPassthroughTensorHandle>(inputTensor.second.GetInfo(),
                                                               inputTensor.second.GetMemoryArea());

            if (outputTensorHandle->CanBeImported(passThroughTensorHandle->Map(), forceImportMemorySource)
                && (outputTensorHandle->Import(passThroughTensorHandle->Map(), forceImportMemorySource)))
            {
                importedInputs.push_back(inputIndex);
            }
            passThroughTensorHandle->Unmap();

            inputIndex++;
        }

        return importedInputs;
    }
    else
    {
        // Import when import is enabled in the network properties
        std::vector<ImportedInputId> importedInputs;
        Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();

        for (auto inputTensor : inputTensors)
        {
            auto layerBindingId = inputTensor.first;
            auto it = std::find_if(graph.GetInputLayers().begin(), graph.GetInputLayers().end(), [=](auto* layer)
            {
                return layer->GetBindingId() == layerBindingId;
            });

            if (it == graph.GetInputLayers().end())
            {
                throw MemoryImportException(fmt::format(
                    "ImportInputs: Memory Import failed, unknown LayerBindingId: {}", layerBindingId));
            }

            const Layer* layer = *it;
            if (layer->GetType() != LayerType::Input)
            {
                throw InvalidArgumentException("ImportInputs: given layer not an InputLayer");
            }

            auto& backend = m_Backends.at(layer->GetBackendId());
            if (!HasCapability(BackendOptions::BackendOption{"PreImportIOTensors", true}, backend->GetCapabilities()))
            {
                std::string er = backend->GetId();
                er += " does not have PreImportIOTensors capability";
                throw BackendCapabilityException(er);
            }

            const OutputSlot& outputSlot = layer->GetOutputSlots()[0];

            ITensorHandleFactory::FactoryId factoryId = outputSlot.GetTensorHandleFactoryId();
            const TensorInfo& tensorInfo = outputSlot.GetTensorInfo();

            ITensorHandleFactory* handleFactory = m_TensorHandleFactoryRegistry.GetFactory(factoryId);
            ARMNN_ASSERT(handleFactory);

            ImportedTensorHandlePin importedTensorHandlePin{layerBindingId,
                                                            handleFactory->CreateTensorHandle(tensorInfo, false)};

            ITensorHandle* tensorHandle = importedTensorHandlePin.m_TensorHandle.get();

            if (!CheckFlag(tensorHandle->GetImportFlags(), m_NetworkProperties.m_InputSource))
            {
                throw MemoryImportException(
                    fmt::format("ImportInputs: Memory Import failed, backend: "
                                "{} does not support importing from source {}",
                                factoryId, m_NetworkProperties.m_InputSource));
            }

            std::unique_ptr<ITensorHandle> passThroughTensorHandle =
                std::make_unique<ConstPassthroughTensorHandle>(inputTensor.second.GetInfo(),
                                                               inputTensor.second.GetMemoryArea());

            if (tensorHandle->Import(passThroughTensorHandle->Map(), m_NetworkProperties.m_InputSource))
            {
                importedInputs.push_back(m_CurImportedInputId++);
                passThroughTensorHandle->Unmap();
            }
            else
            {
                passThroughTensorHandle->Unmap();
                throw MemoryImportException("ImportInputs: Memory Import failed");
            }

            m_PreImportedInputHandles.push_back(std::move(importedTensorHandlePin));
        }
        return importedInputs;
    }
}
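
// A hedged sketch of pre-importing inputs once and reusing them across async executions
// (IRuntime forwards to the functions above; exact signatures vary between ArmNN versions,
// and buffer and handle names are illustrative):
//
//     auto memHandle = runtime->CreateWorkingMemHandle(netId);
//     std::vector<armnn::ImportedInputId> importedIds =
//         runtime->ImportInputs(netId, inputs); // 'inputs' must alias long-lived buffers
//     // Later inferences can skip the per-call input copy:
//     runtime->Execute(*memHandle, {}, outputs, importedIds);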

std::vector<ImportedOutputId> LoadedNetwork::ImportOutputs(const OutputTensors& outputTensors,
                                                           MemorySource forceImportMemorySource)
{
    if (!m_NetworkProperties.m_AsyncEnabled)
    {
        // Cannot import if import is not enabled and forceImportMemorySource is undefined
        if (forceImportMemorySource == MemorySource::Undefined)
        {
            throw MemoryImportException("ImportOutputs: Memory Import failed, forceImportMemorySource is "
                                        "undefined and the network was not loaded with import enabled");
        }
        // If forceImportMemorySource is defined, try to import if the memory is aligned
        if (outputTensors.size() != m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().GetNumOutputs())
        {
            throw MemoryImportException("ImportOutputs: Force Import failed, incorrect number of tensors");
        }
        std::vector<ImportedOutputId> importedOutputs;
        Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();

        unsigned int outputIndex = 0;
        for (const BindableLayer* const outputLayer : graph.GetOutputLayers())
        {
            auto inputTensorHandle = m_PreImportedOutputHandles[outputIndex].m_TensorHandle.get();

            if (!inputTensorHandle)
            {
                outputIndex++;
                continue;
            }

            auto layerBindingId = outputLayer->GetBindingId();
            auto it = std::find_if(outputTensors.begin(), outputTensors.end(), [=](const auto& outputTensor)
            {
                return outputTensor.first == layerBindingId;
            });

            if (it == outputTensors.end())
            {
                outputIndex++;
                continue;
            }

            const auto outputTensor = *it;
            // Check if the output memory can be imported
            if (inputTensorHandle->CanBeImported(outputTensor.second.GetMemoryArea(), forceImportMemorySource)
                && inputTensorHandle->Import(outputTensor.second.GetMemoryArea(), forceImportMemorySource))
            {
                importedOutputs.push_back(outputIndex);
            }
            outputIndex++;
        }
        return importedOutputs;
    }

    std::vector<ImportedOutputId> importedOutputs;
    Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();

    for (const auto& outputTensor : outputTensors)
    {
        auto layerBindingId = outputTensor.first;
        auto it = std::find_if(graph.GetOutputLayers().begin(), graph.GetOutputLayers().end(), [=](auto* layer)
        {
            return layer->GetBindingId() == layerBindingId;
        });

        if (it == graph.GetOutputLayers().end())
        {
            throw MemoryImportException(fmt::format("ImportOutputs: Memory Import failed, unknown LayerBindingId: {}",
                                                    layerBindingId));
        }

        const Layer* layer = *it;
        if (layer->GetType() != LayerType::Output)
        {
            throw InvalidArgumentException("ImportOutputs: given layer not an OutputLayer");
        }

        auto& backend = m_Backends.at(layer->GetBackendId());
        if (!HasCapability(BackendOptions::BackendOption{"PreImportIOTensors", true}, backend->GetCapabilities()))
        {
            std::string er = backend->GetId();
            er += " does not have PreImportIOTensors capability";
            throw BackendCapabilityException(er);
        }

        const InputSlot& inputSlot = layer->GetInputSlots()[0];
        ITensorHandleFactory::FactoryId factoryId = inputSlot.GetConnectedOutputSlot()->GetTensorHandleFactoryId();
        const TensorInfo& tensorInfo = inputSlot.GetConnectedOutputSlot()->GetTensorInfo();

        ITensorHandleFactory* handleFactory = m_TensorHandleFactoryRegistry.GetFactory(factoryId);
        ARMNN_ASSERT(handleFactory);

        ImportedTensorHandlePin importedTensorHandlePin{layerBindingId,
                                                        handleFactory->CreateTensorHandle(tensorInfo, false)};

        ITensorHandle* tensorHandle = importedTensorHandlePin.m_TensorHandle.get();

        if (!CheckFlag(tensorHandle->GetImportFlags(), m_NetworkProperties.m_OutputSource))
        {
            throw MemoryImportException(fmt::format("ImportOutputs: Memory Import failed, backend: "
                                                    "{} does not support importing from source {}",
                                                    factoryId, m_NetworkProperties.m_OutputSource));
        }

        if (tensorHandle->Import(outputTensor.second.GetMemoryArea(), m_NetworkProperties.m_OutputSource))
        {
            importedOutputs.push_back(m_CurImportedOutputId++);
        }
        else
        {
            throw MemoryImportException("ImportOutputs: Memory Import failed");
        }

        m_PreImportedOutputHandles.push_back(std::move(importedTensorHandlePin));
    }

    return importedOutputs;
}

void LoadedNetwork::ClearImportedInputs(const std::vector<ImportedInputId> inputIds)
{
    for (auto id : inputIds)
    {
        if (id >= m_PreImportedInputHandles.size())
        {
            throw InvalidArgumentException(fmt::format("ClearImportedInputs::Unknown ImportedInputId: {}", id));
        }

        auto& importedTensorHandle = m_PreImportedInputHandles[id].m_TensorHandle;
        if (!importedTensorHandle)
        {
            throw InvalidArgumentException(
                fmt::format("ClearImportedInputs::ImportedInput with id: {} has already been deleted", id));
        }
        // Call Unimport then destroy the tensorHandle
        importedTensorHandle->Unimport();
        importedTensorHandle = {};
    }
}

void LoadedNetwork::ClearImportedOutputs(const std::vector<ImportedOutputId> outputIds)
{
    for (auto id : outputIds)
    {
        if (id >= m_PreImportedOutputHandles.size())
        {
            throw InvalidArgumentException(fmt::format("ClearImportedOutputs::Unknown ImportedOutputId: {}", id));
        }

        auto& importedTensorHandle = m_PreImportedOutputHandles[id].m_TensorHandle;
        if (!importedTensorHandle)
        {
            throw InvalidArgumentException(
                fmt::format("ClearImportedOutputs::ImportedOutput with id: {} has already been deleted", id));
        }
        // Call Unimport then destroy the tensorHandle
        importedTensorHandle->Unimport();
        importedTensorHandle = {};
    }
}
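
// A hedged sketch of the pre-import lifecycle: imported ids stay valid until they are
// explicitly cleared here, after which reusing an id throws InvalidArgumentException
// (runtime-level calls shown; names illustrative):
//
//     auto inIds  = runtime->ImportInputs(netId, inputs);
//     auto outIds = runtime->ImportOutputs(netId, outputs);
//     runtime->Execute(*memHandle, {}, {}, inIds, outIds);
//     runtime->ClearImportedInputs(netId, inIds);   // Unimport() and release the handles
//     runtime->ClearImportedOutputs(netId, outIds);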

Status LoadedNetwork::Execute(const InputTensors& inputTensors,
                              const OutputTensors& outputTensors,
                              IWorkingMemHandle& iWorkingMemHandle,
                              std::vector<ImportedInputId> preImportedInputs,
                              std::vector<ImportedOutputId> preImportedOutputs)
{
    const Graph& graph = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();

    if (inputTensors.size() + preImportedInputs.size() != graph.GetNumInputs())
    {
        if (preImportedInputs.empty())
        {
            throw InvalidArgumentException("LoadedNetwork::Execute: "
                                           "Number of inputs provided does not match network.");
        }
        else
        {
            throw InvalidArgumentException("LoadedNetwork::Execute: "
                                           "Number of inputs + preImportedInputs provided does not match network.");
        }
    }

    if (outputTensors.size() + preImportedOutputs.size() != graph.GetNumOutputs())
    {
        if (preImportedOutputs.empty())
        {
            throw InvalidArgumentException("LoadedNetwork::Execute: "
                                           "Number of outputs provided does not match network.");
        }
        else
        {
            throw InvalidArgumentException("LoadedNetwork::Execute: "
                                           "Number of outputs + preImportedOutputs provided does not match network.");
        }
    }

    WorkingMemHandle& workingMemHandle = dynamic_cast<WorkingMemHandle&>(iWorkingMemHandle);
    // Collect all the given LayerBindingIds and check them for duplicates and unknowns.
    std::vector<LayerBindingId>& bindingIds = workingMemHandle.GetBindingIdVector();
    unsigned int index = 0;
    for (auto pair : inputTensors)
    {
        bindingIds[index++] = pair.first;
    }
    for (ImportedInputId id : preImportedInputs)
    {
        bindingIds[index++] = ValidateImportedInputID(id);
    }
    for (auto pair : outputTensors)
    {
        bindingIds[index++] = pair.first;
    }
    for (ImportedOutputId id : preImportedOutputs)
    {
        bindingIds[index++] = ValidateImportedOutputID(id);
    }

    workingMemHandle.ValidateBindingIds();

    auto resetMemHandle = [&]()
    {
        for (ImportedInputId id : preImportedInputs)
        {
            const LayerBindingId layerBindingId = m_PreImportedInputHandles[id].m_LayerBindingId;

            auto inputHandle = workingMemHandle.GetInputHandle(layerBindingId);
            auto inputConnections = workingMemHandle.GetInputConnections(layerBindingId);
            for (auto it : inputConnections)
            {
                *it = inputHandle;
            }
        }

        for (ImportedOutputId id : preImportedOutputs)
        {
            const LayerBindingId layerBindingId = m_PreImportedOutputHandles[id].m_LayerBindingId;

            auto outputHandle = workingMemHandle.GetOutputHandle(layerBindingId);
            auto outputConnections = workingMemHandle.GetOutputConnection(layerBindingId);

            for (auto it : outputConnections)
            {
                *it = outputHandle;
            }
        }
    };

    std::unique_ptr<TimelineUtilityMethods> timelineUtils =
        TimelineUtilityMethods::GetTimelineUtils(m_ProfilingService);
    ProfilingGuid inferenceGuid = m_ProfilingService.GetNextGuid();
    if (timelineUtils)
    {
        // Add inference timeline trace if profiling is enabled.
        ProfilingGuid networkGuid = m_OptimizedNetwork->GetGuid();
        timelineUtils->CreateTypedEntity(inferenceGuid, LabelsAndEventClasses::INFERENCE_GUID);
        timelineUtils->CreateRelationship(ProfilingRelationshipType::RetentionLink,
                                          networkGuid,
                                          inferenceGuid,
                                          LabelsAndEventClasses::EXECUTION_OF_GUID);
        timelineUtils->RecordEvent(inferenceGuid, LabelsAndEventClasses::ARMNN_PROFILING_SOL_EVENT_CLASS);
    }

    bool executionSucceeded = true;

    if (timelineUtils)
    {
        // Add end of life of the inference timeline if profiling is enabled.
        timelineUtils->RecordEvent(inferenceGuid, LabelsAndEventClasses::ARMNN_PROFILING_EOL_EVENT_CLASS);
        timelineUtils->Commit();
    }

    if (!workingMemHandle.IsAllocated())
    {
        workingMemHandle.Allocate();
    }

    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareInputs");
        for (auto pair : inputTensors)
        {
            EnqueueInput(pair.second, workingMemHandle.GetInputHandle(pair.first));
        }

        // Swap in the pre-imported inputs if any
        for (ImportedInputId id : preImportedInputs)
        {
            const ImportedTensorHandlePin& importedInputPin = m_PreImportedInputHandles[id];
            const LayerBindingId layerBindingId = m_PreImportedInputHandles[id].m_LayerBindingId;
            const auto& preimportedHandle = importedInputPin.m_TensorHandle;

            auto inputConnections = workingMemHandle.GetInputConnections(layerBindingId);
            for (auto it : inputConnections)
            {
                *it = preimportedHandle.get();
            }
        }
    }
    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "PrepareOutputs");
        if (m_NetworkProperties.m_ExportEnabled)
        {
            for (auto pair : outputTensors)
            {
                ImportOutputTensor(pair.second, workingMemHandle.GetOutputHandle(pair.first));
            }
        }

        for (ImportedOutputId id : preImportedOutputs)
        {
            const ImportedTensorHandlePin& importedOutputPin = m_PreImportedOutputHandles[id];
            const LayerBindingId layerBindingId = m_PreImportedOutputHandles[id].m_LayerBindingId;
            const auto& preimportedHandle = importedOutputPin.m_TensorHandle;

            auto outputConnections = workingMemHandle.GetOutputConnection(layerBindingId);

            for (auto it : outputConnections)
            {
                *it = preimportedHandle.get();
            }
        }
    }

    auto Fail = [&](const std::exception& error)
    {
        ARMNN_LOG(error) << "An error occurred attempting to execute a workload: " << error.what();
        executionSucceeded = false;
    };
    ProfilingDynamicGuid workloadInferenceID(0);

    try
    {
        for (unsigned int i = 0; i < m_WorkloadQueue.size(); ++i)
        {
            auto& workload = m_WorkloadQueue[i];
            if (timelineUtils)
            {
                workloadInferenceID = timelineUtils->RecordWorkloadInferenceAndStartOfLifeEvent(
                    workload->GetGuid(), inferenceGuid);
            }
            workload->ExecuteAsync(workingMemHandle.GetWorkingMemDescriptorAt(i));

            if (timelineUtils)
            {
                timelineUtils->RecordEndOfLifeEvent(workloadInferenceID);
            }
        }
    }
    catch (const RuntimeException& error)
    {
        resetMemHandle();
        Fail(error);
    }
    catch (const std::runtime_error& error)
    {
        resetMemHandle();
        Fail(error);
    }
    catch (...)
    {
        resetMemHandle();
        throw;
    }

    if (!m_NetworkProperties.m_ExportEnabled)
    {
        for (auto pair : outputTensors)
        {
            CopyToOutputTensor(pair.second, workingMemHandle.GetOutputHandle(pair.first));
        }
    }
    else
    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "SyncMemGeneric_Execute");
        workingMemHandle.MemSyncOutputs();
    }

    resetMemHandle();

    return executionSucceeded ? Status::Success : Status::Failure;
}

/// Create a new unique WorkingMemHandle object. Create multiple handles if you wish to have
/// overlapped Executions; each thread should obtain its own handle via this function and pass
/// it to Execute. (A hedged usage sketch follows the function body below.)
std::unique_ptr<IWorkingMemHandle> LoadedNetwork::CreateWorkingMemHandle(NetworkId networkId)
{
    Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph();

    // Tensors that will need to be allocated internally within armnn
    std::vector<std::unique_ptr<ITensorHandle>> managedTensorHandles;
    // Tensors that will be allocated externally by the user
    std::vector<std::unique_ptr<ITensorHandle>> unmanagedTensorHandles;

    std::vector<WorkingMemDescriptor> workingMemDescriptors;
    std::unordered_map<LayerGuid, WorkingMemDescriptor> workingMemDescriptorMap;

    auto GetTensorHandle = [&](Layer* layer, const OutputSlot& outputSlot)
    {
        ITensorHandleFactory::FactoryId factoryId = outputSlot.GetTensorHandleFactoryId();
        const TensorInfo& tensorInfo = outputSlot.GetTensorInfo();

        if (factoryId == ITensorHandleFactory::LegacyFactoryId)
        {
            BackendId id = layer->GetBackendId();
            ARMNN_NO_DEPRECATE_WARN_BEGIN
            return m_WorkloadFactories.at(id)->CreateTensorHandle(tensorInfo, false);
            ARMNN_NO_DEPRECATE_WARN_END
        }
        else
        {
            ITensorHandleFactory* handleFactory = m_TensorHandleFactoryRegistry.GetFactory(factoryId);
            ARMNN_ASSERT(handleFactory);
            return handleFactory->CreateTensorHandle(tensorInfo, false);
        }
    };

    struct HandleInfo
    {
        ITensorHandle* m_TensorHandle;

        bool m_IsInputLayerHandle = false;
        bool m_IsOutputLayerHandle = false;

        WorkingMemHandle::InputMemDescriptorCoords m_InputMemDescriptorCoords;
        WorkingMemHandle::OutputMemDescriptorCoords m_OutputMemDescriptorCoords;
    };

    std::unordered_map<const OutputSlot*, HandleInfo> outputToHandleInfoMap;

    unsigned int layerIndex = 0;
    for (auto&& layer : order)
    {
        // Constant layers execution and management is handled during loaded network construction
        if (layer->GetType() == LayerType::Constant)
        {
            continue;
        }

        WorkingMemDescriptor workingMemDescriptor;

        bool isMemoryManaged = true;
        bool isInputLayer = false;
        bool isOutputLayer = false;
        bool isConnectedToOutputLayer = false;

        if (layer->GetType() == LayerType::Input || layer->GetType() == LayerType::MemImport)
        {
            // Input layers/workloads will not be executed, so the descriptor is not added to
            // workingMemDescriptors. However we will still need to manage the tensorHandle.
            isInputLayer = true;
            isMemoryManaged = !m_NetworkProperties.m_ImportEnabled;
        }
        else if (layer->GetType() == LayerType::Output)
        {
            isOutputLayer = true;
        }

        unsigned int slotIndex = 0;
        // Create a tensor handle for each output slot of a layer.
        // Once we create it, we start managing its lifetime.
        for (auto& slot : layer->GetOutputSlots())
        {
            for (unsigned int i = 0; i < slot.GetNumConnections(); ++i)
            {
                if ((slot.GetConnection(i)->GetOwningLayer().GetType() == LayerType::Output))
                {
                    if (!isConnectedToOutputLayer)
                    {
                        isConnectedToOutputLayer = true;
                        // If Export is enabled disable memory management, so we can export; otherwise we do a copy
                        isMemoryManaged = !m_NetworkProperties.m_ExportEnabled;
                    }
                    else
                    {
                        // Importing in this case would likely cause unexpected behaviour, so we disallow it.
                        ARMNN_LOG(warning) <<
                            fmt::format("Layer name: '{0}' guid: '{1}' has two or more OutputLayers connected to it. "
                                        "This will prevent importing on the connected OutputLayers.",
                                        layer->GetName(), layer->GetGuid());
                        isMemoryManaged = true;
                    }
                }
            }

            ITensorHandle* tensorHandle;
            if (isMemoryManaged)
            {
                managedTensorHandles.emplace_back(GetTensorHandle(layer, slot));
                tensorHandle = managedTensorHandles.back().get();
            }
            else
            {
                unmanagedTensorHandles.emplace_back(GetTensorHandle(layer, slot));
                tensorHandle = unmanagedTensorHandles.back().get();
            }

            workingMemDescriptor.m_Outputs.push_back(tensorHandle);

            HandleInfo& handleInfo = outputToHandleInfoMap[&slot];
            handleInfo.m_TensorHandle = tensorHandle;

            // Store the coordinates of the current layer's OutputSlot that is connected to the OutputLayer
            if (isConnectedToOutputLayer)
            {
                handleInfo.m_IsOutputLayerHandle = true;
                handleInfo.m_OutputMemDescriptorCoords.m_OutputSlotCoords = {layerIndex, slotIndex};
            }
            // Store the LayerBindingId of the InputLayer
            if (isInputLayer)
            {
                handleInfo.m_IsInputLayerHandle = true;
                LayerBindingId bindingId = static_cast<BindableLayer*>(layer)->GetBindingId();
                handleInfo.m_InputMemDescriptorCoords.m_LayerBindingId = bindingId;
            }
            slotIndex++;
        }
1953 // Loop through the input slots in the same layer and decrement the reference counter associated
1954 // to each tensor handle we encounter.
Finn Williams8636bc72021-10-02 15:06:39 +01001955 // Once it reaches zero, the lifetime of the tensor handle has ended, and we mark its memory as available
1956 // so that the next tensor handle with a non overlapping lifetime can share its memory.
Finn Williams01097942021-04-26 12:06:34 +01001957 for (auto& slot : layer->GetInputSlots())
1958 {
1959 ARMNN_ASSERT(slot.GetConnection());
1960 auto outputSlot = slot.GetConnectedOutputSlot();
1961 auto key = outputSlot->GetOwningLayer().GetGuid();
1962
1963 // Constant layers execution and management is handled during loaded network construction
1964 auto found = m_ConstantTensorHandles.find(key);
1965 if (found != m_ConstantTensorHandles.end())
1966 {
Finn Williamsea0712e2021-10-14 11:22:19 +01001967 ITensorHandle* tensorHandle = found->second;
1968 workingMemDescriptor.m_Inputs.push_back(tensorHandle);
1969
1970 // Odd case where a constant layer is connected to an output layer
1971 // We will need to create a HandleInfo to track it
1972 if (isOutputLayer)
1973 {
1974 LayerBindingId bindingId = static_cast<BindableLayer*>(layer)->GetBindingId();
1975
Finn Williamsb1aad422021-10-28 19:07:32 +01001976 HandleInfo& handleInfo = outputToHandleInfoMap[outputSlot];
1977 handleInfo.m_TensorHandle = tensorHandle;
1978 handleInfo.m_IsOutputLayerHandle = true;
Finn Williamsea0712e2021-10-14 11:22:19 +01001979 handleInfo.m_OutputMemDescriptorCoords.m_LayerBindingIds.push_back(bindingId);
1980 handleInfo.m_OutputMemDescriptorCoords.m_InputSlotCoords.push_back({layerIndex, 0});
1981 }
Finn Williams01097942021-04-26 12:06:34 +01001982 continue;
1983 }
1984
Finn Williamsb1aad422021-10-28 19:07:32 +01001985 HandleInfo& handleInfo = outputToHandleInfoMap.at(outputSlot);
Finn Williamsf37b9702021-09-01 18:06:04 +01001986
Finn Williamsb1aad422021-10-28 19:07:32 +01001987 ITensorHandle* inputTensorHandle = handleInfo.m_TensorHandle;
1988 workingMemDescriptor.m_Inputs.push_back(inputTensorHandle);
Finn Williamsf37b9702021-09-01 18:06:04 +01001989
Finn Williams8636bc72021-10-02 15:06:39 +01001990 // Store the LayerBindingId of the OutputLayer
1991 if (isOutputLayer)
Finn Williamsf37b9702021-09-01 18:06:04 +01001992 {
Finn Williams8636bc72021-10-02 15:06:39 +01001993 LayerBindingId bindingId = static_cast<BindableLayer*>(layer)->GetBindingId();
1994 handleInfo.m_OutputMemDescriptorCoords.m_LayerBindingIds.push_back(bindingId);
Finn Williamsea0712e2021-10-14 11:22:19 +01001995 handleInfo.m_OutputMemDescriptorCoords.m_InputSlotCoords.push_back({layerIndex, 0});
Finn Williams8636bc72021-10-02 15:06:39 +01001996 }
Finn Williamsea0712e2021-10-14 11:22:19 +01001997 // In this case the layer is not an Output Layer but shares its input tensorhandle with an OutputLayer
Finn Williams8636bc72021-10-02 15:06:39 +01001998 // It will need to be updated as well, if we swap out the tensorhandle
Finn Williamsb1aad422021-10-28 19:07:32 +01001999 else if (handleInfo.m_IsOutputLayerHandle)
Finn Williams8636bc72021-10-02 15:06:39 +01002000 {
2001 handleInfo.m_OutputMemDescriptorCoords.m_InputSlotCoords.push_back({layerIndex, slot.GetSlotIndex()});
2002 }
2003
2004 // Store the coordinates of the InputSlots connected to the InputLayer
2005 // There can be more than one InputSlot connected to an InputLayer, so we use a vector
Finn Williamsb1aad422021-10-28 19:07:32 +01002006 if (handleInfo.m_IsInputLayerHandle)
Finn Williams8636bc72021-10-02 15:06:39 +01002007 {
2008 std::pair<LayerGuid, unsigned int> connectionLocation{layerIndex, slot.GetSlotIndex()};
2009 handleInfo.m_InputMemDescriptorCoords.m_InputSlotCoords.emplace_back(connectionLocation);
Finn Williamsf37b9702021-09-01 18:06:04 +01002010 }
Mike Kelly55a8ffd2021-04-07 20:10:49 +01002011 }
        workingMemDescriptorMap.insert({layer->GetGuid(), workingMemDescriptor});

        // Input layers/workloads will not be executed, so their descriptors are not added to
        // workingMemDescriptors. However we will still need to manage the tensorHandle.
        if (!isInputLayer)
        {
            workingMemDescriptors.push_back(workingMemDescriptor);
            layerIndex++;
        }
    }

    std::vector<std::pair<std::shared_ptr<TensorMemory>, MemorySource>> tensorMemory;

    auto externalMemoryManager = CreateExternalMemoryManger(tensorMemory);

    // Sort tensorMemory so that its order matches the outputSlot order
    std::sort(tensorMemory.begin(), tensorMemory.end(),
              [](const std::pair<std::shared_ptr<TensorMemory>, MemorySource>& lhs,
                 const std::pair<std::shared_ptr<TensorMemory>, MemorySource>& rhs)
              {
                  return lhs.first->m_OutputSlotId < rhs.first->m_OutputSlotId;
              });

    std::vector<WorkingMemHandle::InputMemDescriptorCoords> inputConnectionsInfo;
    std::vector<WorkingMemHandle::OutputMemDescriptorCoords> outputConnectionsInfo;

    for (const auto& handleInfo : outputToHandleInfoMap)
    {
        if (handleInfo.second.m_IsOutputLayerHandle)
        {
            outputConnectionsInfo.emplace_back(handleInfo.second.m_OutputMemDescriptorCoords);
        }

        if (handleInfo.second.m_IsInputLayerHandle)
        {
            inputConnectionsInfo.emplace_back(handleInfo.second.m_InputMemDescriptorCoords);
        }
    }

    return std::make_unique<WorkingMemHandle>(networkId,
                                              inputConnectionsInfo,
                                              outputConnectionsInfo,
                                              workingMemDescriptors,
                                              workingMemDescriptorMap,
                                              std::move(externalMemoryManager),
                                              std::move(tensorMemory),
                                              std::move(managedTensorHandles),
                                              std::move(unmanagedTensorHandles));
}
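
// A hedged sketch of overlapped execution with per-thread working memory, as described in
// the comment above CreateWorkingMemHandle (error handling omitted; names illustrative):
//
//     auto RunInference = [&](const armnn::InputTensors& in, const armnn::OutputTensors& out)
//     {
//         // One handle per thread; a handle must not be shared between concurrent Executes.
//         std::unique_ptr<armnn::experimental::IWorkingMemHandle> handle =
//             runtime->CreateWorkingMemHandle(netId);
//         runtime->Execute(*handle, in, out);
//     };
//     std::thread t1(RunInference, inputsA, outputsA);
//     std::thread t2(RunInference, inputsB, outputsB);
//     t1.join();
//     t2.join();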

void LoadedNetwork::RegisterDebugCallback(const DebugCallbackFunction& func)
{
    for (auto&& workloadPtr : m_WorkloadQueue)
    {
        workloadPtr.get()->RegisterDebugCallback(func);
    }
}
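
// A hedged sketch of registering a debug callback through the public runtime API; the
// callback fires per intermediate tensor when the network was optimized with debug enabled
// (exact behaviour depends on the backends in use):
//
//     auto callback = [](armnn::LayerGuid guid, unsigned int slotIndex, armnn::ITensorHandle* tensor)
//     {
//         std::cout << "Layer " << guid << " slot " << slotIndex
//                   << " -> " << tensor->GetShape().GetNumElements() << " elements\n";
//     };
//     runtime->RegisterDebugCallback(netId, callback);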

void LoadedNetwork::CreateMemoryProfileAsync()
{
    struct PartialBlock
    {
        unsigned int m_StartOfLife;
        unsigned int m_Lifetime;

        size_t m_MemSize;
        unsigned int m_Index;

        BackendId m_BackendId;
    };

    auto align = [](size_t numToAlign)
    {
        const size_t alignment = sizeof(float);
        return ((numToAlign + alignment - 1) / alignment) * alignment;
    };

    std::unordered_map<const OutputSlot*, PartialBlock> memBlockTrackerMap;

    const bool inputImportingEnabled = m_NetworkProperties.m_InputSource != MemorySource::Undefined;
    const bool outputImportingEnabled = m_NetworkProperties.m_OutputSource != MemorySource::Undefined;

    unsigned int timestep = 0;
    unsigned int outputIndex = 0;
    Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();

    for (auto&& layer : order)
    {
        const LayerType& layerType = layer->GetType();
        // Don't manage memory if importing.
        if (layerType == LayerType::Input && inputImportingEnabled)
        {
            continue;
        }
        // Don't manage memory if importing.
        if (layerType == LayerType::Output && outputImportingEnabled
            && layer->GetInputSlot(0).GetConnectedOutputSlot()->GetNumConnections() == 1)
        {
            continue;
        }
        // Because constant layer memory cannot be shared, it must persist for the lifetime of execution;
        // its management is handled separately.
        if (layerType == LayerType::Constant)
        {
            continue;
        }

        BackendId backendId = layer->GetBackendId();
        for (auto& outputSlot : layer->GetOutputSlots())
        {
            if (!m_SupportsExternallyManagedMemory[backendId])
            {
                continue;
            }

            PartialBlock partialBlock;

            partialBlock.m_StartOfLife = timestep;

            size_t alignedSize = align(outputSlot.GetOutputHandler().GetTensorInfo().GetNumBytes());
            partialBlock.m_MemSize = alignedSize;
            partialBlock.m_Index = outputIndex++;
            partialBlock.m_Lifetime = outputSlot.GetNumConnections();
            partialBlock.m_BackendId = backendId;

            if (partialBlock.m_Lifetime == 0)
            {
                m_MemBlockMap[partialBlock.m_BackendId].emplace_back(partialBlock.m_StartOfLife,
                                                                     partialBlock.m_StartOfLife,
                                                                     partialBlock.m_MemSize,
                                                                     0,
                                                                     partialBlock.m_Index);
            }
            else
            {
                memBlockTrackerMap[&outputSlot] = partialBlock;
            }
        }

        for (auto& inputSlot : layer->GetInputSlots())
        {
            const Layer& connectedInputLayer = inputSlot.GetConnectedOutputSlot()->GetOwningLayer();
            const LayerType& owningLayerType = connectedInputLayer.GetType();

            if (owningLayerType == LayerType::Constant)
            {
                continue;
            }
            if (inputImportingEnabled && owningLayerType == LayerType::Input)
            {
                continue;
            }

            auto outputSlot = inputSlot.GetConnectedOutputSlot();

            PartialBlock& partialBlock = memBlockTrackerMap.at(outputSlot);

            auto& lifetime = partialBlock.m_Lifetime;
            --lifetime;

            if (lifetime == 0)
            {
                m_MemBlockMap[partialBlock.m_BackendId].emplace_back(partialBlock.m_StartOfLife,
                                                                     timestep,
                                                                     partialBlock.m_MemSize,
                                                                     0,
                                                                     partialBlock.m_Index);
            }
        }
        ++timestep;
    }
}

void LoadedNetwork::CreateMemoryProfile()
{
    // Finds the first TensorHandle ancestor of a SubTensorHandle. If the ITensorHandle provided
    // is a TensorHandle, the function just returns it.
    auto TraceSubTensorHandleAncestry = [](ITensorHandle* const subTensorHandle)
    {
        ITensorHandle* ancestor = subTensorHandle;
        while (ancestor && ancestor->GetParent())
        {
            ancestor = ancestor->GetParent();
        }
        return ancestor;
    };

    struct PartialBlock
    {
        unsigned int m_StartOfLife;
        unsigned int m_Lifetime;

        size_t m_MemSize;
        unsigned int m_Index;

        BackendId m_BackendId;
    };

    auto align = [](size_t numToAlign)
    {
        const size_t alignment = sizeof(float);
        return ((numToAlign + alignment - 1) / alignment) * alignment;
    };

    std::unordered_map<ITensorHandle*, PartialBlock> memBlockTrackerMap;

    const bool inputImportingEnabled = m_NetworkProperties.m_InputSource != MemorySource::Undefined;
    const bool outputImportingEnabled = m_NetworkProperties.m_OutputSource != MemorySource::Undefined;

    unsigned int timestep = 0;
    unsigned int outputIndex = 0;
    Graph& order = m_OptimizedNetwork->pOptimizedNetworkImpl->GetGraph().TopologicalSort();

    for (auto&& layer : order)
    {
        const LayerType& layerType = layer->GetType();
        // Don't manage memory if importing.
        if (layerType == LayerType::Input && inputImportingEnabled)
        {
            continue;
        }
        // Don't manage memory if importing.
        if (layerType == LayerType::Output && outputImportingEnabled
            && layer->GetInputSlot(0).GetConnectedOutputSlot()->GetNumConnections() == 1)
        {
            continue;
        }
        // Because constant layer memory cannot be shared, it must persist for the lifetime of execution;
        // its management is handled separately.
        if (layerType == LayerType::Constant)
        {
            continue;
        }

        BackendId backendId = layer->GetBackendId();
        for (auto& outputSlot : layer->GetOutputSlots())
        {
            if (!m_SupportsExternallyManagedMemory[backendId])
            {
                continue;
            }

            ITensorHandle* tensorHandle = outputSlot.GetOutputHandler().GetData();
            tensorHandle = TraceSubTensorHandleAncestry(tensorHandle);

            if (memBlockTrackerMap.find(tensorHandle) == memBlockTrackerMap.end())
            {
                PartialBlock partialBlock;

                partialBlock.m_StartOfLife = timestep;

                size_t alignedSize = align(outputSlot.GetOutputHandler().GetTensorInfo().GetNumBytes());
                partialBlock.m_MemSize = alignedSize;
                partialBlock.m_Index = outputIndex++;
                partialBlock.m_Lifetime = outputSlot.GetNumConnections();
                partialBlock.m_BackendId = backendId;

                if (partialBlock.m_Lifetime == 0)
                {
                    m_MemBlockMap[partialBlock.m_BackendId].emplace_back(partialBlock.m_StartOfLife,
                                                                         partialBlock.m_StartOfLife,
                                                                         partialBlock.m_MemSize,
                                                                         0,
                                                                         partialBlock.m_Index);
                }
                else
                {
                    memBlockTrackerMap[tensorHandle] = partialBlock;
                }
                m_Tensorhandles.push_back(tensorHandle);
            }
            else
            {
                memBlockTrackerMap.at(tensorHandle).m_Lifetime += outputSlot.GetNumConnections();
            }
        }

        for (auto& inputSlot : layer->GetInputSlots())
        {
            const Layer& connectedInputLayer = inputSlot.GetConnectedOutputSlot()->GetOwningLayer();
            const LayerType& owningLayerType = connectedInputLayer.GetType();

            if (owningLayerType == LayerType::Constant)
            {
                continue;
            }
            if (inputImportingEnabled && owningLayerType == LayerType::Input)
            {
                continue;
            }
            if (!m_SupportsExternallyManagedMemory[connectedInputLayer.GetBackendId()])
            {
                continue;
            }

            auto outputSlot = inputSlot.GetConnectedOutputSlot();

            ITensorHandle* tensorHandle = outputSlot->GetOutputHandler().GetData();
            tensorHandle = TraceSubTensorHandleAncestry(tensorHandle);

            PartialBlock& partialBlock = memBlockTrackerMap.at(tensorHandle);

            auto& lifetime = partialBlock.m_Lifetime;
            --lifetime;

            if (lifetime == 0)
            {
                m_MemBlockMap[partialBlock.m_BackendId].emplace_back(partialBlock.m_StartOfLife,
                                                                     timestep,
                                                                     partialBlock.m_MemSize,
                                                                     0,
                                                                     partialBlock.m_Index);
            }
        }
        ++timestep;
    }
}
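
// A worked sketch of the lifetime bookkeeping above (layer names are made up): for a
// chain A -> B -> C visited at timesteps 0, 1 and 2, A's output slot has one connection,
// so its block is born at timestep 0 and retired when B consumes it at timestep 1,
// producing a MemBlock spanning [0, 1]; B's output spans [1, 2]. Blocks whose lifetimes
// do not overlap can later be binned onto the same underlying allocation by the memory
// optimizer strategy, e.g. a block spanning [0, 1] and another spanning [2, 2] may share
// one buffer, while [1, 2] overlaps both and needs its own.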

std::unique_ptr<MemoryManager> LoadedNetwork::CreateExternalMemoryManger(
    std::vector<std::pair<std::shared_ptr<TensorMemory>, MemorySource>>& tensorMemoryVec)
{
    std::unique_ptr<MemoryManager> memoryManager = std::make_unique<MemoryManager>();
    auto allocatorMap = BackendRegistryInstance().GetAllocators();

    for (auto& backend : m_MemBinMap)
    {
        std::vector<BufferStorage> bufferStorageVec;

        std::shared_ptr<ICustomAllocator> backendAllocator;
        if (allocatorMap.find(backend.first) != allocatorMap.end())
        {
            backendAllocator = allocatorMap[backend.first];
        }
        else
        {
            backendAllocator = m_Backends[backend.first]->GetDefaultAllocator();
        }

        for (auto& memBin : backend.second)
        {
            BufferStorage bufferStorage;
            bufferStorage.m_BufferSize = memBin.m_MemSize;
            bufferStorage.m_TensorMemoryVector.reserve(memBin.m_MemBlocks.size());

            for (auto& memBlock : memBin.m_MemBlocks)
            {
                auto tensorMemory = std::make_shared<TensorMemory>(TensorMemory{memBlock.m_Offset, memBlock.m_Index});

                tensorMemoryVec.emplace_back(tensorMemory, backendAllocator->GetMemorySourceType());
                bufferStorage.m_TensorMemoryVector.emplace_back(tensorMemory);
            }

            bufferStorageVec.emplace_back(std::move(bufferStorage));
        }

        memoryManager->StoreMemToAllocate(bufferStorageVec, backendAllocator, 4);
    }

    return memoryManager;
}

LayerBindingId LoadedNetwork::ValidateImportedInputID(ImportedInputId id)
{
    try
    {
        const auto& importedTensorHandlePin = m_PreImportedInputHandles.at(id);
        if (!importedTensorHandlePin.m_TensorHandle)
        {
            throw InvalidArgumentException(fmt::format("LoadedNetwork::Execute: "
                                                       "PreImportedInput: {} has been deleted", id));
        }
        return importedTensorHandlePin.m_LayerBindingId;
    }
    catch (const std::out_of_range&)
    {
        throw InvalidArgumentException(fmt::format("LoadedNetwork::Execute: Unknown ImportedInputId: {}", id));
    }
}

LayerBindingId LoadedNetwork::ValidateImportedOutputID(ImportedOutputId id)
{
    try
    {
        const auto& importedTensorHandlePin = m_PreImportedOutputHandles.at(id);
        if (!importedTensorHandlePin.m_TensorHandle)
        {
            throw InvalidArgumentException(fmt::format("LoadedNetwork::Execute: "
                                                       "PreImportedOutput: {} has been deleted", id));
        }
        return importedTensorHandlePin.m_LayerBindingId;
    }
    catch (const std::out_of_range&)
    {
        throw InvalidArgumentException(fmt::format("LoadedNetwork::Execute: Unknown ImportedOutputId: {}", id));
    }
}

} // namespace armnn