//
// Copyright © 2021 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#pragma once

#include <ResolveType.hpp>

#include <armnn/IWorkingMemHandle.hpp>
#include <armnn/INetwork.hpp>
#include <armnn/Threadpool.hpp>
#include <armnn/IAsyncExecutionCallback.hpp>

#include <AsyncExecutionCallback.hpp>
#include <CommonTestUtils.hpp>

#include <doctest/doctest.h>

#include <map>
#include <memory>
#include <thread>
#include <vector>

namespace armnn
{

namespace experimental
{

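// Runs numberOfInferences executions of the given network concurrently: one
// std::thread and one IWorkingMemHandle per inference, each result compared
// against the corresponding expected output within the given tolerance.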
template<DataType ArmnnIType, DataType ArmnnOType,
         typename TInput = ResolveType<ArmnnIType>, typename TOutput = ResolveType<ArmnnOType>>
void AsyncThreadedEndToEndTestImpl(INetworkPtr network,
                                   const std::vector<std::map<int, std::vector<TInput>>>& inputTensorData,
                                   const std::vector<std::map<int, std::vector<TOutput>>>& expectedOutputData,
                                   std::vector<BackendId> backends,
                                   const size_t numberOfInferences,
                                   float tolerance = 0.000001f)
{
    // Create the runtime in which the test will run
    IRuntime::CreationOptions options;
    IRuntimePtr runtime(IRuntime::Create(options));

    // Optimize the network
    IOptimizedNetworkPtr optNet = Optimize(*network, backends, runtime->GetDeviceSpec());

    // Load the optimized network into the runtime
    NetworkId networkId = 0;
    std::string errorMessage;
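    // The leading 'true' is the asyncEnabled flag; both memory sources are left
    // Undefined, so no input/output memory import is used.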
    const INetworkProperties networkProperties(true, MemorySource::Undefined, MemorySource::Undefined);
    runtime->LoadNetwork(networkId, std::move(optNet), errorMessage, networkProperties);

    std::vector<InputTensors> inputTensorsVec;
    std::vector<OutputTensors> outputTensorsVec;
    std::vector<std::map<int, std::vector<TOutput>>> outputStorageVec;
    std::vector<std::unique_ptr<IWorkingMemHandle>> workingMemHandles;

    for (unsigned int i = 0; i < numberOfInferences; ++i)
    {
        InputTensors inputTensors;
        OutputTensors outputTensors;
        outputStorageVec.emplace_back(std::map<int, std::vector<TOutput>>());

        inputTensors.reserve(inputTensorData[i].size());
        for (auto&& it : inputTensorData[i])
        {
            TensorInfo inputTensorInfo = runtime->GetInputTensorInfo(networkId, it.first);
            inputTensorInfo.SetConstant(true);
            inputTensors.push_back({it.first,
                                    ConstTensor(inputTensorInfo, it.second.data())});
        }

        outputTensors.reserve(expectedOutputData[i].size());
        for (auto&& it : expectedOutputData[i])
        {
            std::vector<TOutput> out(it.second.size());
            outputStorageVec[i].emplace(it.first, out);
            outputTensors.push_back({it.first,
                                     Tensor(runtime->GetOutputTensorInfo(networkId, it.first),
                                            outputStorageVec[i].at(it.first).data())});
        }

        inputTensorsVec.push_back(inputTensors);
        outputTensorsVec.push_back(outputTensors);

        workingMemHandles.push_back(runtime->CreateWorkingMemHandle(networkId));
    }

    std::vector<std::thread> threads;
    for (unsigned int i = 0; i < numberOfInferences; ++i)
    {
        // Capture the loop index by value: capturing loop-local references with
        // [&] would leave each thread holding references whose lifetime ends
        // with the loop iteration.
        threads.emplace_back([&runtime, &inputTensorsVec, &outputTensorsVec, &workingMemHandles, i]()
        {
            // Run the async network
            runtime->Execute(*workingMemHandles[i], inputTensorsVec[i], outputTensorsVec[i]);
        });
    }

    for (unsigned int i = 0; i < numberOfInferences; ++i)
    {
        threads[i].join();
    }

    // Checks the results.
    for (unsigned int i = 0; i < numberOfInferences; ++i)
    {
        for (auto&& it : expectedOutputData[i])
        {
            std::vector<TOutput> out = outputStorageVec[i].at(it.first);
            for (unsigned int j = 0; j < out.size(); ++j)
            {
                CHECK(Compare<ArmnnOType>(it.second[j], out[j], tolerance) == true);
            }
        }
    }
}

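// Runs the given network asynchronously and checks the results against the
// expected data. With numThreads == 1 a single inference is executed directly
// on a working memory handle; with more threads, inferences are scheduled on a
// Threadpool and completion is observed through callbacks.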
template<DataType ArmnnIType, DataType ArmnnOType,
         typename TInput = ResolveType<ArmnnIType>, typename TOutput = ResolveType<ArmnnOType>>
void AsyncEndToEndTestImpl(INetworkPtr network,
                           const std::map<int, std::vector<TInput>>& inputTensorData,
                           const std::map<int, std::vector<TOutput>>& expectedOutputData,
                           std::vector<BackendId> backends,
                           float tolerance = 0.000001f,
                           size_t numThreads = 1)
{
    ARMNN_ASSERT(numThreads >= 1);
    const unsigned int numberOfInferences = numThreads == 1 ? 1 : 1000;
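    // One inference is enough to cover the single-threaded path; the Threadpool
    // path schedules a large batch so that its queueing and priority handling
    // are actually exercised.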

    // Create the runtime in which the test will run
    IRuntime::CreationOptions options;
    IRuntimePtr runtime(IRuntime::Create(options));

    // Optimize the network
    IOptimizedNetworkPtr optNet = Optimize(*network, backends, runtime->GetDeviceSpec());

    // Load the optimized network into the runtime
    NetworkId networkId = 0;
    std::string errorMessage;
    const INetworkProperties networkProperties(true, MemorySource::Undefined, MemorySource::Undefined);
    runtime->LoadNetwork(networkId, std::move(optNet), errorMessage, networkProperties);

    InputTensors inputTensors;
    inputTensors.reserve(inputTensorData.size());
    for (auto&& it : inputTensorData)
    {
        TensorInfo inputTensorInfo = runtime->GetInputTensorInfo(networkId, it.first);
        inputTensorInfo.SetConstant(true);
        inputTensors.push_back({it.first,
                                ConstTensor(inputTensorInfo, it.second.data())});
    }

    std::vector<OutputTensors> outputTensorsVec;
    std::vector<std::map<int, std::vector<TOutput>>> outputStorageVec;

    outputTensorsVec.reserve(numberOfInferences);
    outputStorageVec.reserve(numberOfInferences);
    for (unsigned int i = 0; i < numberOfInferences; ++i)
    {
        OutputTensors outputTensors;
        outputStorageVec.emplace_back(std::map<int, std::vector<TOutput>>());

        outputTensors.reserve(expectedOutputData.size());
        for (auto&& it : expectedOutputData)
        {
            std::vector<TOutput> out(it.second.size());
            outputStorageVec[i].emplace(it.first, out);
            outputTensors.push_back({it.first,
                                     Tensor(runtime->GetOutputTensorInfo(networkId, it.first),
                                            outputStorageVec[i].at(it.first).data())});
        }

        outputTensorsVec.push_back(outputTensors);
    }

    if (numThreads == 1)
    {
        // Create WorkingMemHandle for this async network
        std::unique_ptr<IWorkingMemHandle> workingMemHandle = runtime->CreateWorkingMemHandle(networkId);
        IWorkingMemHandle& workingMemHandleRef = *workingMemHandle.get();

        // Run the async network
        runtime->Execute(workingMemHandleRef, inputTensors, outputTensorsVec[0]);
    }
    else
    {
        std::vector<std::shared_ptr<IWorkingMemHandle>> memHandles;

        for (size_t i = 0; i < numThreads; ++i)
        {
            memHandles.emplace_back(runtime->CreateWorkingMemHandle(networkId));
        }

        Threadpool threadpool(numThreads, runtime.get(), memHandles);
        AsyncCallbackManager callbackManager;

        // For asynchronous execution the LoadedNetwork is given a pool of working
        // memory handles (one per thread); each scheduled inference is assigned a
        // random priority.
        for (size_t i = 0; i < numberOfInferences; ++i)
        {
            threadpool.Schedule(networkId,
                                inputTensors,
                                outputTensorsVec[i],
                                static_cast<QosExecPriority>(rand() % 3),
                                callbackManager.GetNewCallback());
        }

        // Wait for each inference to signal completion via its callback
        for (size_t i = 0; i < numberOfInferences; ++i)
        {
            auto cb = callbackManager.GetNotifiedCallback();

            // Check that the inference completed successfully; the actual output
            // values are compared below.
            CHECK(cb->GetStatus() == Status::Success);
        }
    }

    for (auto&& outputStorage : outputStorageVec)
    {
        for (auto&& it : expectedOutputData)
        {
            std::vector<TOutput> out = outputStorage.at(it.first);

            for (unsigned int i = 0; i < out.size(); ++i)
            {
                CHECK(it.second[i] == doctest::Approx(out[i]).epsilon(tolerance));
            }
        }
    }
}

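// Builds a minimal network consisting of a single StridedSlice layer between
// an input and an output layer, configured from the given slice parameters.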
template<typename armnn::DataType DataType>
INetworkPtr CreateStridedSliceNetwork(const TensorShape& inputShape,
                                      const TensorShape& outputShape,
                                      const std::vector<int>& beginData,
                                      const std::vector<int>& endData,
                                      const std::vector<int>& stridesData,
                                      int beginMask = 0,
                                      int endMask = 0,
                                      int shrinkAxisMask = 0,
                                      int ellipsisMask = 0,
                                      int newAxisMask = 0,
                                      const float qScale = 1.0f,
                                      const int32_t qOffset = 0)
{
    using namespace armnn;
    // Builds up the structure of the network.
    INetworkPtr net(INetwork::Create());

    TensorInfo inputTensorInfo(inputShape, DataType, qScale, qOffset);
    TensorInfo outputTensorInfo(outputShape, DataType, qScale, qOffset);

    StridedSliceDescriptor stridedSliceDescriptor;
    stridedSliceDescriptor.m_Begin = beginData;
    stridedSliceDescriptor.m_End = endData;
    stridedSliceDescriptor.m_Stride = stridesData;
    stridedSliceDescriptor.m_BeginMask = beginMask;
    stridedSliceDescriptor.m_EndMask = endMask;
    stridedSliceDescriptor.m_ShrinkAxisMask = shrinkAxisMask;
    stridedSliceDescriptor.m_EllipsisMask = ellipsisMask;
    stridedSliceDescriptor.m_NewAxisMask = newAxisMask;

    IConnectableLayer* input = net->AddInputLayer(0, "Input_Layer");
    IConnectableLayer* stridedSlice = net->AddStridedSliceLayer(stridedSliceDescriptor, "stridedSlice");
    IConnectableLayer* output = net->AddOutputLayer(0);

    Connect(input, stridedSlice, inputTensorInfo, 0, 0);
    Connect(stridedSlice, output, outputTensorInfo, 0, 0);

    return net;
}

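// End-to-end StridedSlice test run through AsyncEndToEndTestImpl; numThreads
// selects between direct asynchronous execution and the Threadpool path.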
template<armnn::DataType ArmnnType>
void StridedSlicedEndToEndTest(const std::vector<BackendId>& backends, size_t numThreads)
{
    using namespace armnn;
    using T = ResolveType<ArmnnType>;

    const TensorShape& inputShape = {3, 2, 3, 1};
    const TensorShape& outputShape = {1, 2, 3, 1};
    const std::vector<int>& beginData = {1, 0, 0, 0};
    const std::vector<int>& endData = {2, 2, 3, 1};
    const std::vector<int>& stridesData = {1, 1, 1, 1};
    int beginMask = 0;
    int endMask = 0;
    int shrinkAxisMask = 0;
    int ellipsisMask = 0;
    int newAxisMask = 0;

    // Builds up the structure of the network
    INetworkPtr net = CreateStridedSliceNetwork<ArmnnType>(inputShape,
                                                           outputShape,
                                                           beginData,
                                                           endData,
                                                           stridesData,
                                                           beginMask,
                                                           endMask,
                                                           shrinkAxisMask,
                                                           ellipsisMask,
                                                           newAxisMask);

    CHECK(net);

    // Creates structures for input & output.
    std::vector<T> inputData{
        1.0f, 1.0f, 1.0f, 2.0f, 2.0f, 2.0f,

        3.0f, 3.0f, 3.0f, 4.0f, 4.0f, 4.0f,

        5.0f, 5.0f, 5.0f, 6.0f, 6.0f, 6.0f
    };

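    // With begin = {1, 0, 0, 0}, end = {2, 2, 3, 1} and unit strides, the slice
    // keeps input[1:2, 0:2, 0:3, 0:1], i.e. the middle 2x3x1 block above.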
    std::vector<T> outputExpected{
        3.0f, 3.0f, 3.0f, 4.0f, 4.0f, 4.0f
    };

    std::map<int, std::vector<T>> inputTensorData = {{0, inputData}};
    std::map<int, std::vector<T>> expectedOutputData = {{0, outputExpected}};

    AsyncEndToEndTestImpl<ArmnnType, ArmnnType>(std::move(net),
                                                inputTensorData,
                                                expectedOutputData,
                                                backends,
                                                0.000001f,
                                                numThreads);
}

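// End-to-end StridedSlice test that runs two different inferences concurrently
// through AsyncThreadedEndToEndTestImpl, one thread per inference.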
template<armnn::DataType ArmnnType>
void StridedSlicedMultiThreadedEndToEndTest(const std::vector<BackendId>& backends)
{
    using namespace armnn;
    using T = ResolveType<ArmnnType>;

    const TensorShape& inputShape = {3, 2, 3, 1};
    const TensorShape& outputShape = {1, 2, 3, 1};
    const std::vector<int>& beginData = {1, 0, 0, 0};
    const std::vector<int>& endData = {2, 2, 3, 1};
    const std::vector<int>& stridesData = {1, 1, 1, 1};
    int beginMask = 0;
    int endMask = 0;
    int shrinkAxisMask = 0;
    int ellipsisMask = 0;
    int newAxisMask = 0;

    // Builds up the structure of the network
    INetworkPtr net = CreateStridedSliceNetwork<ArmnnType>(inputShape,
                                                           outputShape,
                                                           beginData,
                                                           endData,
                                                           stridesData,
                                                           beginMask,
                                                           endMask,
                                                           shrinkAxisMask,
                                                           ellipsisMask,
                                                           newAxisMask);

    CHECK(net);

    // Creates structures for the first input & output.
    std::vector<T> inputData1{
        1.0f, 1.0f, 1.0f, 2.0f, 2.0f, 2.0f,

        3.0f, 3.0f, 3.0f, 4.0f, 4.0f, 4.0f,

        5.0f, 5.0f, 5.0f, 6.0f, 6.0f, 6.0f
    };

    std::vector<T> outputExpected1{ 3.0f, 3.0f, 3.0f, 4.0f, 4.0f, 4.0f };

    // Creates structures for a second, different input & output.
    std::vector<T> inputData2{
        1.0f, 1.0f, 1.0f, 2.0f, 2.0f, 2.0f,

        8.0f, 8.0f, 8.0f, 7.0f, 7.0f, 7.0f,

        5.0f, 5.0f, 5.0f, 6.0f, 6.0f, 6.0f
    };

    std::vector<T> outputExpected2{ 8.0f, 8.0f, 8.0f, 7.0f, 7.0f, 7.0f };

    std::vector<std::map<int, std::vector<T>>> inputTensors;
    std::vector<std::map<int, std::vector<T>>> outputTensors;

    inputTensors.push_back(std::map<int, std::vector<T>> {{0, inputData1}});
    inputTensors.push_back(std::map<int, std::vector<T>> {{0, inputData2}});
    outputTensors.push_back(std::map<int, std::vector<T>> {{0, outputExpected1}});
    outputTensors.push_back(std::map<int, std::vector<T>> {{0, outputExpected2}});

    AsyncThreadedEndToEndTestImpl<ArmnnType, ArmnnType>(std::move(net), inputTensors, outputTensors, backends, 2);
}

} // experimental namespace

} // armnn namespace
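// A minimal usage sketch (illustrative only; the suite/case names and backend
// choice are assumptions, not part of this header):
//
//     TEST_SUITE("AsyncExecutionTests")
//     {
//         TEST_CASE("StridedSlicedEndToEndCpuRef")
//         {
//             armnn::experimental::StridedSlicedEndToEndTest<armnn::DataType::Float32>(
//                 {armnn::Compute::CpuRef}, 1);
//         }
//     }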