blob: 962542400e4550bf89e0684bd40026edfb6d6932 [file] [log] [blame]
Gunes Bayir8918b232023-03-17 13:52:21 +00001/*
2 * Copyright (c) 2023 Arm Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24
25#include "arm_compute/runtime/CL/CLTensor.h"
26#include "src/gpu/cl/kernels/ClNativeMatMulKernel.h"
27#include "tests/datasets/LargeMatMulDataset.h"
28#include "tests/datasets/SmallMatMulDataset.h"
29#include "tests/framework/Macros.h"
30#include "tests/framework/datasets/Datasets.h"
31#include "tests/validation/Validation.h"
32#include "tests/validation/fixtures/MatMulKernelFixture.h"
33#include "tests/validation/reference/Permute.h"
34
35#include <tuple>
36
37namespace arm_compute
38{
39namespace test
40{
41namespace validation
42{
43namespace
44{
45RelativeTolerance<float> tolerance_f32(0.001f); /**< Tolerance value for comparing reference's output against implementation's output for floating point data types */
46constexpr float abs_tolerance_f32(
47 0.0001f); /**< Absolute tolerance value for comparing reference's output against implementation's output for floating point data types in case using relative tolerance fails because of small values */
48constexpr float abs_tolerance_f16(
49 0.001f); /**< Absolute tolerance value for comparing reference's output against implementation's output for fp16 data types in case using relative tolerance fails because of small values */
50RelativeTolerance<half_float::half> tolerance_f16(half(0.01)); /**< Tolerance value for comparing reference's output against implementation's output for floating point data types */
51} // namespace
52
53/** M0 values to test --precommit*/
54const auto m0_values_precommit = framework::dataset::make("M0", { 1, 3 });
55
56/** N0 values to test --precommit*/
57const auto n0_values_precommit = framework::dataset::make("N0", { 2, 4 });
58
59/** K0 values to test --precommit*/
60const auto k0_values_precommit = framework::dataset::make("K0", { 2, 3 });
61
62/** M0 values to test --nightly*/
63const auto m0_values_nightly_lhs_nt = framework::dataset::make("M0", { 1, 2, 3, 4, 5, 6, 7, 8 });
64const auto m0_values_nightly_lhs_t = framework::dataset::make("M0", { 1, 2, 3, 4, 8 });
65
66/** N0 values to test --nightly*/
67const auto n0_values_nightly_rhs_nt = framework::dataset::make("N0", { 1, 2, 3, 4, 8, 16 });
68const auto n0_values_nightly_rhs_t = framework::dataset::make("N0", { 1, 2, 3, 4, 8 });
69
70/** K0 values to test --nightly*/
71const auto k0_values_nightly_lhs_nt_rhs_nt = framework::dataset::make("K0", { 1, 2, 3, 4, 8, 16 });
72const auto k0_values_nightly_rhs_t = framework::dataset::make("K0", { 1, 2, 3, 4, 8 });
73const auto k0_values_nightly_lhs_t_rhs_nt = framework::dataset::make("K0", { 1, 2, 3, 4, 5, 6, 7, 8 });
74
75template <typename T>
76using CLMatMulKernelFixture = MatMulKernelValidationFixture<T>;
77
TEST_SUITE(CL)
TEST_SUITE(MatMulKernel)
TEST_SUITE(Validate)

/** Checks that ClNativeMatMulKernel::validate() accepts or rejects M0/N0/K0 block-size
 * combinations as expected for each Lhs/Rhs transposition mode, including the stricter
 * constraints that apply when the Rhs tensor is exported to a CL image.
 */
TEST_CASE(SupportedBlockSizes, framework::DatasetMode::ALL)
{
    // Pairs a kernel configuration with the verdict validate() is expected to return
    using MatMulConfigurationPair = std::pair<MatMulKernelInfo, bool>;

    const std::vector<MatMulConfigurationPair> supported_block_sizes =
    {
        // MatMulKernelInfo(adj_lhs, adj_rhs, M0, N0, K0, export_rhs_to_cl_image = false)
        // Lhs not-transposed, Rhs-not-transposed
        { MatMulKernelInfo(false, false, 0, 1, 1), false },  // M0 should be > 0
        { MatMulKernelInfo(false, false, 3, 5, 1), false },  // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, false, 3, 6, 1), false },  // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, false, 3, 3, 17), false }, // K0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, false, 3, 3, 7), false },  // K0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, false, 9, 1, 2), true },
        { MatMulKernelInfo(false, false, 3, 16, 3), true },
        { MatMulKernelInfo(false, false, 7, 3, 4), true },
        // With export_rhs_to_cl_image == true, N0 is further restricted to {4, 8, 16}
        { MatMulKernelInfo(false, false, 7, 3, 4, true), false },  // N0 not in {4, 8, 16}
        { MatMulKernelInfo(false, false, 7, 1, 4, true), false },  // N0 not in {4, 8, 16}
        { MatMulKernelInfo(false, false, 7, 12, 4, true), false }, // N0 not in {4, 8, 16}
        { MatMulKernelInfo(false, false, 7, 4, 4, true), true },
        { MatMulKernelInfo(false, false, 7, 8, 4, true), true },
        { MatMulKernelInfo(false, false, 7, 16, 4, true), true },

        // Lhs not-transposed, Rhs transposed
        { MatMulKernelInfo(false, true, 0, 1, 1), false },  // M0 should be > 0
        { MatMulKernelInfo(false, true, 3, 11, 1), false }, // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, true, 3, 7, 1), false },  // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, true, 3, 3, 12), false }, // K0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, true, 3, 3, 6), false },  // K0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(false, true, 5, 1, 2), true },
        { MatMulKernelInfo(false, true, 3, 3, 3), true },
        { MatMulKernelInfo(false, true, 2, 4, 8), true },
        // With export_rhs_to_cl_image == true and Rhs transposed, K0 is restricted to {4, 8, 16}
        { MatMulKernelInfo(false, true, 2, 4, 5, true), false }, // K0 not in {4, 8, 16}
        { MatMulKernelInfo(false, true, 2, 4, 9, true), false }, // K0 not in {4, 8, 16}
        { MatMulKernelInfo(false, true, 2, 4, 3, true), false }, // K0 not in {4, 8, 16}
        { MatMulKernelInfo(false, true, 2, 4, 4, true), true },
        { MatMulKernelInfo(false, true, 2, 4, 8, true), true },
        { MatMulKernelInfo(false, true, 2, 8, 16, true), true },

        // Lhs transposed, Rhs-not-transposed
        { MatMulKernelInfo(true, false, 1, 1, 0), false },  // K0 should be > 0
        { MatMulKernelInfo(true, false, 3, 11, 1), false }, // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, false, 3, 7, 1), false },  // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, false, 6, 3, 12), false }, // M0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, false, 5, 3, 6), false },  // M0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, false, 4, 1, 22), true },
        { MatMulKernelInfo(true, false, 3, 3, 3), true },
        { MatMulKernelInfo(true, false, 2, 4, 8), true },
        // With export_rhs_to_cl_image == true, N0 is restricted to {4, 8, 16}
        { MatMulKernelInfo(true, false, 2, 3, 8, true), false }, // N0 not in {4, 8, 16}
        { MatMulKernelInfo(true, false, 2, 7, 8, true), false }, // N0 not in {4, 8, 16}
        { MatMulKernelInfo(true, false, 2, 5, 8, true), false }, // N0 not in {4, 8, 16}
        { MatMulKernelInfo(true, false, 2, 4, 8, true), true },
        { MatMulKernelInfo(true, false, 2, 8, 8, true), true },
        { MatMulKernelInfo(true, false, 2, 16, 8, true), true },

        // Lhs transposed, Rhs-transposed
        { MatMulKernelInfo(true, true, 2, 1, 5), false },  // K0 should in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, true, 1, 8, 7), false },  // K0 should in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, true, 3, 11, 1), false }, // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, true, 3, 7, 1), false },  // N0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, true, 6, 3, 12), false }, // M0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, true, 5, 3, 6), false },  // M0 not in {1, 2, 3, 4, 8, 16}
        { MatMulKernelInfo(true, true, 4, 8, 16), true },
        { MatMulKernelInfo(true, true, 3, 3, 4), true },
        { MatMulKernelInfo(true, true, 16, 4, 8), true },
        // With export_rhs_to_cl_image == true and Rhs transposed, K0 is restricted to {4, 8, 16}
        { MatMulKernelInfo(true, true, 2, 2, 1, true), false }, // K0 not in {4, 8, 16}
        { MatMulKernelInfo(true, true, 2, 2, 5, true), false }, // K0 not in {4, 8, 16}
        { MatMulKernelInfo(true, true, 2, 4, 7, true), false }, // K0 not in {4, 8, 16}
        { MatMulKernelInfo(true, true, 2, 4, 4, true), true },
        { MatMulKernelInfo(true, true, 2, 8, 8, true), true },
        { MatMulKernelInfo(true, true, 2, 8, 16, true), true },
    };

    // Set big enough shapes so that block sizes are not truncated. Also, set all dimensions equal
    // so that it doesn't fail for different NT/T configurations. We aim to test the block sizes here,
    // not the shapes themselves.
    const TensorInfo lhs_info = TensorInfo(TensorShape(100U, 100U), 1, DataType::F32);
    const TensorInfo rhs_info = TensorInfo(TensorShape(100U, 100U), 1, DataType::F32);

    const bool export_to_cl_image_supported = image2d_from_buffer_supported(CLKernelLibrary::get().get_device());
    for(auto &pair : supported_block_sizes)
    {
        TensorInfo output_info;
        Status     status = ClNativeMatMulKernel::validate(&lhs_info, &rhs_info, &output_info, pair.first);

        // Expected verdicts for export_rhs_to_cl_image == true assume the device supports
        // importing images from buffers; skip the check on devices that do not.
        if(!pair.first.export_rhs_to_cl_image || export_to_cl_image_supported)
        {
            ARM_COMPUTE_EXPECT(bool(status) == pair.second, framework::LogLevel::ERRORS);
        }
    }
}
173
/** Checks validate() verdicts for export_rhs_to_cl_image against tensor-shape limits:
 * the Rhs dimension mapped onto the image (N when Rhs is not transposed, K when it is)
 * must be a multiple of 4, and the Rhs tensor must fit within the device's maximum
 * CL image width/height. Skipped entirely on devices without CL image support.
 */
TEST_CASE(ExportToCLImage, framework::DatasetMode::ALL)
{
    // We skip this test if the hardware does not support exporting to CL Image
    if(image2d_from_buffer_supported(CLKernelLibrary::get().get_device()))
    {
        // One image pixel holds 4 elements, so the tensor-width limit is 4x the image width limit
        constexpr size_t pixel_size  = 4;
        const size_t     max_image_w = pixel_size * CLKernelLibrary::get().get_device().getInfo<CL_DEVICE_IMAGE2D_MAX_WIDTH>();
        const size_t     max_image_h = CLKernelLibrary::get().get_device().getInfo<CL_DEVICE_IMAGE2D_MAX_HEIGHT>();

        using ShapeConfigurationTuple = std::tuple<TensorShape, TensorShape, bool, bool, bool>;
        const std::vector<ShapeConfigurationTuple> shape_configurations =
        {
            // lhs_shape, rhs_shape, adj_lhs, adj_rhs, expected
            // Lhs t/Nt, Rhs Nt
            // Transposition of Lhs doesn't add any value to the tests, therefore always assumed false below
            { TensorShape(5U, 1U), TensorShape(3U, 5U), false, false, false },  // N should be multiple of 4
            { TensorShape(5U, 1U), TensorShape(14U, 5U), false, false, false }, // N should be multiple of 4
            { TensorShape(5U, 1U), TensorShape(12U, 5U), false, false, true },
            { TensorShape(5U, 1U), TensorShape(8U, 5U), false, false, true },
            { TensorShape(5U, 1U), TensorShape(4U, 5U), false, false, true },
            { TensorShape(max_image_h + 1, 1U), TensorShape(4U, max_image_h + 1), false, false, false }, // Cannot fit into CL Image memory's height
            { TensorShape(5U, 1U), TensorShape(max_image_w + 1, 5U), false, false, false },              // Cannot fit into CL Image memory's width
            { TensorShape(max_image_h, 1U), TensorShape(4U, max_image_h), false, false, true },          // Barely fits into CL Image memory's height
            { TensorShape(5U, 1U), TensorShape(max_image_w, 5U), false, false, true },                   // Barely fits into CL Image memory's width

            // Lhs Nt/T , Rhs T
            { TensorShape(5U, 1U), TensorShape(5U, 3U), false, true, false },  // K should be multiple of 4
            { TensorShape(5U, 1U), TensorShape(5U, 14U), false, true, false }, // K should be multiple of 4
            { TensorShape(4U, 1U), TensorShape(4U, 10U), false, true, true },
            { TensorShape(8U, 1U), TensorShape(8U, 9U), false, true, true },
            { TensorShape(12U, 1U), TensorShape(12U, 6U), false, true, true },
        };

        for(auto &tuple : shape_configurations)
        {
            TensorShape lhs_shape = std::get<0>(tuple);
            TensorShape rhs_shape = std::get<1>(tuple);

            const TensorInfo lhs_info = TensorInfo(lhs_shape, 1, DataType::F32);
            const TensorInfo rhs_info = TensorInfo(rhs_shape, 1, DataType::F32);

            const bool adj_lhs = std::get<2>(tuple);
            const bool adj_rhs = std::get<3>(tuple);

            // We choose M0, N0, K0 equal to 4 so that they're always valid for CLImage in any combination
            const MatMulKernelInfo matmul_kernel_info {adj_lhs, adj_rhs, 4, 4, 4, true /* export_rhs_to_cl_image */};

            TensorInfo output_info;
            Status     status = ClNativeMatMulKernel::validate(&lhs_info, &rhs_info, &output_info, matmul_kernel_info);

            const bool expected = std::get<4>(tuple);
            ARM_COMPUTE_EXPECT(bool(status) == expected, framework::LogLevel::ERRORS);
        }
    }
}
229
230TEST_CASE(ValidateInputShapes, framework::DatasetMode::ALL)
231{
232 // Configurations are assumed to be Nt/Nt, but will be transposed inside the test to test other configurations
233 using ShapeConfigurationTuple = std::tuple<TensorShape, TensorShape, bool>;
234 const std::vector<ShapeConfigurationTuple> shape_configurations =
235 {
236 { TensorShape(5U, 1U), TensorShape(3U, 5U), true },
237 { TensorShape(10U, 12U), TensorShape(3U, 10U), true },
238 { TensorShape(8U, 4U), TensorShape(2U, 8U), true },
239 { TensorShape(8U, 4U), TensorShape(2U, 5U), false }, // Mismatch in the K dimension
240 { TensorShape(5U, 0U), TensorShape(2U, 5U), false }, // Invalid dimension
241 { TensorShape(5U, 4U, 3U, 4U, 5U, 6U), TensorShape(2U, 5U, 3U, 4U, 5U, 6U), true },
242 { TensorShape(5U, 4U, 3U, 4U, 5U, 1U), TensorShape(2U, 5U, 3U, 4U, 5U, 6U), false }, // no batch broadcasting
243 { TensorShape(5U, 4U, 3U, 4U, 9U, 6U), TensorShape(2U, 5U, 3U, 4U, 5U, 6U), false }, // mismatch in batch dimension
244 };
245
246 for(auto &tuple : shape_configurations)
247 {
248 const bool expected = std::get<2>(tuple);
249
250 for(bool adj_lhs :
251 {
252 false, true
253 })
254 {
255 for(bool adj_rhs :
256 {
257 false, true
258 })
259 {
260 TensorShape lhs_shape = std::get<0>(tuple);
261 TensorShape rhs_shape = std::get<1>(tuple);
262
263 if(adj_lhs)
264 {
265 permute(lhs_shape, PermutationVector(1U, 0U));
266 }
267
268 if(adj_rhs)
269 {
270 permute(rhs_shape, PermutationVector(1U, 0U));
271 }
272
273 const TensorInfo lhs_info = TensorInfo(lhs_shape, 1, DataType::F32);
274 const TensorInfo rhs_info = TensorInfo(rhs_shape, 1, DataType::F32);
275 TensorInfo output_info;
276
277 MatMulKernelInfo matmul_kernel_info{ adj_lhs, adj_rhs, 1, 1, 1, false /* export_rhs_to_cl_image */ };
278
279 Status status = ClNativeMatMulKernel::validate(&lhs_info, &rhs_info, &output_info, matmul_kernel_info);
280 ARM_COMPUTE_EXPECT(bool(status) == expected, framework::LogLevel::ERRORS);
281 }
282 }
283 }
284}
285
286TEST_CASE(ValidateDataTypes, framework::DatasetMode::ALL)
287{
288 // Configurations are assumed to be Nt/Nt, but will be transposed inside the test to test other configurations
289 using DataTypeConfigurationTuple = std::tuple<DataType, DataType, DataType, bool>;
290 const std::vector<DataTypeConfigurationTuple> data_type_configurations =
291 {
292 { DataType::F32, DataType::F32, DataType::F32, true },
293 { DataType::F16, DataType::F16, DataType::F16, true },
294 { DataType::F16, DataType::F32, DataType::F32, false }, // no mixed precision
295 { DataType::F64, DataType::F64, DataType::F64, false }, // no double precision
296 { DataType::QASYMM8, DataType::QASYMM8, DataType::QASYMM8, false }, // no quantized types
297 { DataType::QASYMM8_SIGNED, DataType::QASYMM8_SIGNED, DataType::QASYMM8_SIGNED, false }, // no quantized types
298 { DataType::QSYMM8_PER_CHANNEL, DataType::QSYMM8_PER_CHANNEL, DataType::QSYMM8_PER_CHANNEL, false }, // no quantized types
299 { DataType::QASYMM16, DataType::QASYMM16, DataType::QASYMM16, false }, // no quantized types
300 { DataType::QSYMM16, DataType::QSYMM16, DataType::QSYMM16, false }, // no quantized types
301 { DataType::QSYMM8, DataType::QSYMM8, DataType::QSYMM8, false }, // no quantized types
302 { DataType::S64, DataType::S64, DataType::S64, false }, // no integral types
303 { DataType::S32, DataType::S32, DataType::S32, false }, // no integral types
304 { DataType::S16, DataType::S16, DataType::S16, false }, // no integral types
305 { DataType::S8, DataType::S8, DataType::S8, false }, // no integral types
306 { DataType::U64, DataType::U64, DataType::U64, false }, // no integral types
307 { DataType::U32, DataType::U32, DataType::U32, false }, // no integral types
308 { DataType::U16, DataType::U16, DataType::U16, false }, // no integral types
309 { DataType::U8, DataType::U8, DataType::U8, false }, // no integral types
310 };
311
312 const TensorShape shape = TensorShape(10U, 10U);
313 const MatMulKernelInfo matmul_kernel_info{ false, false, 1, 1, 1, false };
314 for(auto &tuple : data_type_configurations)
315 {
316 const bool expected = std::get<3>(tuple);
317
318 const TensorInfo lhs_info(shape, 1, std::get<0>(tuple));
319 const TensorInfo rhs_info(shape, 1, std::get<1>(tuple));
320 TensorInfo output_info(shape, 1, std::get<2>(tuple));
321
322 Status status = ClNativeMatMulKernel::validate(&lhs_info, &rhs_info, &output_info, matmul_kernel_info);
323 ARM_COMPUTE_EXPECT(bool(status) == expected, framework::LogLevel::ERRORS);
324 }
325}
326
TEST_SUITE_END() // Validate

TEST_SUITE(Float)
TEST_SUITE(FP32)
TEST_SUITE(Buffer)
// NOTE(review): "pretransose_A"/"pretransose_B" misspell "pretranspose". They are
// dataset labels consumed by the fixture, so they are kept as-is for consistency
// with the rest of the file; fixing them would have to be done file-wide.
// NOTE(review): TinyMatMulDataset / HighDimensionalMatMulDataset are presumably
// provided transitively by the MatMul dataset headers included above — TODO confirm.
// Precommit run over tiny shapes with all four transposition combinations
FIXTURE_DATA_TEST_CASE(RunTiny, CLMatMulKernelFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::TinyMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false, true })),
                                                                       framework::dataset::make("pretransose_B", { false, true })),
                                                               m0_values_precommit),
                                                       n0_values_precommit),
                                               k0_values_precommit),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
}
// Precommit run over small shapes with all four transposition combinations
FIXTURE_DATA_TEST_CASE(RunSmall, CLMatMulKernelFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::SmallMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false, true })),
                                                                       framework::dataset::make("pretransose_B", { false, true })),
                                                               m0_values_precommit),
                                                       n0_values_precommit),
                                               k0_values_precommit),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
}
// Nightly runs split per transposition combination so each uses the block sizes valid for it
FIXTURE_DATA_TEST_CASE(RunLargeNoTranspose, CLMatMulKernelFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               m0_values_nightly_lhs_nt),
                                                       n0_values_nightly_rhs_nt),
                                               k0_values_nightly_lhs_nt_rhs_nt),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32)
;
}
FIXTURE_DATA_TEST_CASE(RunLargeRhsTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               m0_values_nightly_lhs_nt),
                                                       n0_values_nightly_rhs_t),
                                               k0_values_nightly_rhs_t),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
}
FIXTURE_DATA_TEST_CASE(RunLargeLhsTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { true })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               m0_values_nightly_lhs_t),
                                                       n0_values_nightly_rhs_nt),
                                               k0_values_nightly_lhs_t_rhs_nt),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
}
FIXTURE_DATA_TEST_CASE(RunLargeLhsTransposedRhsTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { true })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               m0_values_nightly_lhs_t),
                                                       n0_values_nightly_rhs_t),
                                               k0_values_nightly_rhs_t),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
}
// Running High Dimensional test is enough for FP32, because we're stressing the number of dimensions, not data type or M0/N0/K0
// It's a good idea to test for each Lhs/Rhs T/NT combinations because they're different CL kernels
FIXTURE_DATA_TEST_CASE(RunHighDimensional, CLMatMulKernelFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::HighDimensionalMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false, true })),
                                                                       framework::dataset::make("pretransose_B", { false, true })),
                                                               framework::dataset::make("M0", { 2 })),
                                                       framework::dataset::make("N0", { 2 })),
                                               framework::dataset::make("K0", { 2 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
}
TEST_SUITE_END() // Buffer
420
TEST_SUITE(ExportRhsToCLImage)
// These runs use the CL-image datasets and restrict N0 (Rhs Nt) or K0 (Rhs T) to the
// values validate() accepts for export_rhs_to_cl_image == true. Output is only
// validated when the device supports CL images; on other devices the fixture flag
// _device_supports_export_to_cl_image skips the check.
FIXTURE_DATA_TEST_CASE(RunSmallRhsNotTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::SmallMatMulDatasetRhsExportToCLImageRhsNT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               framework::dataset::make("M0", { 2 })),
                                                       framework::dataset::make("N0", { 4, 8, 16 })),
                                               framework::dataset::make("K0", { 2, 4 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
    }
}
FIXTURE_DATA_TEST_CASE(RunLargeRhsNotTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDatasetRhsExportToCLImageRhsNT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               framework::dataset::make("M0", { 2 })), // Choices of M0 does not matter much because it's related to Lhs tensor
                                                       framework::dataset::make("N0", { 4, 8, 16 })),
                                               framework::dataset::make("K0", { 1, 2, 3, 4 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
    }
}
FIXTURE_DATA_TEST_CASE(RunSmallRhsTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::SmallMatMulDatasetRhsExportToCLImageRhsT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               framework::dataset::make("M0", { 2 })),
                                                       framework::dataset::make("N0", { 2, 4 })),
                                               framework::dataset::make("K0", { 4, 8, 16 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
    }
}
FIXTURE_DATA_TEST_CASE(RunLargeRhsTransposed, CLMatMulKernelFixture<float>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDatasetRhsExportToCLImageRhsT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               framework::dataset::make("M0", { 2 })), // Choices of M0 does not matter much because it's related to Lhs tensor
                                                       framework::dataset::make("N0", { 1, 2, 3, 4 })),
                                               framework::dataset::make("K0", { 4, 8, 16 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F32)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f32, 0.f, abs_tolerance_f32);
    }
}
TEST_SUITE_END() // ExportRhsToCLImage
TEST_SUITE_END() // FP32
484
TEST_SUITE(FP16)
TEST_SUITE(Buffer)
// Same structure as the FP32 Buffer suite, with F16 data and the fp16 tolerances.
// No Tiny/HighDimensional runs here: dimensionality stress is covered by FP32.
FIXTURE_DATA_TEST_CASE(RunSmall, CLMatMulKernelFixture<half>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::SmallMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false, true })),
                                                                       framework::dataset::make("pretransose_B", { false, true })),
                                                               m0_values_precommit),
                                                       n0_values_precommit),
                                               k0_values_precommit),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
}
FIXTURE_DATA_TEST_CASE(RunLargeNoTranspose, CLMatMulKernelFixture<half>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               m0_values_nightly_lhs_nt),
                                                       n0_values_nightly_rhs_nt),
                                               k0_values_nightly_lhs_nt_rhs_nt),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
}
FIXTURE_DATA_TEST_CASE(RunLargeRhsTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { false })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               m0_values_nightly_lhs_nt),
                                                       n0_values_nightly_rhs_t),
                                               k0_values_nightly_rhs_t),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
}
FIXTURE_DATA_TEST_CASE(RunLargeLhsTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { true })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               m0_values_nightly_lhs_t),
                                                       n0_values_nightly_rhs_nt),
                                               k0_values_nightly_lhs_t_rhs_nt),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
}
FIXTURE_DATA_TEST_CASE(RunLargeLhsTransposedRhsTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDataset(),
                                                                               framework::dataset::make("pretransose_A", { true })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               m0_values_nightly_lhs_t),
                                                       n0_values_nightly_rhs_t),
                                               k0_values_nightly_rhs_t),
                                       framework::dataset::make("export_rhs_to_cl_image", { false })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
}
TEST_SUITE_END() // Buffer
548
TEST_SUITE(ExportRhsToCLImage)
// Same structure as the FP32 ExportRhsToCLImage suite, with F16 data and fp16
// tolerances. Output is only validated when the device supports CL images.
FIXTURE_DATA_TEST_CASE(RunSmallRhsNotTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::SmallMatMulDatasetRhsExportToCLImageRhsNT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               framework::dataset::make("M0", { 2 })),
                                                       framework::dataset::make("N0", { 4, 8, 16 })),
                                               framework::dataset::make("K0", { 2, 4 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
    }
}
FIXTURE_DATA_TEST_CASE(RunLargeRhsNotTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDatasetRhsExportToCLImageRhsNT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { false })),
                                                               framework::dataset::make("M0", { 2 })), // Choices of M0 does not matter much because it's related to Lhs tensor
                                                       framework::dataset::make("N0", { 4, 8, 16 })),
                                               framework::dataset::make("K0", { 1, 2, 3, 4 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
    }
}
FIXTURE_DATA_TEST_CASE(RunSmallRhsTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(datasets::SmallMatMulDatasetRhsExportToCLImageRhsT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               framework::dataset::make("M0", { 2 })),
                                                       framework::dataset::make("N0", { 2, 4 })),
                                               framework::dataset::make("K0", { 4, 8, 16 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
    }
}
FIXTURE_DATA_TEST_CASE(RunLargeRhsTransposed, CLMatMulKernelFixture<half>, framework::DatasetMode::NIGHTLY,
                       combine(combine(combine(combine(combine(combine(combine(datasets::LargeMatMulDatasetRhsExportToCLImageRhsT(),
                                                                               framework::dataset::make("pretransose_A", { true, false })),
                                                                       framework::dataset::make("pretransose_B", { true })),
                                                               framework::dataset::make("M0", { 2 })), // Choices of M0 does not matter much because it's related to Lhs tensor
                                                       framework::dataset::make("N0", { 1, 2, 3, 4 })),
                                               framework::dataset::make("K0", { 4, 8, 16 })),
                                       framework::dataset::make("export_rhs_to_cl_image", { true })),
                               framework::dataset::make("DataType", DataType::F16)))
{
    // Validate output
    if(_device_supports_export_to_cl_image)
    {
        validate(CLAccessor(_target), _reference, tolerance_f16, 0.f, abs_tolerance_f16);
    }
}
TEST_SUITE_END() // ExportRhsToCLImage
TEST_SUITE_END() // FP16
TEST_SUITE_END() // Float
TEST_SUITE_END() // MatMulKernel
TEST_SUITE_END() // CL
615} // namespace validation
616} // namespace test
617} // namespace arm_compute