Blame - tests/validation/fixtures/GEMMLowpFixture.h - ml/ComputeLibrary

2024-02-27 18:32:26 +0000

[diff] [blame^]

85

GEMMLowpOutputStageInfo output_stage = GEMMLowpOutputStageInfo(), bool reshape_b_only_on_first_run = false, const TensorFillInfo& finfo = TensorFillInfo(),

86

bool accumulate = false)

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

87

{

88

ARM_COMPUTE_ASSERT(is_data_type_quantized_asymmetric(data_type_a));

89

ARM_COMPUTE_ASSERT(data_type_a == data_type_b);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

90

// Create tensors

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

91

const DataType data_type_output = output_stage.type == GEMMLowpOutputStageType::NONE ? DataType::S32 : data_type_a;

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

92

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

93

TensorType a = create_tensor<TensorType>(shape_a, data_type_a, 1, a_qinfo);

94

TensorType b = create_tensor<TensorType>(shape_b, data_type_b, 1, b_qinfo); // gemm output before output stage mismatch if i pass data_layout_output here. to be investigated

95

TensorType output = create_tensor<TensorType>(shape_output, data_type_output, 1, output_qinfo /* output_qinfo will be ignored when output stage type is None */);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

96

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

TensorType bias;

if(is_fused)

{

TensorShape bias_shape(shape_b[0]);

101

bias = create_tensor<TensorType>(bias_shape, DataType::S32, 1);

102

}

103

104

// Create and configure function

105

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d input/output

106

FunctionType gemmlowp;

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

107

gemmlowp.configure(&a, &b, is_fused ? &bias : nullptr, &output, GEMMInfo(false, false, reshape_b_only_on_first_run, (reinterpret_output_as_3d ? shape_output[2] : 0), reinterpret_input_as_3d, false,

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

108

output_stage, false /*fp_mixed_precision*/, false /*fast_math*/, false /*broadcast_bias*/,

109

arm_compute::ActivationLayerInfo(), false /* fixed_format */, arm_compute::WeightFormat::UNSPECIFIED,

110

false /* pretranspose_B */, accumulate));

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

111

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

112

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

113

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

114

ARM_COMPUTE_ASSERT(output.info()->is_resizable());

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

115

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

116

add_padding_x({ &a, &b, &output });

117

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

118

// Allocate tensors

119

a.allocator()->allocate();

120

b.allocator()->allocate();

121

output.allocator()->allocate();

122

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

123

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

124

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

125

ARM_COMPUTE_ASSERT(!output.info()->is_resizable());

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

126

127

// Fill tensors

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

128

fill_quantized(AccessorType(a), 0 + finfo.hash);

129

fill_quantized(AccessorType(b), 1 + finfo.hash);

if (accumulate)

{

ARM_COMPUTE_ASSERT(accumulate != run_twice);

134

fill_s32(AccessorType(output), 6 + finfo.hash, finfo.min_output, finfo.max_output);

135

}

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

136

137

if(is_fused)

138

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

139

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

140

bias.allocator()->allocate();

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

141

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

142

fill_s32(AccessorType(bias), 2 + finfo.hash, finfo.min_bias, finfo.max_bias);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

143

}

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

144

145

// Run with variable inputs.

146

if(run_twice)

147

{

148

gemmlowp.run();

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

149

fill_quantized(AccessorType(a), 3 + finfo.hash); // Fill tensors with new seed after run

150

fill_quantized(AccessorType(b), 4 + finfo.hash);

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

151

if(is_fused)

152

{

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

153

fill_s32(AccessorType(bias), 5 + finfo.hash, finfo.min_bias, finfo.max_bias);

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

}

}

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

157

// Compute GEMM function

gemmlowp.run();

return output;

}

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

162

template <bool reinterpret_input_as_3d, typename TI = uint8_t, typename TW = uint8_t, bool pretranspose_A = false, bool pretranspose_B = false, bool run_twice = false>

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

163

SimpleTensor<int32_t> compute_gemmlowp_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo,

164

DataType data_type_a = DataType::QASYMM8, DataType data_type_b = DataType::QASYMM8, const TensorFillInfo& finfo = TensorFillInfo())

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

165

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

166

ARM_COMPUTE_ASSERT(is_data_type_quantized_asymmetric(data_type_a));

167

ARM_COMPUTE_ASSERT(data_type_a == data_type_b);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

168

TensorShape shape_a_to_use = shape_a;

169

if(reinterpret_input_as_3d)

170

{

171

// Collapse the second and third dimension if the input is 3D

172

shape_a_to_use.collapse(2U, 1U);

173

}

174

175

// Create reference

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

176

SimpleTensor<TI> a{ shape_a_to_use, data_type_a, 1, a_qinfo };

177

SimpleTensor<TW> b{ shape_b, data_type_b, 1, b_qinfo };

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

178

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

179

TensorShape shape_a_to_use_transposed{ shape_a_to_use };

180

TensorShape shape_b_transposed{ shape_b };

181

182

shape_a_to_use_transposed.set(0, shape_a_to_use[1]);

183

shape_a_to_use_transposed.set(1, shape_a_to_use[0]);

184

shape_b_transposed.set(0, shape_b[1]);

185

shape_b_transposed.set(1, shape_b[0]);

186

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

187

SimpleTensor<TI> a_transposed{ shape_a_to_use_transposed, data_type_a, 1, a_qinfo };

188

SimpleTensor<TW> b_transposed{ shape_b_transposed, data_type_b, 1, b_qinfo };

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

189

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

190

// Fill reference

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

191

fill_quantized(a, 0 + finfo.hash);

192

fill_quantized(b, 1 + finfo.hash);

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

193

194

// Transpose reference if required

Adnan AlSinan

3bb72b6

2022-05-06 12:10:11 +0100

[diff] [blame]

195

/* Note: Assuming the usual batch matmul dimensions A = (B x M x K), B = (B x K x N), if pretranspose_A is set to true, then A is assumed to be (B x K x M),

196

therefore, A must be pre-transposed before passing it to the fixture. And, we transpose A again in the fixture to make it (B x M x K)

197

in order to be able to call reference implementation that works with (B x M x K) input.

198

Similarly, if pretranspose_B is set to true, then B is assumed to be (B x N x K), B must be pre-transposed before passing it to the fixture. */

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

199

if(pretranspose_A)

200

{

201

transpose_matrix<TI>(a, a_transposed);

}

if(pretranspose_B)

{

transpose_matrix<TW>(b, b_transposed);

207

}

208

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

209

// Run with variable inputs.

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

210

const int32_t a_offset = a_qinfo.uniform().offset;

211

const int32_t b_offset = b_qinfo.uniform().offset;

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

212

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

213

if(run_twice)

214

{

215

reference::gemmlowp_matrix_multiply_core<int32_t, TI, TW>((pretranspose_A ? a_transposed : a), (pretranspose_B ? b_transposed : b), shape_output, a_offset, b_offset);

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

216

fill_quantized((pretranspose_A) ? a_transposed : a, 3 + finfo.hash);

217

fill_quantized((pretranspose_B) ? b_transposed : b, 4 + finfo.hash);

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

218

}

219

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

220

return reference::gemmlowp_matrix_multiply_core<int32_t, TI, TW>((pretranspose_A ? a_transposed : a), (pretranspose_B ? b_transposed : b), shape_output, a_offset, b_offset);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

221

}

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

222

} // namespace

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

223

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

224

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, bool run_twice = false>

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

225

class GEMMLowpGenericMatrixMultiplyCoreValidationFixture : public framework::Fixture

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

226

{

227

public:

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

228

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset, bool accumulate=false)

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

229

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

230

const auto a_qinfo = QuantizationInfo(1.0f / 255, a_offset);

231

const auto b_qinfo = QuantizationInfo(1.0f / 255, b_offset);

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

232

TensorFillInfo finfo;

233

_target = compute_target(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, finfo, accumulate);

234

_reference = compute_reference(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, finfo, accumulate);

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

235

}

236

237

protected:

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

238

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo, const TensorFillInfo& finfo, const bool accumulate)

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

239

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

240

const auto output_qinfo = QuantizationInfo(); // No output stage

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

241

return compute_gemmlowp_target<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, int32_t, false, run_twice>(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, output_qinfo,

242

DataType::QASYMM8, DataType::QASYMM8, GEMMLowpOutputStageInfo(), false, finfo, accumulate);

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

243

}

244

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

245

SimpleTensor<int32_t> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo, const TensorFillInfo& finfo, bool accumulate)

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

246

{

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

247

SimpleTensor<int32_t> ref_output = compute_gemmlowp_reference<reinterpret_input_as_3d, uint8_t, uint8_t, false, false, run_twice>(shape_a, shape_b, shape_output, a_qinfo, b_qinfo,

248

DataType::QASYMM8, DataType::QASYMM8, finfo);

if (accumulate)

{

SimpleTensor<int32_t> output{ shape_output, DataType::S32, 1 };

253

fill_s32(output, 6 + finfo.hash, finfo.min_output, finfo.max_output);

254

reference::arithmetic_operation<int32_t>(reference::ArithmeticOperation::ADD, output, ref_output, output, ConvertPolicy::SATURATE);

return output;

}

return ref_output;

Pablo Tello

bf2fb95

2017-09-29 16:43:25 +0100

[diff] [blame]

259

}

260

Pablo Tello

6ff12a0

2017-11-02 16:09:35 +0000

[diff] [blame]

261

TensorType _target{};

262

SimpleTensor<int32_t> _reference{};

Pablo Tello

bf2fb95

2017-09-29 16:43:25 +0100

[diff] [blame]

263

};

264

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

265

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, bool run_twice = false>

266

class GEMMLowpMatrixMultiplyCoreValidationFixture : protected GEMMLowpGenericMatrixMultiplyCoreValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, run_twice>

267

{

268

public:

269

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset)

270

{

271

GEMMLowpGenericMatrixMultiplyCoreValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, run_twice>::setup(shape_a, shape_b, shape_output, a_offset, b_offset, false /* accumulate */);

}

};

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, bool run_twice = false>

276

class GEMMLowpMatrixMultiplyAccumulateValidationFixture : protected GEMMLowpGenericMatrixMultiplyCoreValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, run_twice>

277

{

278

public:

279

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset)

280

{

281

GEMMLowpGenericMatrixMultiplyCoreValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, run_twice>::setup(shape_a, shape_b, shape_output, a_offset, b_offset, true /* accumulate */);

282

}

283

};

284

Mohammed Suhail Munshi

97a609b

2022-10-21 11:15:54 +0100

[diff] [blame]

285

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t, bool run_twice = false>

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

286

class GEMMLowpGenericMatrixMultiplyCoreFusedOffsetOutputValidationFixture : public framework::Fixture

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

287

{

288

public:

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

289

/** Dynamically initialize the quantization info with saturation awareness

290

*/

291

template <typename T>

292

static void setup_quantization(DataType data_type, const TensorShape& shape_a, const TensorShape& shape_b, QuantizationInfo& a_qinfo, QuantizationInfo& b_qinfo, QuantizationInfo& output_qinfo, TensorFillInfo& finfo)

293

{

294

// This hash is used by random generators. There may be hash collisions but

295

// this is intentional as it's a very easy way to make the the current

296

// random generation process almost different for many test configurations,

297

// which were using the same set of values before.

298

finfo.hash = shape_a[0] + shape_a[1] + shape_b[0] + shape_b[1];

299

300

const int32_t t_max = static_cast<int32_t>(std::numeric_limits<T>::max());

301

const int32_t t_min = static_cast<int32_t>(std::numeric_limits<T>::min());

302

303

std::mt19937 generator(library->seed() + finfo.hash);

304

std::uniform_real_distribution<float> distribution_float(-5.0f, 3.0f);

305

std::uniform_int_distribution<int32_t> distribution_t(t_min, t_max);

306

307

const float scale_lhs = pow(2, distribution_float(generator)); // [2^-5, 2^3]

308

const float scale_rhs = pow(2, distribution_float(generator)); // [2^-5, 2^3]

309

310

const int32_t offset_lhs = distribution_t(generator);

311

const int32_t offset_rhs = distribution_t(generator);

312

313

a_qinfo = QuantizationInfo(scale_lhs, offset_lhs);

314

b_qinfo = QuantizationInfo(scale_rhs, offset_rhs);

315

316

// reinterpret_input_as_3d or reinterpret_output_as_3d can be ignored, as the underlying gemm / matmul computation

317

// is equivalent to a standard 2D one with m-n-k dimensions

318

const int m = shape_a.y();

319

const int n = shape_b.x();

320

const int k = shape_a.x();

321

322

const float bias_fraction = 0.5f; // We enabled is_fused in compute_gemmlowp_target below, thus bias is included

323

324

QuantizationHint q_hint = suggest_matmul_dst_q_info_and_bias(a_qinfo, b_qinfo, m, n, k, data_type, bias_fraction);

325

output_qinfo = q_hint.q_info;

326

finfo.min_bias = q_hint.bias_min;

327

finfo.max_bias = q_hint.bias_max;

328

329

// Both target and reference implementations use negated offsets, i.e.

330

// float_val = (int_val + offset) * scale

331

// instead of

332

// float_val = (int_val - offset) * scale

333

// as usual. Therefore, after calculating the output quantization above, we

334

// negate the offsets of inputs' offsets.

335

a_qinfo = QuantizationInfo(scale_lhs, -offset_lhs);

336

b_qinfo = QuantizationInfo(scale_rhs, -offset_rhs);

337

}

338

339

/** Initialize output stage info from quantization info */

340

static Status init_gemmlowp_output_stage_info(

341

DataType data_type,

342

const QuantizationInfo& a_qinfo,

343

const QuantizationInfo& b_qinfo,

344

const QuantizationInfo& output_qinfo,

345

GEMMLowpOutputStageType type,

346

GEMMLowpOutputStageInfo &gemmlowp_output_stage_info)

347

{

348

ARM_COMPUTE_RETURN_ERROR_ON(!is_data_type_quantized_asymmetric(data_type));

349

350

const UniformQuantizationInfo aq_unif = a_qinfo.uniform();

351

const UniformQuantizationInfo bq_unif = b_qinfo.uniform();

352

const UniformQuantizationInfo oq_unif = output_qinfo.uniform();

353

354

float multiplier = (aq_unif.scale * bq_unif.scale) / oq_unif.scale;

355

int32_t int_multiplier;

356

int32_t shift;

357

358

ARM_COMPUTE_RETURN_ON_ERROR(

359

quantization::calculate_quantized_multiplier(multiplier, &int_multiplier, &shift));

360

361

int32_t type_min = 0;

362

int32_t type_max = 0;

363

std::tie(type_min, type_max) = quantization::get_quantized_asymmetric_output_min_max(output_qinfo, ActivationLayerInfo(), data_type);

364

365

gemmlowp_output_stage_info.gemmlowp_real_multiplier = multiplier;

366

gemmlowp_output_stage_info.gemmlowp_multiplier = int_multiplier;

367

gemmlowp_output_stage_info.gemmlowp_multipliers = { int_multiplier };

368

gemmlowp_output_stage_info.gemmlowp_shift = shift;

369

gemmlowp_output_stage_info.gemmlowp_shifts = { shift };

370

gemmlowp_output_stage_info.gemmlowp_offset = oq_unif.offset;

371

gemmlowp_output_stage_info.type = type;

372

gemmlowp_output_stage_info.gemmlowp_min_bound = type_min;

373

gemmlowp_output_stage_info.gemmlowp_max_bound = type_max;

return Status{};

}

/** Currently this fixture only tests the following data type configurations:

379

*

380

* 1. a and b are of the same data type

381

* 2. The data type is quantized asymmetric

382

*

383

*/

384

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, GEMMLowpOutputStageType output_stage_type, DataType data_type,

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

385

bool reshape_b_only_on_first_run)

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

386

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

387

ARM_COMPUTE_ASSERT(output_stage_type != GEMMLowpOutputStageType::NONE);

388

ARM_COMPUTE_ASSERT(is_data_type_quantized_asymmetric(data_type));

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

389

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

390

// Randomized dynamic quantization: randomize quantization info in a way that ensures no result saturation

391

// most of the time

392

QuantizationInfo a_qinfo;

393

QuantizationInfo b_qinfo;

394

QuantizationInfo output_qinfo;

395

TensorFillInfo finfo;

396

setup_quantization<TI>(data_type, shape_a, shape_b, a_qinfo, b_qinfo, output_qinfo, finfo);

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

397

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

398

GEMMLowpOutputStageInfo output_stage;

399

init_gemmlowp_output_stage_info(data_type, a_qinfo, b_qinfo, output_qinfo, output_stage_type, output_stage);

400

401

_reference = compute_reference(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, data_type, data_type, output_stage, finfo);

402

_target = compute_target(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, output_qinfo, data_type, data_type, output_stage, reshape_b_only_on_first_run, finfo);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

403

}

404

405

protected:

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

406

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo, const QuantizationInfo& output_qinfo,

407

DataType data_type_a, DataType data_type_b, const GEMMLowpOutputStageInfo& output_stage, bool reshape_b_only_on_first_run = false, const TensorFillInfo& finfo = TensorFillInfo())

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

408

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

409

return compute_gemmlowp_target<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, qasymm8_t, true, run_twice>(shape_a, shape_b, shape_output, a_qinfo,

410

b_qinfo, output_qinfo, data_type_a, data_type_b, output_stage, reshape_b_only_on_first_run, finfo);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

411

}

412

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

413

SimpleTensor<TI> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo,

414

DataType data_type_a, DataType data_type_b, const GEMMLowpOutputStageInfo& output_stage, const TensorFillInfo& finfo = TensorFillInfo())

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

415

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame]

416

SimpleTensor<int32_t> output = compute_gemmlowp_reference<reinterpret_input_as_3d, TI, TW, false, false, run_twice>(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, data_type_a, data_type_b, finfo);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

417

418

TensorShape bias_shape(shape_b[0]);

419

SimpleTensor<int32_t> bias{ bias_shape, DataType::S32, 1 };

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

420

(run_twice) ? fill_s32(bias, 5 + finfo.hash, finfo.min_bias, finfo.max_bias) : fill_s32(bias, 2 + finfo.hash, finfo.min_bias, finfo.max_bias); // Fill bias with same seed as last run of gemmlowp_target

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

421

422

switch(output_stage.type)

423

{

424

case GEMMLowpOutputStageType::QUANTIZE_DOWN:

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

425

return reference::gemmlowp_quantize_down_scale<int32_t, TI>(output, bias,

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

426

output_stage.gemmlowp_offset, output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

427

break;

428

case GEMMLowpOutputStageType::QUANTIZE_DOWN_FIXEDPOINT:

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

429

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, TI>(output, bias,

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

430

output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_offset, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

431

break;

432

default:

433

ARM_COMPUTE_ERROR("Not Supported!");

}

}

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

437

TensorType _target{};

438

SimpleTensor<TI> _reference{};

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

439

};

440

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

441

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t, bool run_twice = false>

442

class GEMMLowpMatrixMultiplyCoreFusedOffsetOutputValidationFixture : public GEMMLowpGenericMatrixMultiplyCoreFusedOffsetOutputValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW, run_twice>

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

443

{

444

public:

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

445

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, GEMMLowpOutputStageType output_stage_type, DataType data_type, bool reshape_b_only_on_first_run)

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

446

{

Radu Salavat

2024-02-27 18:32:26 +0000

[diff] [blame^]

447

GEMMLowpGenericMatrixMultiplyCoreFusedOffsetOutputValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW, run_twice>::setup(shape_a, shape_b,

448

shape_output, output_stage_type, data_type, reshape_b_only_on_first_run);

}

};

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t, bool run_twice = false>

453

class GEMMLowpBatchedMatrixMultiplyCoreFusedOffsetOutputFixture : public GEMMLowpGenericMatrixMultiplyCoreFusedOffsetOutputValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW, run_twice>

454

{

455

public:

456

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, GEMMLowpOutputStageType output_stage_type, DataType data_type, bool reshape_b_only_on_first_run)

457

{

458

GEMMLowpGenericMatrixMultiplyCoreFusedOffsetOutputValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW, run_twice>::setup(shape_a, shape_b, shape_output, output_stage_type, data_type, reshape_b_only_on_first_run);

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

}

};

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

462

template <typename TensorType, typename AccessorType, typename FunctionType>

463

class GEMMLowpQuantizeDownInt32ToUint8ScaleValidationFixture : public framework::Fixture

464

{

465

public:

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

466

void setup(TensorShape shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

467

{

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

468

_target = compute_target(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

469

_reference = compute_reference(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

}

protected:

template <typename U>

474

void fill(U &&tensor, int i)

475

{

476

std::uniform_int_distribution<> distribution(-6000, 6000);

477

library->fill(tensor, distribution, i);

478

}

479

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

480

TensorType compute_target(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

481

{

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

482

TensorShape shape_bias(shape[0]);

483

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

484

// Create tensors

485

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

486

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

487

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8, 1);

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

488

489

// Create and configure function

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

490

FunctionType output_stage;

491

GEMMLowpOutputStageInfo output_stage_info = GEMMLowpOutputStageInfo();

492

output_stage_info.type = GEMMLowpOutputStageType::QUANTIZE_DOWN;

493

output_stage_info.gemmlowp_offset = result_offset;

494

output_stage_info.gemmlowp_multiplier = result_mult_int;

495

output_stage_info.gemmlowp_shift = result_shift;

496

output_stage_info.gemmlowp_min_bound = min;

497

output_stage_info.gemmlowp_max_bound = max;

498

output_stage_info.output_data_type = DataType::QASYMM8;

499

output_stage.configure(&a, add_bias ? &b : nullptr, &c, output_stage_info);

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

500

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

501

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

502

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

503

504

// Allocate tensors

505

a.allocator()->allocate();

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

506

c.allocator()->allocate();

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

507

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

508

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

509

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

510

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

511

// Fill tensor

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

512

fill(AccessorType(a), 0);

513

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

514

if(add_bias)

515

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

516

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

517

518

// Allocate bias tensor

519

b.allocator()->allocate();

520

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

521

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

522

523

// Fill tensor

524

fill(AccessorType(b), 1);

525

}

526

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

527

// Compute GEMM function

528

output_stage.run();

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

529

return c;

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

530

}

531

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

532

SimpleTensor<uint8_t> compute_reference(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

533

{

534

// Create reference

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

535

TensorShape shape_bias(shape[0]);

536

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

537

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

538

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

// Fill reference

fill(a, 0);

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

543

const std::vector<int32_t> result_mult_int_vec = { result_mult_int };

544

const std::vector<int32_t> result_shift_vec = { result_shift };

545

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

if(add_bias)

{

// Fill bias

fill(b, 1);

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

551

return reference::gemmlowp_quantize_down_scale<int32_t, uint8_t>(a, b, result_offset, result_mult_int_vec, result_shift_vec, min, max);

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

552

}

553

else

554

{

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

555

return reference::gemmlowp_quantize_down_scale<int32_t, uint8_t>(a, result_offset, result_mult_int_vec, result_shift_vec, min, max);

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

556

}

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

557

}

558

559

TensorType _target{};

560

SimpleTensor<uint8_t> _reference{};

561

};

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

562

563

template <typename TensorType, typename AccessorType, typename FunctionType>

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

564

class GEMMLowpQuantizeDownInt32ToInt8ScaleValidationFixture : public framework::Fixture

565

{

566

public:

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

567

void setup(TensorShape shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

568

{

569

_target = compute_target(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

570

_reference = compute_reference(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

}

protected:

template <typename U>

575

void fill(U &&tensor, int i)

576

{

577

std::uniform_int_distribution<> distribution(-6000, 6000);

578

library->fill(tensor, distribution, i);

579

}

580

581

TensorType compute_target(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

582

{

583

TensorShape shape_bias(shape[0]);

584

585

// Create tensors

586

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

587

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

588

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8_SIGNED, 1);

589

590

// Create and configure function

591

FunctionType output_stage;

592

GEMMLowpOutputStageInfo output_stage_info = GEMMLowpOutputStageInfo();

593

output_stage_info.type = GEMMLowpOutputStageType::QUANTIZE_DOWN;

594

output_stage_info.gemmlowp_offset = result_offset;

595

output_stage_info.gemmlowp_multiplier = result_mult_int;

596

output_stage_info.gemmlowp_shift = result_shift;

597

output_stage_info.gemmlowp_min_bound = min;

598

output_stage_info.gemmlowp_max_bound = max;

599

output_stage_info.output_data_type = DataType::QASYMM8_SIGNED;

600

output_stage.configure(&a, add_bias ? &b : nullptr, &c, output_stage_info);

601

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

602

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

603

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

604

605

// Allocate tensors

606

a.allocator()->allocate();

607

c.allocator()->allocate();

608

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

609

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

610

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

611

612

// Fill tensor

613

fill(AccessorType(a), 0);

614

615

if(add_bias)

616

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

617

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

618

619

// Allocate bias tensor

620

b.allocator()->allocate();

621

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

622

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

623

624

// Fill tensor

625

fill(AccessorType(b), 1);

626

}

627

628

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<int8_t> compute_reference(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

634

{

635

// Create reference

636

TensorShape shape_bias(shape[0]);

637

638

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

639

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

const std::vector<int32_t> result_mult_int_vec = { result_mult_int };

645

const std::vector<int32_t> result_shift_vec = { result_shift };

if(add_bias)

{

// Fill bias

fill(b, 1);

return reference::gemmlowp_quantize_down_scale<int32_t, int8_t>(a, b, result_offset, result_mult_int_vec, result_shift_vec, min, max);

}

else

{

return reference::gemmlowp_quantize_down_scale<int32_t, int8_t>(a, result_offset, result_mult_int_vec, result_shift_vec, min, max);

}

}

TensorType _target{};

661

SimpleTensor<int8_t> _reference{};

662

};

663

664

template <typename TensorType, typename AccessorType, typename FunctionType>

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

665

class GEMMLowpQuantizeDownInt32ToInt8ScaleByFixedPointValidationFixture : public framework::Fixture

666

{

667

public:

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

668

void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

669

{

670

_target = compute_target(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

671

_reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

}

protected:

template <typename U>

676

void fill(U &&tensor, int i)

677

{

678

std::uniform_int_distribution<> distribution(-6000, 6000);

679

library->fill(tensor, distribution, i);

680

}

681

682

TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

683

{

684

TensorShape shape_bias(shape[0]);

685

686

// Create tensors

687

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

688

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

689

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8_SIGNED, 1);

690

691

// Create and configure function

692

FunctionType output_stage;

693

output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max);

694

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

695

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

696

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

697

698

// Allocate tensors

699

a.allocator()->allocate();

700

c.allocator()->allocate();

701

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

702

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

703

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

704

705

// Fill tensor

706

fill(AccessorType(a), 0);

707

708

if(add_bias)

709

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

710

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

711

712

// Allocate bias tensor

713

b.allocator()->allocate();

714

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

715

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

716

717

// Fill tensor

718

fill(AccessorType(b), 1);

719

}

720

721

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<int8_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max,

bool add_bias)

{

// Create reference

TensorShape shape_bias(shape[0]);

731

732

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

733

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };

739

const std::vector<int32_t> result_shift_vec = { result_shift };

if(add_bias)

{

// Fill bias

fill(b, 1);

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int8_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

}

else

{

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int8_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

}

}

TensorType _target{};

755

SimpleTensor<int8_t> _reference{};

756

};

757

758

template <typename TensorType, typename AccessorType, typename FunctionType>

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

759

class GEMMLowpQuantizeDownInt32ToUint8ScaleByFixedPointValidationFixture : public framework::Fixture

760

{

761

public:

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

762

void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

763

{

764

_target = compute_target(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

765

_reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

}

protected:

template <typename U>

770

void fill(U &&tensor, int i)

771

{

772

std::uniform_int_distribution<> distribution(-6000, 6000);

773

library->fill(tensor, distribution, i);

774

}

775

776

TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

777

{

778

TensorShape shape_bias(shape[0]);

779

780

// Create tensors

781

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

782

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

783

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8, 1);

784

785

// Create and configure function

786

FunctionType output_stage;

787

output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max);

788

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

789

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

790

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

791

792

// Allocate tensors

793

a.allocator()->allocate();

794

c.allocator()->allocate();

795

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

796

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

797

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

798

799

// Fill tensor

800

fill(AccessorType(a), 0);

801

802

if(add_bias)

803

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

804

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

805

806

// Allocate bias tensor

807

b.allocator()->allocate();

808

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

809

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

810

811

// Fill tensor

812

fill(AccessorType(b), 1);

813

}

814

815

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<uint8_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max,

bool add_bias)

{

// Create reference

TensorShape shape_bias(shape[0]);

825

826

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

827

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

832

const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };

833

const std::vector<int32_t> result_shift_vec = { result_shift };

834

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

if(add_bias)

{

// Fill bias

fill(b, 1);

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

840

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, uint8_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

841

}

842

else

843

{

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

844

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, uint8_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

}

}

TensorType _target{};

849

SimpleTensor<uint8_t> _reference{};

850

};

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

851

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

852

template <typename TensorType, typename AccessorType, typename FunctionType, typename T>

853

class GEMMLowpQuantizeDownInt32ScaleByFloatValidationFixture : public framework::Fixture

854

{

855

public:

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

856

void setup(DataType data_type, TensorShape shape, float result_real_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)

857

{

858

_target = compute_target(data_type, shape, result_real_multiplier, result_offset, min, max, add_bias);

859

_reference = compute_reference(shape, result_real_multiplier, result_offset, min, max, add_bias);

}

protected:

template <typename U>

864

void fill(U &&tensor, int i)

865

{

866

// To avoid data all being clampped

867

std::uniform_int_distribution<> distribution(-500, 500);

868

library->fill(tensor, distribution, i);

869

}

870

871

TensorType compute_target(DataType data_type, const TensorShape &shape, float result_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)

872

{

873

TensorShape shape_bias(shape[0]);

874

875

// Create tensors

876

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

877

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

878

TensorType c = create_tensor<TensorType>(shape, data_type, 1);

879

880

// create output stage info

881

GEMMLowpOutputStageInfo info;

882

info.gemmlowp_max_bound = max;

883

info.gemmlowp_min_bound = min;

884

info.gemmlowp_real_multiplier = result_multiplier;

885

info.gemmlowp_offset = result_offset;

886

info.type = GEMMLowpOutputStageType::QUANTIZE_DOWN_FLOAT;

887

info.output_data_type = data_type;

888

889

// Create and configure function

890

FunctionType output_stage;

891

output_stage.configure(&a, add_bias ? &b : nullptr, &c, info);

892

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

893

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

894

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

895

896

// Allocate tensors

897

a.allocator()->allocate();

898

c.allocator()->allocate();

899

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

900

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

901

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

902

903

// Fill tensor

904

fill(AccessorType(a), 0);

905

906

if(add_bias)

907

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

908

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

909

910

// Allocate bias tensor

911

b.allocator()->allocate();

912

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

913

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

914

915

// Fill tensor

916

fill(AccessorType(b), 1);

917

}

918

919

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<T> compute_reference(const TensorShape &shape, float_t result_real_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)

925

{

926

// Create reference

927

TensorShape shape_bias(shape[0]);

928

929

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

930

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

const std::vector<float_t> result_float_multiplier_vec = { result_real_multiplier };

if(add_bias)

{

// Fill bias

fill(b, 1);

return reference::gemmlowp_quantize_down_scale_by_float<int32_t, T>(a, b, result_float_multiplier_vec, result_offset, min, max);

}

else

{

return reference::gemmlowp_quantize_down_scale_by_float<int32_t, T>(a, result_float_multiplier_vec, result_offset, min, max);

}

}

TensorType _target{};

951

SimpleTensor<T> _reference{};

952

};

953

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

954

template <typename TensorType, typename AccessorType, typename FunctionType>

955

class GEMMLowpQuantizeDownInt32ToInt16ScaleByFixedPointValidationFixture : public framework::Fixture

956

{

957

public:

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

958

void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

959

{

960

_target = compute_target(shape, result_fixedpoint_multiplier, result_shift, min, max, add_bias);

961

_reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, min, max, add_bias);

}

protected:

template <typename U>

966

void fill(U &&tensor, int i)

967

{

968

std::uniform_int_distribution<> distribution(-6000, 6000);

969

library->fill(tensor, distribution, i);

970

}

971

972

TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

973

{

974

TensorShape shape_bias(shape[0]);

975

976

// Create tensors

977

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

978

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

979

TensorType c = create_tensor<TensorType>(shape, DataType::QSYMM16, 1);

980

981

// Create and configure function

982

FunctionType output_stage;

983

output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, min, max);

984

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

985

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

986

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

987

988

// Allocate tensors

989

a.allocator()->allocate();

990

c.allocator()->allocate();

991

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

992

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

993

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

994

995

// Fill tensor

996

fill(AccessorType(a), 0);

997

998

if(add_bias)

999

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1000

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

1001

1002

// Allocate bias tensor

1003

b.allocator()->allocate();

1004

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1005

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

1006

1007

// Fill tensor

1008

fill(AccessorType(b), 1);

1009

}

1010

1011

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<int16_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t min, int32_t max,

bool add_bias)

{

// Create reference

TensorShape shape_bias(shape[0]);

1021

1022

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

1023

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

1028

const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };

1029

const std::vector<int32_t> result_shift_vec = { result_shift };

1030

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

if(add_bias)

{

// Fill bias

fill(b, 1);

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

1036

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int16_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, 0, min, max);

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

1037

}

1038

else

1039

{

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

1040

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int16_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, 0, min, max);

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

}

}

TensorType _target{};

1045

SimpleTensor<int16_t> _reference{};

1046

};

1047

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1048

template <typename TensorType, typename AccessorType, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1049

class GEMMLowpMatrixMultiplyReshapedValidationFixture : public framework::Fixture

1050

{

1051

public:

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1052

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1053

bool interleave_rhs, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1054

{

1055

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

1060

lhs_info.transpose = false;

1061

1062

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1067

rhs_info.transpose = true;

1068

1069

// Set the tensor shapes for LHS and RHS matrices

1070

const TensorShape lhs_shape(k, m, batch_size);

1071

const TensorShape rhs_shape(n, k, batch_size);

1072

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1073

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);

1074

_reference = compute_reference(lhs_shape, rhs_shape, data_type);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

}

protected:

template <typename U>

1079

void fill(U &&tensor, int i)

1080

{

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1081

switch(tensor.data_type())

1082

{

1083

case DataType::QASYMM8:

1084

{

1085

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1086

std::uniform_int_distribution<> distribution(1, 254);

1087

library->fill(tensor, distribution, i);

1088

}

1089

break;

1090

case DataType::QASYMM8_SIGNED:

1091

{

1092

std::uniform_int_distribution<> distribution(-127, 126);

1093

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1098

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1099

}

1100

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1101

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1102

{

1103

// Create tensors

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1104

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1105

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1106

TensorType lhs_reshaped;

1107

TensorType rhs_reshaped;

1108

TensorType dst;

1109

1110

const unsigned int M = lhs_shape[1];

1111

const unsigned int N = rhs_shape[0];

1112

const unsigned int K = lhs_shape[0];

1113

1114

// The output tensor will be auto-initialized within the function

1115

1116

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1117

ReshapeLHSOperatorType reshape_lhs;

1118

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1119

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1120

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1121

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1122

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K));

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1123

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1124

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1125

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1126

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1127

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &dst });

1128

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1129

// Allocate tensors

1130

lhs.allocator()->allocate();

1131

rhs.allocator()->allocate();

1132

lhs_reshaped.allocator()->allocate();

1133

rhs_reshaped.allocator()->allocate();

1134

dst.allocator()->allocate();

1135

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1136

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1137

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1138

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1139

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1140

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1141

1142

// Fill tensors

1143

fill(AccessorType(lhs), 0);

1144

fill(AccessorType(rhs), 1);

1145

1146

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1147

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1148

reshape_lhs.run(reshape_lhs_pack);

1149

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1150

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1151

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1152

gemm.run(gemm_pack);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

return dst;

}

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1157

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1158

{

1159

TensorShape dst_shape = lhs_shape;

1160

dst_shape[0] = rhs_shape[0];

1161

dst_shape[1] = lhs_shape[1];

1162

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1163

switch(data_type)

1164

{

1165

case DataType::QASYMM8:

1166

{

1167

// Create reference

1168

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1169

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1170

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1171

// Fill reference

1172

fill(lhs, 0);

1173

fill(rhs, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1174

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1175

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

1176

}

1177

case DataType::QASYMM8_SIGNED:

1178

{

1179

// Create reference

1180

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1181

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1188

}

1189

default:

1190

ARM_COMPUTE_ERROR("Unsupported data type");

1191

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1192

}

1193

1194

TensorType _target{};

1195

SimpleTensor<int32_t> _reference{};

1196

};

1197

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1198

template <typename TensorType, typename AccessorType, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1199

class GEMMLowpMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

1200

{

1201

public:

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1202

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1203

bool interleave_lhs, bool interleave_rhs, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1204

{

1205

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

1210

lhs_info.transpose = false;

1211

1212

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1217

rhs_info.transpose = true;

1218

1219

// In case of GEMM3D, m is the product between m_w and m_h

1220

const unsigned int m = m_w * m_h;

1221

1222

// Set the tensor shapes for LHS and RHS matrices

1223

const TensorShape lhs_shape(k, m, batch_size);

1224

const TensorShape rhs_shape(n, k, batch_size);

1225

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1226

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h, data_type);

1227

_reference = compute_reference(lhs_shape, rhs_shape, m_h, data_type);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

}

protected:

template <typename U>

1232

void fill(U &&tensor, int i)

1233

{

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1234

switch(tensor.data_type())

1235

{

1236

case DataType::QASYMM8:

1237

{

1238

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1239

std::uniform_int_distribution<> distribution(1, 254);

1240

library->fill(tensor, distribution, i);

1241

}

1242

break;

1243

case DataType::QASYMM8_SIGNED:

1244

{

1245

std::uniform_int_distribution<> distribution(-127, 126);

1246

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1251

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1252

}

1253

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1254

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h,

1255

DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1256

{

1257

// Create tensors

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1258

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1259

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1260

TensorType lhs_reshaped;

1261

TensorType rhs_reshaped;

1262

TensorType dst;

1263

1264

const unsigned int M = lhs_shape[1];

1265

const unsigned int N = rhs_shape[0];

1266

const unsigned int K = lhs_shape[0];

1267

1268

// The output tensor will be auto-initialized within the function

1269

1270

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1271

ReshapeLHSOperatorType reshape_lhs;

1272

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1273

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1274

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1275

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1276

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K, 1, 1, m_h));

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1277

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1278

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1279

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1280

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1281

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &dst });

1282

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1283

// Allocate tensors

1284

lhs.allocator()->allocate();

1285

rhs.allocator()->allocate();

1286

lhs_reshaped.allocator()->allocate();

1287

rhs_reshaped.allocator()->allocate();

1288

dst.allocator()->allocate();

1289

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1290

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1291

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1292

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1293

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1294

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1295

1296

// Fill tensors

1297

fill(AccessorType(lhs), 0);

1298

fill(AccessorType(rhs), 1);

1299

1300

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1301

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1302

reshape_lhs.run(reshape_lhs_pack);

1303

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1304

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1305

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1306

gemm.run(gemm_pack);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

return dst;

}

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1311

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1312

{

1313

TensorShape dst_shape = lhs_shape;

1314

dst_shape.set(0, rhs_shape[0]);

1315

dst_shape.set(1, lhs_shape[1] / m_h);

1316

dst_shape.set(2, m_h);

1317

dst_shape.set(3, lhs_shape[2]);

1318

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1319

switch(data_type)

1320

{

1321

case DataType::QASYMM8:

1322

{

1323

// Create reference

1324

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1325

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1326

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1327

// Fill reference

1328

fill(lhs, 0);

1329

fill(rhs, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1330

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1331

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

1332

}

1333

case DataType::QASYMM8_SIGNED:

1334

{

1335

// Create reference

1336

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1337

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1344

}

1345

default:

1346

ARM_COMPUTE_ERROR("Unsupported data type");

1347

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1348

}

1349

1350

TensorType _target{};

1351

SimpleTensor<int32_t> _reference{};

1352

};

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1353

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1354

template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1355

class GEMMLowpMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1356

{

1357

public:

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1358

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1359

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1360

{

1361

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1370

rhs_info.transpose = transpose_rhs;

1371

1372

// Set the tensor shapes for LHS and RHS matrices

1373

const TensorShape lhs_shape(k, m, batch_size);

1374

const TensorShape rhs_shape(n, k, batch_size);

1375

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1376

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);

1377

_reference = compute_reference(lhs_shape, rhs_shape, data_type);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

}

protected:

template <typename U>

1382

void fill(U &&tensor, int i)

1383

{

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1384

switch(tensor.data_type())

1385

{

1386

case DataType::QASYMM8:

1387

{

1388

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1389

std::uniform_int_distribution<> distribution(1, 254);

1390

library->fill(tensor, distribution, i);

1391

}

1392

break;

1393

case DataType::QASYMM8_SIGNED:

1394

{

1395

std::uniform_int_distribution<> distribution(-127, 126);

1396

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1401

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1402

}

1403

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1404

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,

1405

const GEMMRHSMatrixInfo &rhs_info, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1406

{

1407

// Create tensors

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1408

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1409

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1410

TensorType rhs_reshaped;

1411

TensorType dst;

1412

1413

const unsigned int M = lhs_shape[1];

1414

const unsigned int N = rhs_shape[0];

1415

const unsigned int K = lhs_shape[0];

1416

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

1417

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.lhs_info = lhs_info;

1422

gemm_info.rhs_info = rhs_info;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1423

// The output tensor will be auto-initialized within the function

1424

1425

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1426

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1427

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1428

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1429

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1430

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1431

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1432

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1433

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1434

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &dst });

1435

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1436

// Allocate tensors

1437

lhs.allocator()->allocate();

1438

rhs.allocator()->allocate();

1439

rhs_reshaped.allocator()->allocate();

1440

dst.allocator()->allocate();

1441

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1442

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1443

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1444

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1445

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1446

1447

// Fill tensors

1448

fill(AccessorType(lhs), 0);

1449

fill(AccessorType(rhs), 1);

1450

1451

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1452

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1453

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1454

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1455

gemm.run(gemm_pack);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

return dst;

}

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1460

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1461

{

1462

TensorShape dst_shape = lhs_shape;

1463

dst_shape[0] = rhs_shape[0];

1464

dst_shape[1] = lhs_shape[1];

1465

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1466

if(data_type == DataType::QASYMM8)

1467

{

1468

// Create reference

1469

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1470

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1471

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1472

// Fill reference

1473

fill(lhs, 0);

1474

fill(rhs, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1475

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1476

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

}

else

{

// Create reference

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1482

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1489

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1490

}

1491

1492

TensorType _target{};

1493

SimpleTensor<int32_t> _reference{};

1494

};

1495

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1496

template <typename T, typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType, typename ReduceOperation, typename CastOperation>

1497

class GEMMLowpMatrixMultiplyReshapedOnlyRHSMMULOutputStageValidationFixture : public framework::Fixture

1498

{

1499

public:

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1500

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1501

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, bool broadcast_bias, DataType data_type)

1502

{

1503

GEMMLowpOutputStageInfo output_stage;

1504

output_stage.type = GEMMLowpOutputStageType::QUANTIZE_DOWN_FIXEDPOINT;

1505

output_stage.output_data_type = data_type;

1506

output_stage.gemmlowp_multipliers = std::vector<int32_t> { 1 };

1507

output_stage.gemmlowp_shifts = std::vector<int32_t> { 1 };

1508

output_stage.gemmlowp_multipliers[0] = 1;

1509

output_stage.gemmlowp_shifts[0] = 1;

1510

output_stage.gemmlowp_offset = 0;

1511

constexpr float scale = 0.001f;

1512

quantization::calculate_quantized_multiplier(scale, &output_stage.gemmlowp_multipliers[0], &output_stage.gemmlowp_shifts[0]);

1513

output_stage.gemmlowp_min_bound = -100;

1514

output_stage.gemmlowp_max_bound = 100;

1515

1516

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1525

rhs_info.transpose = transpose_rhs;

int a_offset = 1;

int b_offset = 1;

// Set the tensor shapes for LHS and RHS matrices

1531

const TensorShape lhs_shape(k, m, batch_size);

1532

const TensorShape rhs_shape(n, k, batch_size);

1533

const TensorShape bias_shape(n,

1534

broadcast_bias ? 1 : m,

1535

broadcast_bias ? 1 : batch_size);

1536

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

1537

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, output_stage, a_offset, b_offset);

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1538

if(gemm_validated == true)

1539

{

1540

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, output_stage, a_offset, b_offset);

}

}

protected:

template <typename U>

1546

void fill(U &&tensor, int i)

1547

{

1548

switch(tensor.data_type())

1549

{

1550

case DataType::QASYMM8:

1551

{

1552

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1553

std::uniform_int_distribution<> distribution(1, 254);

1554

library->fill(tensor, distribution, i);

1555

}

1556

break;

1557

case DataType::QASYMM8_SIGNED:

1558

{

1559

std::uniform_int_distribution<> distribution(-127, 126);

1560

library->fill(tensor, distribution, i);

}

break;

case DataType::S32:

{

std::uniform_int_distribution<> distribution(-10000, 10000);

1566

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

}

}

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info,

1575

const GEMMRHSMatrixInfo &rhs_info, DataType data_type, GEMMLowpOutputStageInfo output_stage, const int a_offset, const int b_offset)

1576

{

1577

// Create tensors

1578

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, a_offset));

1579

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, b_offset));

1580

TensorType bias = create_tensor<TensorType>(bias_shape, DataType::S32, 1);

1581

TensorType dst;

1582

TensorType rhs_reshaped;

1583

1584

const unsigned int M = lhs_shape[1];

1585

const unsigned int N = rhs_shape[0];

1586

const unsigned int K = lhs_shape[0];

1587

1588

// Tensors for precomputing sum of lhs rows / rhs columns

1589

TensorType vec_sum_rows = create_tensor<TensorType>(TensorShape(M, 1, lhs_shape[2]), DataType::S32, 1);

1590

TensorType vec_sum_cols = create_tensor<TensorType>(TensorShape(N, 1, rhs_shape[2]), DataType::S32, 1);

1591

1592

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.lhs_info = lhs_info;

1597

gemm_info.rhs_info = rhs_info;

1598

gemm_info.output_stage = output_stage;

1599

gemm_info.a_offset = a_offset;

1600

gemm_info.b_offset = b_offset;

1601

// The output tensor will be auto-initialized within the function

1602

1603

// Create and configure function

1604

ReshapeRHSOperatorType reshape_rhs;

1605

GEMMFunctionType gemm;

1606

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1607

1608

// If GEMM is not validated, do not try to run. The validation will check

1609

// if the technology supports this extension. If not, the test will be skipped.

1610

// If it supports, the test will fail anyway because target and reference

1611

// will not match.

1612

gemm_validated = bool(gemm.validate(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, vec_sum_cols.info(), vec_sum_rows.info(), bias.info()));

1613

if(gemm_validated == true)

1614

{

1615

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, vec_sum_cols.info(), vec_sum_rows.info(), bias.info());

1616

1617

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1618

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1619

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1620

1621

// Allocate tensors

1622

lhs.allocator()->allocate();

1623

rhs.allocator()->allocate();

1624

rhs_reshaped.allocator()->allocate();

1625

bias.allocator()->allocate();

1626

vec_sum_cols.allocator()->allocate();

1627

vec_sum_rows.allocator()->allocate();

1628

dst.allocator()->allocate();

1629

1630

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1631

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1632

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1633

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1634

ARM_COMPUTE_ASSERT(!vec_sum_cols.info()->is_resizable());

1635

ARM_COMPUTE_ASSERT(!vec_sum_rows.info()->is_resizable());

1636

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1637

1638

// Fill tensors

1639

fill(AccessorType(lhs), 0);

1640

fill(AccessorType(rhs), 1);

1641

fill(AccessorType(bias), 2);

1642

1643

TensorType lhs_32 = create_tensor<TensorType>(lhs_shape, DataType::S32, 1);

1644

TensorType rhs_32 = create_tensor<TensorType>(rhs_shape, DataType::S32, 1);

1645

CastOperation cast_lhs;

1646

CastOperation cast_rhs;

1647

cast_lhs.configure(&lhs, &lhs_32, ConvertPolicy::SATURATE);

1648

cast_rhs.configure(&rhs, &rhs_32, ConvertPolicy::SATURATE);

1649

lhs_32.allocator()->allocate();

1650

rhs_32.allocator()->allocate();

cast_lhs.run();

cast_rhs.run();

ReduceOperation lhs_sum_rows;

1655

ReduceOperation rhs_sum_cols;

1656

1657

lhs_sum_rows.configure(&lhs_32, &vec_sum_rows, 0, ReductionOperation::SUM, false);

1658

rhs_sum_cols.configure(&rhs_32, &vec_sum_cols, 1, ReductionOperation::SUM);

lhs_sum_rows.run();

rhs_sum_cols.run();

// Compute GEMM

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1665

reshape_rhs.run(reshape_rhs_pack);

1666

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_SRC_2, &bias }, { ACL_DST, &dst }, { ACL_VEC_COL_SUM, &vec_sum_cols }, { ACL_VEC_ROW_SUM, &vec_sum_rows } });

gemm.run(gemm_pack);

}

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, GEMMLowpOutputStageInfo output_stage,

1674

const int a_offset, const int b_offset)

1675

{

1676

TensorShape dst_shape = lhs_shape;

1677

dst_shape[0] = rhs_shape[0];

1678

dst_shape[1] = lhs_shape[1];

1679

1680

// Create reference

1681

SimpleTensor<T> lhs{ lhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, a_offset) };

1682

SimpleTensor<T> rhs{ rhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, b_offset) };

1683

SimpleTensor<int32_t> bias{ bias_shape, DataType::S32, 1 };

1684

SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };

1685

SimpleTensor<T> dst_final{ dst_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

dst = reference::gemmlowp_matrix_multiply_core<int32_t, T>(lhs, rhs, dst_shape, a_offset, b_offset);

1693

dst_final = reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, T>(dst, bias,

1694

output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_offset, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);

return dst_final;

}

bool gemm_validated = true;

1699

TensorType _target{};

1700

SimpleTensor<T> _reference{};

1701

};

1702

1703

template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

1704

class GEMMLowpMatrixMultiplyReshapedOnlyRHSMMULValidationFixture : public framework::Fixture

1705

{

1706

public:

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1707

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1708

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)

1709

{

1710

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1719

rhs_info.transpose = transpose_rhs;

1720

1721

// Set the tensor shapes for LHS and RHS matrices

1722

const TensorShape lhs_shape(k, m, batch_size);

1723

const TensorShape rhs_shape(n, k, batch_size);

1724

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

1725

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1726

if(gemm_validated == true)

1727

{

1728

_reference = compute_reference(lhs_shape, rhs_shape, data_type);

}

}

protected:

template <typename U>

1734

void fill(U &&tensor, int i)

1735

{

1736

switch(tensor.data_type())

1737

{

1738

case DataType::QASYMM8:

1739

{

1740

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1741

std::uniform_int_distribution<> distribution(1, 254);

1742

library->fill(tensor, distribution, i);

1743

}

1744

break;

1745

case DataType::QASYMM8_SIGNED:

1746

{

1747

std::uniform_int_distribution<> distribution(-127, 126);

1748

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

}

}

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,

1757

const GEMMRHSMatrixInfo &rhs_info, DataType data_type)

1758

{

1759

// Create tensors

1760

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1761

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1762

TensorType rhs_reshaped;

1763

TensorType dst;

1764

1765

const unsigned int M = lhs_shape[1];

1766

const unsigned int N = rhs_shape[0];

1767

const unsigned int K = lhs_shape[0];

1768

1769

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.lhs_info = lhs_info;

1774

gemm_info.rhs_info = rhs_info;

1775

// The output tensor will be auto-initialized within the function

1776

1777

// Create and configure function

1778

ReshapeRHSOperatorType reshape_rhs;

1779

GEMMFunctionType gemm;

1780

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1781

1782

// If GEMM is not validated, do not try to run. The validation will check

1783

// if the technology supports this extension. If not, the test will be skipped.

1784

// If it supports, the test will fail anyway because target and reference

1785

// will not match.

1786

gemm_validated = bool(gemm.validate(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, nullptr, nullptr, nullptr));

1787

if(gemm_validated == true)

1788

{

1789

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, nullptr, nullptr, nullptr);

1790

1791

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1792

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1793

1794

// Allocate tensors

1795

lhs.allocator()->allocate();

1796

rhs.allocator()->allocate();

1797

rhs_reshaped.allocator()->allocate();

1798

dst.allocator()->allocate();

1799

1800

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1801

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1802

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1803

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1804

1805

// Fill tensors

1806

fill(AccessorType(lhs), 0);

1807

fill(AccessorType(rhs), 1);

1808

1809

// Compute GEMM

1810

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1811

reshape_rhs.run(reshape_rhs_pack);

1812

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

gemm.run(gemm_pack);

}

return dst;

}

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)

1820

{

1821

TensorShape dst_shape = lhs_shape;

1822

dst_shape[0] = rhs_shape[0];

1823

dst_shape[1] = lhs_shape[1];

1824

1825

if(data_type == DataType::QASYMM8)

1826

{

1827

// Create reference

1828

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1829

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

1830

SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

}

else

{

// Create reference

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1842

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

1843

SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

}

}

bool gemm_validated = true;

1854

TensorType _target{};

1855

SimpleTensor<int32_t> _reference{};

1856

};

1857

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1858

template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1859

class GEMMLowpMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1860

{

1861

public:

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1862

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1863

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1864

{

1865

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1874

rhs_info.transpose = transpose_rhs;

1875

1876

// In case of GEMM3D, m is the product between m_w and m_h

1877

const unsigned int m = m_w * m_h;

1878

1879

// Set the tensor shapes for LHS and RHS matrices

1880

const TensorShape lhs_shape(k, m, batch_size);

1881

const TensorShape rhs_shape(n, k, batch_size);

1882

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1883

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h, data_type);

1884

_reference = compute_reference(lhs_shape, rhs_shape, m_h, data_type);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

}

protected:

template <typename U>

1889

void fill(U &&tensor, int i)

1890

{

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1891

switch(tensor.data_type())

1892

{

1893

case DataType::QASYMM8:

1894

{

1895

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1896

std::uniform_int_distribution<> distribution(1, 254);

1897

library->fill(tensor, distribution, i);

1898

}

1899

break;

1900

case DataType::QASYMM8_SIGNED:

1901

{

1902

std::uniform_int_distribution<> distribution(-127, 126);

1903

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1908

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1909

}

1910

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1911

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,

1912

const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1913

{

1914

// Create tensors

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1915

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1916

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1917

TensorType rhs_reshaped;

1918

TensorType dst;

1919

1920

const unsigned int M = lhs_shape[1];

1921

const unsigned int N = rhs_shape[0];

1922

const unsigned int K = lhs_shape[0];

1923

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

1924

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.depth_output_gemm3d = m_h;

1929

gemm_info.lhs_info = lhs_info;

1930

gemm_info.rhs_info = rhs_info;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1931

// The output tensor will be auto-initialized within the function

1932

1933

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1934

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1935

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1936

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1937

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1938

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1939

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1940

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1941

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1942

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &dst });

1943

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1944

// Allocate tensors

1945

lhs.allocator()->allocate();

1946

rhs.allocator()->allocate();

1947

rhs_reshaped.allocator()->allocate();

1948

dst.allocator()->allocate();

1949

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1950

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1951

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1952

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1953

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1954

1955

// Fill tensors

1956

fill(AccessorType(lhs), 0);

1957

fill(AccessorType(rhs), 1);

1958

1959

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1960

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1961

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1962

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1963

gemm.run(gemm_pack);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

return dst;

}

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1968

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1969

{

1970

TensorShape dst_shape = lhs_shape;

1971

dst_shape.set(0, rhs_shape[0]);

1972

dst_shape.set(1, lhs_shape[1] / m_h);

1973

dst_shape.set(2, m_h);

1974

dst_shape.set(3, lhs_shape[2]);

1975

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1976

if(data_type == DataType::QASYMM8)

1977

{

1978

// Create reference

1979

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1980

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1981

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1982

// Fill reference

1983

fill(lhs, 0);

1984

fill(rhs, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1985

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1986

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

}

else

{

// Create reference

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1992

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1999

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

2000

}

2001

2002

TensorType _target{};

2003

SimpleTensor<int32_t> _reference{};

2004

};

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2005

2006

template <typename TensorType, typename AccessorType, typename GEMMFunctionType>

2007

class GEMMLowpMatrixMultiplyNativeValidationFixture : public framework::Fixture

2008

{

2009

public:

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2010

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0)

2011

{

2012

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

2021

const TensorShape lhs_shape(k, m, batch_size);

2022

const TensorShape rhs_shape(n, k, batch_size);

2023

2024

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info);

2025

_reference = compute_reference(lhs_shape, rhs_shape);

}

protected:

template <typename U>

2030

void fill(U &&tensor, int i)

2031

{

2032

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

2033

std::uniform_int_distribution<> distribution(1, 254);

2034

library->fill(tensor, distribution, i);

2035

}

2036

2037

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info)

2038

{

2039

// Create tensors

2040

TensorType lhs = create_tensor<TensorType>(lhs_shape, DataType::QASYMM8, 1);

2041

TensorType rhs = create_tensor<TensorType>(rhs_shape, DataType::QASYMM8, 1);

2042

TensorType dst;

2043

2044

const unsigned int M = lhs_shape[1];

2045

const unsigned int N = rhs_shape[0];

2046

const unsigned int K = lhs_shape[0];

2047

2048

// The output tensor will be auto-initialized within the function

2049

2050

// Create and configure function

2051

GEMMFunctionType gemm;

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2052

gemm.configure(lhs.info(), rhs.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K));

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2053

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2054

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2055

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2056

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2057

add_padding_x({ &lhs, &rhs, &dst });

2058

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2059

// Allocate tensors

2060

lhs.allocator()->allocate();

2061

rhs.allocator()->allocate();

2062

dst.allocator()->allocate();

2063

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2064

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2065

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2066

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2067

2068

// Fill tensors

2069

fill(AccessorType(lhs), 0);

2070

fill(AccessorType(rhs), 1);

2071

2072

// Compute GEMM

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2073

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs }, { ACL_DST, &dst } });

2074

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

return dst;

}

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape)

2080

{

2081

TensorShape dst_shape = lhs_shape;

2082

dst_shape[0] = rhs_shape[0];

2083

dst_shape[1] = lhs_shape[1];

2084

2085

// Create reference

2086

SimpleTensor<uint8_t> lhs{ lhs_shape, DataType::QASYMM8, 1 };

2087

SimpleTensor<uint8_t> rhs{ rhs_shape, DataType::QASYMM8, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

2094

}

2095

2096

TensorType _target{};

2097

SimpleTensor<int32_t> _reference{};

2098

};

2099

2100

template <typename TensorType, typename AccessorType, typename GEMMFunctionType>

2101

class GEMMLowpMatrixMultiplyNative3DValidationFixture : public framework::Fixture

2102

{

2103

public:

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2104

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0)

2105

{

2106

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

2115

const unsigned int m = m_w * m_h;

2116

2117

// Set the tensor shapes for LHS and RHS matrices

2118

const TensorShape lhs_shape(k, m, batch_size);

2119

const TensorShape rhs_shape(n, k, batch_size);

2120

2121

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h);

2122

_reference = compute_reference(lhs_shape, rhs_shape, m_h);

}

protected:

template <typename U>

2127

void fill(U &&tensor, int i)

2128

{

2129

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

2130

std::uniform_int_distribution<> distribution(1, 254);

2131

library->fill(tensor, distribution, i);

2132

}

2133

2134

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h)

2135

{

2136

// Create tensors

2137

TensorType lhs = create_tensor<TensorType>(lhs_shape, DataType::QASYMM8, 1);

2138

TensorType rhs = create_tensor<TensorType>(rhs_shape, DataType::QASYMM8, 1);

2139

TensorType dst;

2140

2141

const unsigned int M = lhs_shape[1];

2142

const unsigned int N = rhs_shape[0];

2143

const unsigned int K = lhs_shape[0];

2144

2145

// The output tensor will be auto-initialized within the function

2146

2147

// Create and configure function

2148

GEMMFunctionType gemm;

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2149

gemm.configure(lhs.info(), rhs.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K, 1, 1, m_h));

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2150

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2151

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2152

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2153

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2154

add_padding_x({ &lhs, &rhs, &dst });

2155

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2156

// Allocate tensors

2157

lhs.allocator()->allocate();

2158

rhs.allocator()->allocate();

2159

dst.allocator()->allocate();

2160

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2161

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2162

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2163

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2164

2165

// Fill tensors

2166

fill(AccessorType(lhs), 0);

2167

fill(AccessorType(rhs), 1);

2168

2169

// Compute GEMM

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2170

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs }, { ACL_DST, &dst } });

2171

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

return dst;

}

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h)

2177

{

2178

TensorShape dst_shape = lhs_shape;

2179

dst_shape.set(0, rhs_shape[0]);

2180

dst_shape.set(1, lhs_shape[1] / m_h);

2181

dst_shape.set(2, m_h);

2182

dst_shape.set(3, lhs_shape[2]);

2183

2184

// Create reference

2185

SimpleTensor<uint8_t> lhs{ lhs_shape, DataType::QASYMM8, 1 };

2186

SimpleTensor<uint8_t> rhs{ rhs_shape, DataType::QASYMM8, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

2193

}

2194

2195

TensorType _target{};

2196

SimpleTensor<int32_t> _reference{};

2197

};

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

2198

} // namespace validation

2199

} // namespace test

2200

} // namespace arm_compute

SiCong Li