Blame - tests/validation/fixtures/GEMMLowpFixture.h - ml/ComputeLibrary

2019-02-22 16:37:41 +0000

[diff] [blame]

78

// Create tensors

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

79

const DataType data_type_output = output_stage.type == GEMMLowpOutputStageType::NONE ? DataType::S32 : data_type_a;

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

80

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

81

TensorType a = create_tensor<TensorType>(shape_a, data_type_a, 1, a_qinfo);

82

TensorType b = create_tensor<TensorType>(shape_b, data_type_b, 1, b_qinfo); // gemm output before output stage mismatch if i pass data_layout_output here. to be investigated

83

TensorType output = create_tensor<TensorType>(shape_output, data_type_output, 1, output_qinfo /* output_qinfo will be ignored when output stage type is None */);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

84

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

TensorType bias;

if(is_fused)

{

TensorShape bias_shape(shape_b[0]);

89

bias = create_tensor<TensorType>(bias_shape, DataType::S32, 1);

90

}

91

92

// Create and configure function

93

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d input/output

94

FunctionType gemmlowp;

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

95

gemmlowp.configure(&a, &b, is_fused ? &bias : nullptr, &output, GEMMInfo(false, false, reshape_b_only_on_first_run, (reinterpret_output_as_3d ? shape_output[2] : 0), reinterpret_input_as_3d, false,

96

output_stage));

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

97

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

98

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

99

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

100

ARM_COMPUTE_ASSERT(output.info()->is_resizable());

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

101

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

102

add_padding_x({ &a, &b, &output });

103

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

104

// Allocate tensors

105

a.allocator()->allocate();

106

b.allocator()->allocate();

107

output.allocator()->allocate();

108

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

109

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

110

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

111

ARM_COMPUTE_ASSERT(!output.info()->is_resizable());

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

112

113

// Fill tensors

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

114

fill(AccessorType(a), 0 + finfo.hash);

115

fill(AccessorType(b), 1 + finfo.hash);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

116

117

if(is_fused)

118

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

119

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

120

bias.allocator()->allocate();

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

121

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

122

fill_bias_s32(AccessorType(bias), 2 + finfo.hash, finfo.min_bias, finfo.max_bias);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

123

}

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

124

125

// Run with variable inputs.

126

if(run_twice)

127

{

128

gemmlowp.run();

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

129

fill(AccessorType(a), 3 + finfo.hash); // Fill tensors with new seed after run

130

fill(AccessorType(b), 4 + finfo.hash);

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

131

if(is_fused)

132

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

133

fill_bias_s32(AccessorType(bias), 5 + finfo.hash, finfo.min_bias, finfo.max_bias);

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

}

}

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

137

// Compute GEMM function

gemmlowp.run();

return output;

}

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

142

template <bool reinterpret_input_as_3d, typename TI = uint8_t, typename TW = uint8_t, bool pretranspose_A = false, bool pretranspose_B = false, bool run_twice = false>

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

143

SimpleTensor<int32_t> compute_gemmlowp_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo,

144

DataType data_type_a = DataType::QASYMM8, DataType data_type_b = DataType::QASYMM8, const TensorFillInfo& finfo = TensorFillInfo())

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

145

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

146

ARM_COMPUTE_ASSERT(is_data_type_quantized_asymmetric(data_type_a));

147

ARM_COMPUTE_ASSERT(data_type_a == data_type_b);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

148

TensorShape shape_a_to_use = shape_a;

149

if(reinterpret_input_as_3d)

150

{

151

// Collapse the second and third dimension if the input is 3D

152

shape_a_to_use.collapse(2U, 1U);

153

}

154

155

// Create reference

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

156

SimpleTensor<TI> a{ shape_a_to_use, data_type_a, 1, a_qinfo };

157

SimpleTensor<TW> b{ shape_b, data_type_b, 1, b_qinfo };

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

158

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

159

TensorShape shape_a_to_use_transposed{ shape_a_to_use };

160

TensorShape shape_b_transposed{ shape_b };

161

162

shape_a_to_use_transposed.set(0, shape_a_to_use[1]);

163

shape_a_to_use_transposed.set(1, shape_a_to_use[0]);

164

shape_b_transposed.set(0, shape_b[1]);

165

shape_b_transposed.set(1, shape_b[0]);

166

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

167

SimpleTensor<TI> a_transposed{ shape_a_to_use_transposed, data_type_a, 1, a_qinfo };

168

SimpleTensor<TW> b_transposed{ shape_b_transposed, data_type_b, 1, b_qinfo };

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

169

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

170

// Fill reference

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

171

fill(a, 0 + finfo.hash);

172

fill(b, 1 + finfo.hash);

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

173

174

// Transpose reference if required

Adnan AlSinan

3bb72b6

2022-05-06 12:10:11 +0100

[diff] [blame]

175

/* Note: Assuming the usual batch matmul dimensions A = (B x M x K), B = (B x K x N), if pretranspose_A is set to true, then A is assumed to be (B x K x M),

176

therefore, A must be pre-transposed before passing it to the fixture. And, we transpose A again in the fixture to make it (B x M x K)

177

in order to be able to call reference implementation that works with (B x M x K) input.

178

Similarly, if pretranspose_B is set to true, then B is assumed to be (B x N x K), B must be pre-transposed before passing it to the fixture. */

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

179

if(pretranspose_A)

180

{

181

transpose_matrix<TI>(a, a_transposed);

}

if(pretranspose_B)

{

transpose_matrix<TW>(b, b_transposed);

187

}

188

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

189

// Run with variable inputs.

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

190

const int32_t a_offset = a_qinfo.uniform().offset;

191

const int32_t b_offset = b_qinfo.uniform().offset;

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

192

if(run_twice)

193

{

194

reference::gemmlowp_matrix_multiply_core<int32_t, TI, TW>((pretranspose_A ? a_transposed : a), (pretranspose_B ? b_transposed : b), shape_output, a_offset, b_offset);

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

195

fill((pretranspose_A) ? a_transposed : a, 3 + finfo.hash);

196

fill((pretranspose_B) ? b_transposed : b, 4 + finfo.hash);

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

197

}

198

Adnan AlSinan

2022-05-05 11:13:19 +0100

[diff] [blame]

199

return reference::gemmlowp_matrix_multiply_core<int32_t, TI, TW>((pretranspose_A ? a_transposed : a), (pretranspose_B ? b_transposed : b), shape_output, a_offset, b_offset);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

200

}

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

201

} // namespace

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

202

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

203

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, bool run_twice = false>

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

204

class GEMMLowpMatrixMultiplyCoreValidationFixture : public framework::Fixture

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

205

{

206

public:

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

207

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, int32_t a_offset, int32_t b_offset)

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

208

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

209

const auto a_qinfo = QuantizationInfo(1.0f / 255, a_offset);

210

const auto b_qinfo = QuantizationInfo(1.0f / 255, b_offset);

211

_target = compute_target(shape_a, shape_b, shape_output, a_qinfo, b_qinfo);

212

_reference = compute_reference(shape_a, shape_b, shape_output, a_qinfo, b_qinfo);

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

213

}

214

215

protected:

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

216

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo)

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

217

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

218

const auto output_qinfo = QuantizationInfo(); // No output stage

219

return compute_gemmlowp_target<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, int32_t, false, run_twice>(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, output_qinfo);

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

220

}

221

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

222

SimpleTensor<int32_t> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo)

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

223

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

224

return compute_gemmlowp_reference<reinterpret_input_as_3d, uint8_t, uint8_t, false, false, run_twice>(shape_a, shape_b, shape_output, a_qinfo, b_qinfo);

Pablo Tello

bf2fb95

2017-09-29 16:43:25 +0100

[diff] [blame]

225

}

226

Pablo Tello

6ff12a0

2017-11-02 16:09:35 +0000

[diff] [blame]

227

TensorType _target{};

228

SimpleTensor<int32_t> _reference{};

Pablo Tello

bf2fb95

2017-09-29 16:43:25 +0100

[diff] [blame]

229

};

230

Mohammed Suhail Munshi

97a609b

2022-10-21 11:15:54 +0100

[diff] [blame]

231

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t, bool run_twice = false>

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

232

class GEMMLowpMatrixMultiplyCoreFusedOffsetOutputGenericValidationFixture : public framework::Fixture

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

233

{

234

public:

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

235

/** Dynamically initialize the quantization info with saturation awareness

236

*/

237

template <typename T>

238

static void setup_quantization(DataType data_type, const TensorShape& shape_a, const TensorShape& shape_b, QuantizationInfo& a_qinfo, QuantizationInfo& b_qinfo, QuantizationInfo& output_qinfo, TensorFillInfo& finfo)

239

{

240

// This hash is used by random generators. There may be hash collisions but

241

// this is intentional as it's a very easy way to make the the current

242

// random generation process almost different for many test configurations,

243

// which were using the same set of values before.

244

finfo.hash = shape_a[0] + shape_a[1] + shape_b[0] + shape_b[1];

245

246

const int32_t t_max = static_cast<int32_t>(std::numeric_limits<T>::max());

247

const int32_t t_min = static_cast<int32_t>(std::numeric_limits<T>::min());

248

249

std::mt19937 generator(library->seed() + finfo.hash);

250

std::uniform_real_distribution<float> distribution_float(-5.0f, 3.0f);

251

std::uniform_int_distribution<int32_t> distribution_t(t_min, t_max);

252

253

const float scale_lhs = pow(2, distribution_float(generator)); // [2^-5, 2^3]

254

const float scale_rhs = pow(2, distribution_float(generator)); // [2^-5, 2^3]

255

256

const int32_t offset_lhs = distribution_t(generator);

257

const int32_t offset_rhs = distribution_t(generator);

258

259

a_qinfo = QuantizationInfo(scale_lhs, offset_lhs);

260

b_qinfo = QuantizationInfo(scale_rhs, offset_rhs);

261

262

// reinterpret_input_as_3d or reinterpret_output_as_3d can be ignored, as the underlying gemm / matmul computation

263

// is equivalent to a standard 2D one with m-n-k dimensions

264

const int m = shape_a.y();

265

const int n = shape_b.x();

266

const int k = shape_a.x();

267

268

const float bias_fraction = 0.5f; // We enabled is_fused in compute_gemmlowp_target below, thus bias is included

269

270

QuantizationHint q_hint = suggest_matmul_dst_q_info_and_bias(a_qinfo, b_qinfo, m, n, k, data_type, bias_fraction);

271

output_qinfo = q_hint.q_info;

272

finfo.min_bias = q_hint.bias_min;

273

finfo.max_bias = q_hint.bias_max;

274

275

// Both target and reference implementations use negated offsets, i.e.

276

// float_val = (int_val + offset) * scale

277

// instead of

278

// float_val = (int_val - offset) * scale

279

// as usual. Therefore, after calculating the output quantization above, we

280

// negate the offsets of inputs' offsets.

281

a_qinfo = QuantizationInfo(scale_lhs, -offset_lhs);

282

b_qinfo = QuantizationInfo(scale_rhs, -offset_rhs);

283

}

284

285

/** Initialize output stage info from quantization info */

286

static Status init_gemmlowp_output_stage_info(

287

DataType data_type,

288

const QuantizationInfo& a_qinfo,

289

const QuantizationInfo& b_qinfo,

290

const QuantizationInfo& output_qinfo,

291

GEMMLowpOutputStageType type,

292

GEMMLowpOutputStageInfo &gemmlowp_output_stage_info)

293

{

294

ARM_COMPUTE_RETURN_ERROR_ON(!is_data_type_quantized_asymmetric(data_type));

295

296

const UniformQuantizationInfo aq_unif = a_qinfo.uniform();

297

const UniformQuantizationInfo bq_unif = b_qinfo.uniform();

298

const UniformQuantizationInfo oq_unif = output_qinfo.uniform();

299

300

float multiplier = (aq_unif.scale * bq_unif.scale) / oq_unif.scale;

301

int32_t int_multiplier;

302

int32_t shift;

303

304

ARM_COMPUTE_RETURN_ON_ERROR(

305

quantization::calculate_quantized_multiplier(multiplier, &int_multiplier, &shift));

306

307

int32_t type_min = 0;

308

int32_t type_max = 0;

309

std::tie(type_min, type_max) = quantization::get_quantized_asymmetric_output_min_max(output_qinfo, ActivationLayerInfo(), data_type);

310

311

gemmlowp_output_stage_info.gemmlowp_real_multiplier = multiplier;

312

gemmlowp_output_stage_info.gemmlowp_multiplier = int_multiplier;

313

gemmlowp_output_stage_info.gemmlowp_multipliers = { int_multiplier };

314

gemmlowp_output_stage_info.gemmlowp_shift = shift;

315

gemmlowp_output_stage_info.gemmlowp_shifts = { shift };

316

gemmlowp_output_stage_info.gemmlowp_offset = oq_unif.offset;

317

gemmlowp_output_stage_info.type = type;

318

gemmlowp_output_stage_info.gemmlowp_min_bound = type_min;

319

gemmlowp_output_stage_info.gemmlowp_max_bound = type_max;

return Status{};

}

/** Currently this fixture only tests the following data type configurations:

325

*

326

* 1. a and b are of the same data type

327

* 2. The data type is quantized asymmetric

328

*

329

*/

330

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, GEMMLowpOutputStageType output_stage_type, DataType data_type,

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

331

bool reshape_b_only_on_first_run)

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

332

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

333

ARM_COMPUTE_ASSERT(output_stage_type != GEMMLowpOutputStageType::NONE);

334

ARM_COMPUTE_ASSERT(is_data_type_quantized_asymmetric(data_type));

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

335

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

336

// Randomized dynamic quantization: randomize quantization info in a way that ensures no result saturation

337

// most of the time

338

QuantizationInfo a_qinfo;

339

QuantizationInfo b_qinfo;

340

QuantizationInfo output_qinfo;

341

TensorFillInfo finfo;

342

setup_quantization<TI>(data_type, shape_a, shape_b, a_qinfo, b_qinfo, output_qinfo, finfo);

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

343

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

344

GEMMLowpOutputStageInfo output_stage;

345

init_gemmlowp_output_stage_info(data_type, a_qinfo, b_qinfo, output_qinfo, output_stage_type, output_stage);

346

347

_reference = compute_reference(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, data_type, data_type, output_stage, finfo);

348

_target = compute_target(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, output_qinfo, data_type, data_type, output_stage, reshape_b_only_on_first_run, finfo);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

349

}

350

351

protected:

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

352

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo, const QuantizationInfo& output_qinfo,

353

DataType data_type_a, DataType data_type_b, const GEMMLowpOutputStageInfo& output_stage, bool reshape_b_only_on_first_run = false, const TensorFillInfo& finfo = TensorFillInfo())

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

354

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

355

return compute_gemmlowp_target<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, qasymm8_t, true, run_twice>(shape_a, shape_b, shape_output, a_qinfo,

356

b_qinfo, output_qinfo, data_type_a, data_type_b, output_stage, reshape_b_only_on_first_run, finfo);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

357

}

358

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

359

SimpleTensor<TI> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_output, const QuantizationInfo& a_qinfo, const QuantizationInfo& b_qinfo,

360

DataType data_type_a, DataType data_type_b, const GEMMLowpOutputStageInfo& output_stage, const TensorFillInfo& finfo = TensorFillInfo())

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

361

{

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

362

SimpleTensor<int32_t> output = compute_gemmlowp_reference<reinterpret_input_as_3d, TI, TW, false, false, run_twice>(shape_a, shape_b, shape_output, a_qinfo, b_qinfo, data_type_a, data_type_b, finfo);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

363

364

TensorShape bias_shape(shape_b[0]);

365

SimpleTensor<int32_t> bias{ bias_shape, DataType::S32, 1 };

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

366

(run_twice) ? fill_bias_s32(bias, 5 + finfo.hash, finfo.min_bias, finfo.max_bias) : fill_bias_s32(bias, 2 + finfo.hash, finfo.min_bias, finfo.max_bias); // Fill bias with same seed as last run of gemmlowp_target

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

367

368

switch(output_stage.type)

369

{

370

case GEMMLowpOutputStageType::QUANTIZE_DOWN:

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

371

return reference::gemmlowp_quantize_down_scale<int32_t, TW>(output, bias,

372

output_stage.gemmlowp_offset, output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

373

break;

374

case GEMMLowpOutputStageType::QUANTIZE_DOWN_FIXEDPOINT:

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

375

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, TW>(output, bias,

376

output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_offset, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

377

break;

378

default:

379

ARM_COMPUTE_ERROR("Not Supported!");

}

}

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

383

TensorType _target{};

384

SimpleTensor<TI> _reference{};

George Wort

2019-02-22 16:37:41 +0000

[diff] [blame]

385

};

386

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

387

template <typename TensorType, typename AccessorType, typename FunctionType, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false, typename TI = uint8_t, typename TW = uint8_t>

388

class GEMMLowpMatrixMultiplyCoreFusedOffsetOutputValidationFixture : public

389

GEMMLowpMatrixMultiplyCoreFusedOffsetOutputGenericValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW>

390

{

391

public:

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

392

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_output, GEMMLowpOutputStageType output_stage_type, DataType data_type)

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

393

{

394

GEMMLowpMatrixMultiplyCoreFusedOffsetOutputGenericValidationFixture<TensorType, AccessorType, FunctionType, reinterpret_input_as_3d, reinterpret_output_as_3d, TI, TW>::setup(shape_a, shape_b,

SiCong Li

2023-11-07 12:04:59 +0000

[diff] [blame^]

395

shape_output, output_stage_type, data_type, false /* reshape_b_only_on_first_run */);

Giorgio Arena

2021-06-09 15:23:06 +0100

[diff] [blame]

}

};

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

399

template <typename TensorType, typename AccessorType, typename FunctionType>

400

class GEMMLowpQuantizeDownInt32ToUint8ScaleValidationFixture : public framework::Fixture

401

{

402

public:

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

403

void setup(TensorShape shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

404

{

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

405

_target = compute_target(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

406

_reference = compute_reference(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

}

protected:

template <typename U>

411

void fill(U &&tensor, int i)

412

{

413

std::uniform_int_distribution<> distribution(-6000, 6000);

414

library->fill(tensor, distribution, i);

415

}

416

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

417

TensorType compute_target(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

418

{

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

419

TensorShape shape_bias(shape[0]);

420

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

421

// Create tensors

422

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

423

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

424

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8, 1);

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

425

426

// Create and configure function

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

427

FunctionType output_stage;

428

GEMMLowpOutputStageInfo output_stage_info = GEMMLowpOutputStageInfo();

429

output_stage_info.type = GEMMLowpOutputStageType::QUANTIZE_DOWN;

430

output_stage_info.gemmlowp_offset = result_offset;

431

output_stage_info.gemmlowp_multiplier = result_mult_int;

432

output_stage_info.gemmlowp_shift = result_shift;

433

output_stage_info.gemmlowp_min_bound = min;

434

output_stage_info.gemmlowp_max_bound = max;

435

output_stage_info.output_data_type = DataType::QASYMM8;

436

output_stage.configure(&a, add_bias ? &b : nullptr, &c, output_stage_info);

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

437

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

438

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

439

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

440

441

// Allocate tensors

442

a.allocator()->allocate();

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

443

c.allocator()->allocate();

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

444

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

445

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

446

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

447

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

448

// Fill tensor

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

449

fill(AccessorType(a), 0);

450

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

451

if(add_bias)

452

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

453

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

454

455

// Allocate bias tensor

456

b.allocator()->allocate();

457

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

458

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

459

460

// Fill tensor

461

fill(AccessorType(b), 1);

462

}

463

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

464

// Compute GEMM function

465

output_stage.run();

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

466

return c;

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

467

}

468

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

469

SimpleTensor<uint8_t> compute_reference(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

470

{

471

// Create reference

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

472

TensorShape shape_bias(shape[0]);

473

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

474

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

475

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

// Fill reference

fill(a, 0);

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

480

const std::vector<int32_t> result_mult_int_vec = { result_mult_int };

481

const std::vector<int32_t> result_shift_vec = { result_shift };

482

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

if(add_bias)

{

// Fill bias

fill(b, 1);

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

488

return reference::gemmlowp_quantize_down_scale<int32_t, uint8_t>(a, b, result_offset, result_mult_int_vec, result_shift_vec, min, max);

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

489

}

490

else

491

{

Manuel Bottini

2019-12-02 16:22:35 +0000

[diff] [blame]

492

return reference::gemmlowp_quantize_down_scale<int32_t, uint8_t>(a, result_offset, result_mult_int_vec, result_shift_vec, min, max);

Gian Marco

2017-11-17 09:27:57 +0000

[diff] [blame]

493

}

Gian Marco

2017-11-08 12:24:09 +0000

[diff] [blame]

494

}

495

496

TensorType _target{};

497

SimpleTensor<uint8_t> _reference{};

498

};

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

499

500

template <typename TensorType, typename AccessorType, typename FunctionType>

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

501

class GEMMLowpQuantizeDownInt32ToInt8ScaleValidationFixture : public framework::Fixture

502

{

503

public:

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

504

void setup(TensorShape shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

505

{

506

_target = compute_target(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

507

_reference = compute_reference(shape, result_offset, result_mult_int, result_shift, min, max, add_bias);

}

protected:

template <typename U>

512

void fill(U &&tensor, int i)

513

{

514

std::uniform_int_distribution<> distribution(-6000, 6000);

515

library->fill(tensor, distribution, i);

516

}

517

518

TensorType compute_target(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

519

{

520

TensorShape shape_bias(shape[0]);

521

522

// Create tensors

523

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

524

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

525

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8_SIGNED, 1);

526

527

// Create and configure function

528

FunctionType output_stage;

529

GEMMLowpOutputStageInfo output_stage_info = GEMMLowpOutputStageInfo();

530

output_stage_info.type = GEMMLowpOutputStageType::QUANTIZE_DOWN;

531

output_stage_info.gemmlowp_offset = result_offset;

532

output_stage_info.gemmlowp_multiplier = result_mult_int;

533

output_stage_info.gemmlowp_shift = result_shift;

534

output_stage_info.gemmlowp_min_bound = min;

535

output_stage_info.gemmlowp_max_bound = max;

536

output_stage_info.output_data_type = DataType::QASYMM8_SIGNED;

537

output_stage.configure(&a, add_bias ? &b : nullptr, &c, output_stage_info);

538

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

539

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

540

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

541

542

// Allocate tensors

543

a.allocator()->allocate();

544

c.allocator()->allocate();

545

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

546

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

547

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

548

549

// Fill tensor

550

fill(AccessorType(a), 0);

551

552

if(add_bias)

553

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

554

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

555

556

// Allocate bias tensor

557

b.allocator()->allocate();

558

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

559

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Luca Foschiani

2020-02-13 15:07:36 +0000

[diff] [blame]

560

561

// Fill tensor

562

fill(AccessorType(b), 1);

563

}

564

565

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<int8_t> compute_reference(const TensorShape &shape, int32_t result_offset, int32_t result_mult_int, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

571

{

572

// Create reference

573

TensorShape shape_bias(shape[0]);

574

575

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

576

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

const std::vector<int32_t> result_mult_int_vec = { result_mult_int };

582

const std::vector<int32_t> result_shift_vec = { result_shift };

if(add_bias)

{

// Fill bias

fill(b, 1);

return reference::gemmlowp_quantize_down_scale<int32_t, int8_t>(a, b, result_offset, result_mult_int_vec, result_shift_vec, min, max);

}

else

{

return reference::gemmlowp_quantize_down_scale<int32_t, int8_t>(a, result_offset, result_mult_int_vec, result_shift_vec, min, max);

}

}

TensorType _target{};

598

SimpleTensor<int8_t> _reference{};

599

};

600

601

template <typename TensorType, typename AccessorType, typename FunctionType>

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

602

class GEMMLowpQuantizeDownInt32ToInt8ScaleByFixedPointValidationFixture : public framework::Fixture

603

{

604

public:

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

605

void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

606

{

607

_target = compute_target(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

608

_reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

}

protected:

template <typename U>

613

void fill(U &&tensor, int i)

614

{

615

std::uniform_int_distribution<> distribution(-6000, 6000);

616

library->fill(tensor, distribution, i);

617

}

618

619

TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

620

{

621

TensorShape shape_bias(shape[0]);

622

623

// Create tensors

624

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

625

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

626

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8_SIGNED, 1);

627

628

// Create and configure function

629

FunctionType output_stage;

630

output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max);

631

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

632

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

633

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

634

635

// Allocate tensors

636

a.allocator()->allocate();

637

c.allocator()->allocate();

638

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

639

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

640

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

641

642

// Fill tensor

643

fill(AccessorType(a), 0);

644

645

if(add_bias)

646

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

647

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

648

649

// Allocate bias tensor

650

b.allocator()->allocate();

651

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

652

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

653

654

// Fill tensor

655

fill(AccessorType(b), 1);

656

}

657

658

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<int8_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max,

bool add_bias)

{

// Create reference

TensorShape shape_bias(shape[0]);

668

669

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

670

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };

676

const std::vector<int32_t> result_shift_vec = { result_shift };

if(add_bias)

{

// Fill bias

fill(b, 1);

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int8_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

}

else

{

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int8_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

}

}

TensorType _target{};

692

SimpleTensor<int8_t> _reference{};

693

};

694

695

template <typename TensorType, typename AccessorType, typename FunctionType>

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

696

class GEMMLowpQuantizeDownInt32ToUint8ScaleByFixedPointValidationFixture : public framework::Fixture

697

{

698

public:

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

699

void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

700

{

701

_target = compute_target(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

702

_reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max, add_bias);

}

protected:

template <typename U>

707

void fill(U &&tensor, int i)

708

{

709

std::uniform_int_distribution<> distribution(-6000, 6000);

710

library->fill(tensor, distribution, i);

711

}

712

713

TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max, bool add_bias)

714

{

715

TensorShape shape_bias(shape[0]);

716

717

// Create tensors

718

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

719

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

720

TensorType c = create_tensor<TensorType>(shape, DataType::QASYMM8, 1);

721

722

// Create and configure function

723

FunctionType output_stage;

724

output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, result_offset_after_shift, min, max);

725

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

726

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

727

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

728

729

// Allocate tensors

730

a.allocator()->allocate();

731

c.allocator()->allocate();

732

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

733

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

734

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

735

736

// Fill tensor

737

fill(AccessorType(a), 0);

738

739

if(add_bias)

740

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

741

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

742

743

// Allocate bias tensor

744

b.allocator()->allocate();

745

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

746

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

747

748

// Fill tensor

749

fill(AccessorType(b), 1);

750

}

751

752

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<uint8_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t result_offset_after_shift, int32_t min, int32_t max,

bool add_bias)

{

// Create reference

TensorShape shape_bias(shape[0]);

762

763

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

764

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

769

const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };

770

const std::vector<int32_t> result_shift_vec = { result_shift };

771

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

if(add_bias)

{

// Fill bias

fill(b, 1);

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

777

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, uint8_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

778

}

779

else

780

{

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

781

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, uint8_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, result_offset_after_shift, min, max);

Gian Marco

2017-11-28 09:10:03 +0000

[diff] [blame]

}

}

TensorType _target{};

786

SimpleTensor<uint8_t> _reference{};

787

};

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

788

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

789

template <typename TensorType, typename AccessorType, typename FunctionType, typename T>

790

class GEMMLowpQuantizeDownInt32ScaleByFloatValidationFixture : public framework::Fixture

791

{

792

public:

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

793

void setup(DataType data_type, TensorShape shape, float result_real_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)

794

{

795

_target = compute_target(data_type, shape, result_real_multiplier, result_offset, min, max, add_bias);

796

_reference = compute_reference(shape, result_real_multiplier, result_offset, min, max, add_bias);

}

protected:

template <typename U>

801

void fill(U &&tensor, int i)

802

{

803

// To avoid data all being clampped

804

std::uniform_int_distribution<> distribution(-500, 500);

805

library->fill(tensor, distribution, i);

806

}

807

808

TensorType compute_target(DataType data_type, const TensorShape &shape, float result_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)

809

{

810

TensorShape shape_bias(shape[0]);

811

812

// Create tensors

813

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

814

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

815

TensorType c = create_tensor<TensorType>(shape, data_type, 1);

816

817

// create output stage info

818

GEMMLowpOutputStageInfo info;

819

info.gemmlowp_max_bound = max;

820

info.gemmlowp_min_bound = min;

821

info.gemmlowp_real_multiplier = result_multiplier;

822

info.gemmlowp_offset = result_offset;

823

info.type = GEMMLowpOutputStageType::QUANTIZE_DOWN_FLOAT;

824

info.output_data_type = data_type;

825

826

// Create and configure function

827

FunctionType output_stage;

828

output_stage.configure(&a, add_bias ? &b : nullptr, &c, info);

829

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

830

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

831

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

832

833

// Allocate tensors

834

a.allocator()->allocate();

835

c.allocator()->allocate();

836

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

837

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

838

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

839

840

// Fill tensor

841

fill(AccessorType(a), 0);

842

843

if(add_bias)

844

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

845

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

846

847

// Allocate bias tensor

848

b.allocator()->allocate();

849

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

850

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Sheri Zhang

2020-03-09 14:29:52 +0000

[diff] [blame]

851

852

// Fill tensor

853

fill(AccessorType(b), 1);

854

}

855

856

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<T> compute_reference(const TensorShape &shape, float_t result_real_multiplier, int32_t result_offset, int32_t min, int32_t max, bool add_bias)

862

{

863

// Create reference

864

TensorShape shape_bias(shape[0]);

865

866

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

867

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

const std::vector<float_t> result_float_multiplier_vec = { result_real_multiplier };

if(add_bias)

{

// Fill bias

fill(b, 1);

return reference::gemmlowp_quantize_down_scale_by_float<int32_t, T>(a, b, result_float_multiplier_vec, result_offset, min, max);

}

else

{

return reference::gemmlowp_quantize_down_scale_by_float<int32_t, T>(a, result_float_multiplier_vec, result_offset, min, max);

}

}

TensorType _target{};

888

SimpleTensor<T> _reference{};

889

};

890

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

891

template <typename TensorType, typename AccessorType, typename FunctionType>

892

class GEMMLowpQuantizeDownInt32ToInt16ScaleByFixedPointValidationFixture : public framework::Fixture

893

{

894

public:

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

895

void setup(TensorShape shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

896

{

897

_target = compute_target(shape, result_fixedpoint_multiplier, result_shift, min, max, add_bias);

898

_reference = compute_reference(shape, result_fixedpoint_multiplier, result_shift, min, max, add_bias);

}

protected:

template <typename U>

903

void fill(U &&tensor, int i)

904

{

905

std::uniform_int_distribution<> distribution(-6000, 6000);

906

library->fill(tensor, distribution, i);

907

}

908

909

TensorType compute_target(const TensorShape &shape, int32_t result_fixedpoint_multiplier, int32_t result_shift, int32_t min, int32_t max, bool add_bias)

910

{

911

TensorShape shape_bias(shape[0]);

912

913

// Create tensors

914

TensorType a = create_tensor<TensorType>(shape, DataType::S32, 1);

915

TensorType b = create_tensor<TensorType>(shape_bias, DataType::S32, 1);

916

TensorType c = create_tensor<TensorType>(shape, DataType::QSYMM16, 1);

917

918

// Create and configure function

919

FunctionType output_stage;

920

output_stage.configure(&a, add_bias ? &b : nullptr, &c, result_fixedpoint_multiplier, result_shift, min, max);

921

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

922

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

923

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

924

925

// Allocate tensors

926

a.allocator()->allocate();

927

c.allocator()->allocate();

928

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

929

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

930

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

931

932

// Fill tensor

933

fill(AccessorType(a), 0);

934

935

if(add_bias)

936

{

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

937

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

938

939

// Allocate bias tensor

940

b.allocator()->allocate();

941

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

942

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

943

944

// Fill tensor

945

fill(AccessorType(b), 1);

946

}

947

948

// Compute GEMM function

output_stage.run();

return c;

}

SimpleTensor<int16_t> compute_reference(const TensorShape &shape, int32_t result_fixed_point_multiplier, int32_t result_shift, int32_t min, int32_t max,

bool add_bias)

{

// Create reference

TensorShape shape_bias(shape[0]);

958

959

SimpleTensor<int32_t> a{ shape, DataType::S32, 1 };

960

SimpleTensor<int32_t> b{ shape_bias, DataType::S32, 1 };

// Fill reference

fill(a, 0);

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

965

const std::vector<int32_t> result_fixed_point_multiplier_vec = { result_fixed_point_multiplier };

966

const std::vector<int32_t> result_shift_vec = { result_shift };

967

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

if(add_bias)

{

// Fill bias

fill(b, 1);

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

973

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int16_t>(a, b, result_fixed_point_multiplier_vec, result_shift_vec, 0, min, max);

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

974

}

975

else

976

{

Georgios Pinitas

2019-11-21 14:10:25 +0000

[diff] [blame]

977

return reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, int16_t>(a, result_fixed_point_multiplier_vec, result_shift_vec, 0, min, max);

Gian Marco Iodice

2019-06-13 15:58:32 +0100

[diff] [blame]

}

}

TensorType _target{};

982

SimpleTensor<int16_t> _reference{};

983

};

984

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

985

template <typename TensorType, typename AccessorType, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

986

class GEMMLowpMatrixMultiplyReshapedValidationFixture : public framework::Fixture

987

{

988

public:

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

989

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

990

bool interleave_rhs, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

991

{

992

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

997

lhs_info.transpose = false;

998

999

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1004

rhs_info.transpose = true;

1005

1006

// Set the tensor shapes for LHS and RHS matrices

1007

const TensorShape lhs_shape(k, m, batch_size);

1008

const TensorShape rhs_shape(n, k, batch_size);

1009

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1010

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);

1011

_reference = compute_reference(lhs_shape, rhs_shape, data_type);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

}

protected:

template <typename U>

1016

void fill(U &&tensor, int i)

1017

{

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1018

switch(tensor.data_type())

1019

{

1020

case DataType::QASYMM8:

1021

{

1022

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1023

std::uniform_int_distribution<> distribution(1, 254);

1024

library->fill(tensor, distribution, i);

1025

}

1026

break;

1027

case DataType::QASYMM8_SIGNED:

1028

{

1029

std::uniform_int_distribution<> distribution(-127, 126);

1030

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1035

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1036

}

1037

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1038

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1039

{

1040

// Create tensors

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1041

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1042

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1043

TensorType lhs_reshaped;

1044

TensorType rhs_reshaped;

1045

TensorType dst;

1046

1047

const unsigned int M = lhs_shape[1];

1048

const unsigned int N = rhs_shape[0];

1049

const unsigned int K = lhs_shape[0];

1050

1051

// The output tensor will be auto-initialized within the function

1052

1053

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1054

ReshapeLHSOperatorType reshape_lhs;

1055

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1056

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1057

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1058

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1059

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K));

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1060

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1061

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1062

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1063

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1064

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &dst });

1065

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1066

// Allocate tensors

1067

lhs.allocator()->allocate();

1068

rhs.allocator()->allocate();

1069

lhs_reshaped.allocator()->allocate();

1070

rhs_reshaped.allocator()->allocate();

1071

dst.allocator()->allocate();

1072

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1073

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1074

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1075

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1076

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1077

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1078

1079

// Fill tensors

1080

fill(AccessorType(lhs), 0);

1081

fill(AccessorType(rhs), 1);

1082

1083

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1084

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1085

reshape_lhs.run(reshape_lhs_pack);

1086

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1087

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1088

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1089

gemm.run(gemm_pack);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

return dst;

}

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1094

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1095

{

1096

TensorShape dst_shape = lhs_shape;

1097

dst_shape[0] = rhs_shape[0];

1098

dst_shape[1] = lhs_shape[1];

1099

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1100

switch(data_type)

1101

{

1102

case DataType::QASYMM8:

1103

{

1104

// Create reference

1105

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1106

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1107

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1108

// Fill reference

1109

fill(lhs, 0);

1110

fill(rhs, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1111

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1112

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

1113

}

1114

case DataType::QASYMM8_SIGNED:

1115

{

1116

// Create reference

1117

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1118

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1125

}

1126

default:

1127

ARM_COMPUTE_ERROR("Unsupported data type");

1128

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1129

}

1130

1131

TensorType _target{};

1132

SimpleTensor<int32_t> _reference{};

1133

};

1134

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1135

template <typename TensorType, typename AccessorType, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1136

class GEMMLowpMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

1137

{

1138

public:

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1139

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1140

bool interleave_lhs, bool interleave_rhs, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1141

{

1142

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

1147

lhs_info.transpose = false;

1148

1149

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1154

rhs_info.transpose = true;

1155

1156

// In case of GEMM3D, m is the product between m_w and m_h

1157

const unsigned int m = m_w * m_h;

1158

1159

// Set the tensor shapes for LHS and RHS matrices

1160

const TensorShape lhs_shape(k, m, batch_size);

1161

const TensorShape rhs_shape(n, k, batch_size);

1162

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1163

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h, data_type);

1164

_reference = compute_reference(lhs_shape, rhs_shape, m_h, data_type);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

}

protected:

template <typename U>

1169

void fill(U &&tensor, int i)

1170

{

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1171

switch(tensor.data_type())

1172

{

1173

case DataType::QASYMM8:

1174

{

1175

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1176

std::uniform_int_distribution<> distribution(1, 254);

1177

library->fill(tensor, distribution, i);

1178

}

1179

break;

1180

case DataType::QASYMM8_SIGNED:

1181

{

1182

std::uniform_int_distribution<> distribution(-127, 126);

1183

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1188

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1189

}

1190

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1191

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h,

1192

DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1193

{

1194

// Create tensors

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1195

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1196

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1197

TensorType lhs_reshaped;

1198

TensorType rhs_reshaped;

1199

TensorType dst;

1200

1201

const unsigned int M = lhs_shape[1];

1202

const unsigned int N = rhs_shape[0];

1203

const unsigned int K = lhs_shape[0];

1204

1205

// The output tensor will be auto-initialized within the function

1206

1207

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1208

ReshapeLHSOperatorType reshape_lhs;

1209

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1210

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1211

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1212

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1213

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K, 1, 1, m_h));

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1214

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1215

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1216

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1217

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1218

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &dst });

1219

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1220

// Allocate tensors

1221

lhs.allocator()->allocate();

1222

rhs.allocator()->allocate();

1223

lhs_reshaped.allocator()->allocate();

1224

rhs_reshaped.allocator()->allocate();

1225

dst.allocator()->allocate();

1226

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1227

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1228

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1229

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1230

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1231

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1232

1233

// Fill tensors

1234

fill(AccessorType(lhs), 0);

1235

fill(AccessorType(rhs), 1);

1236

1237

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1238

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1239

reshape_lhs.run(reshape_lhs_pack);

1240

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1241

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1242

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1243

gemm.run(gemm_pack);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

return dst;

}

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1248

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h, DataType data_type)

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1249

{

1250

TensorShape dst_shape = lhs_shape;

1251

dst_shape.set(0, rhs_shape[0]);

1252

dst_shape.set(1, lhs_shape[1] / m_h);

1253

dst_shape.set(2, m_h);

1254

dst_shape.set(3, lhs_shape[2]);

1255

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1256

switch(data_type)

1257

{

1258

case DataType::QASYMM8:

1259

{

1260

// Create reference

1261

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1262

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1263

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1264

// Fill reference

1265

fill(lhs, 0);

1266

fill(rhs, 1);

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1267

Sheri Zhang

2020-02-25 14:13:54 +0000

[diff] [blame]

1268

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

1269

}

1270

case DataType::QASYMM8_SIGNED:

1271

{

1272

// Create reference

1273

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1274

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1281

}

1282

default:

1283

ARM_COMPUTE_ERROR("Unsupported data type");

1284

}

Gian Marco Iodice

2019-01-17 09:47:04 +0000

[diff] [blame]

1285

}

1286

1287

TensorType _target{};

1288

SimpleTensor<int32_t> _reference{};

1289

};

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1290

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1291

template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1292

class GEMMLowpMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1293

{

1294

public:

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1295

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1296

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1297

{

1298

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1307

rhs_info.transpose = transpose_rhs;

1308

1309

// Set the tensor shapes for LHS and RHS matrices

1310

const TensorShape lhs_shape(k, m, batch_size);

1311

const TensorShape rhs_shape(n, k, batch_size);

1312

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1313

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);

1314

_reference = compute_reference(lhs_shape, rhs_shape, data_type);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

}

protected:

template <typename U>

1319

void fill(U &&tensor, int i)

1320

{

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1321

switch(tensor.data_type())

1322

{

1323

case DataType::QASYMM8:

1324

{

1325

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1326

std::uniform_int_distribution<> distribution(1, 254);

1327

library->fill(tensor, distribution, i);

1328

}

1329

break;

1330

case DataType::QASYMM8_SIGNED:

1331

{

1332

std::uniform_int_distribution<> distribution(-127, 126);

1333

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1338

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1339

}

1340

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1341

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,

1342

const GEMMRHSMatrixInfo &rhs_info, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1343

{

1344

// Create tensors

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1345

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1346

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1347

TensorType rhs_reshaped;

1348

TensorType dst;

1349

1350

const unsigned int M = lhs_shape[1];

1351

const unsigned int N = rhs_shape[0];

1352

const unsigned int K = lhs_shape[0];

1353

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

1354

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.lhs_info = lhs_info;

1359

gemm_info.rhs_info = rhs_info;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1360

// The output tensor will be auto-initialized within the function

1361

1362

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1363

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1364

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1365

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1366

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1367

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1368

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1369

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1370

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1371

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &dst });

1372

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1373

// Allocate tensors

1374

lhs.allocator()->allocate();

1375

rhs.allocator()->allocate();

1376

rhs_reshaped.allocator()->allocate();

1377

dst.allocator()->allocate();

1378

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1379

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1380

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1381

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1382

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1383

1384

// Fill tensors

1385

fill(AccessorType(lhs), 0);

1386

fill(AccessorType(rhs), 1);

1387

1388

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1389

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1390

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1391

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1392

gemm.run(gemm_pack);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

return dst;

}

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1397

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1398

{

1399

TensorShape dst_shape = lhs_shape;

1400

dst_shape[0] = rhs_shape[0];

1401

dst_shape[1] = lhs_shape[1];

1402

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1403

if(data_type == DataType::QASYMM8)

1404

{

1405

// Create reference

1406

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1407

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1408

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1409

// Fill reference

1410

fill(lhs, 0);

1411

fill(rhs, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1412

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1413

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

}

else

{

// Create reference

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1419

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1426

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1427

}

1428

1429

TensorType _target{};

1430

SimpleTensor<int32_t> _reference{};

1431

};

1432

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1433

template <typename T, typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType, typename ReduceOperation, typename CastOperation>

1434

class GEMMLowpMatrixMultiplyReshapedOnlyRHSMMULOutputStageValidationFixture : public framework::Fixture

1435

{

1436

public:

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1437

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1438

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, bool broadcast_bias, DataType data_type)

1439

{

1440

GEMMLowpOutputStageInfo output_stage;

1441

output_stage.type = GEMMLowpOutputStageType::QUANTIZE_DOWN_FIXEDPOINT;

1442

output_stage.output_data_type = data_type;

1443

output_stage.gemmlowp_multipliers = std::vector<int32_t> { 1 };

1444

output_stage.gemmlowp_shifts = std::vector<int32_t> { 1 };

1445

output_stage.gemmlowp_multipliers[0] = 1;

1446

output_stage.gemmlowp_shifts[0] = 1;

1447

output_stage.gemmlowp_offset = 0;

1448

constexpr float scale = 0.001f;

1449

quantization::calculate_quantized_multiplier(scale, &output_stage.gemmlowp_multipliers[0], &output_stage.gemmlowp_shifts[0]);

1450

output_stage.gemmlowp_min_bound = -100;

1451

output_stage.gemmlowp_max_bound = 100;

1452

1453

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1462

rhs_info.transpose = transpose_rhs;

int a_offset = 1;

int b_offset = 1;

// Set the tensor shapes for LHS and RHS matrices

1468

const TensorShape lhs_shape(k, m, batch_size);

1469

const TensorShape rhs_shape(n, k, batch_size);

1470

const TensorShape bias_shape(n,

1471

broadcast_bias ? 1 : m,

1472

broadcast_bias ? 1 : batch_size);

1473

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

1474

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, output_stage, a_offset, b_offset);

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1475

if(gemm_validated == true)

1476

{

1477

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, output_stage, a_offset, b_offset);

}

}

protected:

template <typename U>

1483

void fill(U &&tensor, int i)

1484

{

1485

switch(tensor.data_type())

1486

{

1487

case DataType::QASYMM8:

1488

{

1489

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1490

std::uniform_int_distribution<> distribution(1, 254);

1491

library->fill(tensor, distribution, i);

1492

}

1493

break;

1494

case DataType::QASYMM8_SIGNED:

1495

{

1496

std::uniform_int_distribution<> distribution(-127, 126);

1497

library->fill(tensor, distribution, i);

}

break;

case DataType::S32:

{

std::uniform_int_distribution<> distribution(-10000, 10000);

1503

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

}

}

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info,

1512

const GEMMRHSMatrixInfo &rhs_info, DataType data_type, GEMMLowpOutputStageInfo output_stage, const int a_offset, const int b_offset)

1513

{

1514

// Create tensors

1515

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, a_offset));

1516

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, b_offset));

1517

TensorType bias = create_tensor<TensorType>(bias_shape, DataType::S32, 1);

1518

TensorType dst;

1519

TensorType rhs_reshaped;

1520

1521

const unsigned int M = lhs_shape[1];

1522

const unsigned int N = rhs_shape[0];

1523

const unsigned int K = lhs_shape[0];

1524

1525

// Tensors for precomputing sum of lhs rows / rhs columns

1526

TensorType vec_sum_rows = create_tensor<TensorType>(TensorShape(M, 1, lhs_shape[2]), DataType::S32, 1);

1527

TensorType vec_sum_cols = create_tensor<TensorType>(TensorShape(N, 1, rhs_shape[2]), DataType::S32, 1);

1528

1529

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.lhs_info = lhs_info;

1534

gemm_info.rhs_info = rhs_info;

1535

gemm_info.output_stage = output_stage;

1536

gemm_info.a_offset = a_offset;

1537

gemm_info.b_offset = b_offset;

1538

// The output tensor will be auto-initialized within the function

1539

1540

// Create and configure function

1541

ReshapeRHSOperatorType reshape_rhs;

1542

GEMMFunctionType gemm;

1543

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1544

1545

// If GEMM is not validated, do not try to run. The validation will check

1546

// if the technology supports this extension. If not, the test will be skipped.

1547

// If it supports, the test will fail anyway because target and reference

1548

// will not match.

1549

gemm_validated = bool(gemm.validate(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, vec_sum_cols.info(), vec_sum_rows.info(), bias.info()));

1550

if(gemm_validated == true)

1551

{

1552

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, vec_sum_cols.info(), vec_sum_rows.info(), bias.info());

1553

1554

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1555

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1556

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1557

1558

// Allocate tensors

1559

lhs.allocator()->allocate();

1560

rhs.allocator()->allocate();

1561

rhs_reshaped.allocator()->allocate();

1562

bias.allocator()->allocate();

1563

vec_sum_cols.allocator()->allocate();

1564

vec_sum_rows.allocator()->allocate();

1565

dst.allocator()->allocate();

1566

1567

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1568

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1569

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1570

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1571

ARM_COMPUTE_ASSERT(!vec_sum_cols.info()->is_resizable());

1572

ARM_COMPUTE_ASSERT(!vec_sum_rows.info()->is_resizable());

1573

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1574

1575

// Fill tensors

1576

fill(AccessorType(lhs), 0);

1577

fill(AccessorType(rhs), 1);

1578

fill(AccessorType(bias), 2);

1579

1580

TensorType lhs_32 = create_tensor<TensorType>(lhs_shape, DataType::S32, 1);

1581

TensorType rhs_32 = create_tensor<TensorType>(rhs_shape, DataType::S32, 1);

1582

CastOperation cast_lhs;

1583

CastOperation cast_rhs;

1584

cast_lhs.configure(&lhs, &lhs_32, ConvertPolicy::SATURATE);

1585

cast_rhs.configure(&rhs, &rhs_32, ConvertPolicy::SATURATE);

1586

lhs_32.allocator()->allocate();

1587

rhs_32.allocator()->allocate();

cast_lhs.run();

cast_rhs.run();

ReduceOperation lhs_sum_rows;

1592

ReduceOperation rhs_sum_cols;

1593

1594

lhs_sum_rows.configure(&lhs_32, &vec_sum_rows, 0, ReductionOperation::SUM, false);

1595

rhs_sum_cols.configure(&rhs_32, &vec_sum_cols, 1, ReductionOperation::SUM);

lhs_sum_rows.run();

rhs_sum_cols.run();

// Compute GEMM

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1602

reshape_rhs.run(reshape_rhs_pack);

1603

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_SRC_2, &bias }, { ACL_DST, &dst }, { ACL_VEC_COL_SUM, &vec_sum_cols }, { ACL_VEC_ROW_SUM, &vec_sum_rows } });

gemm.run(gemm_pack);

}

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, GEMMLowpOutputStageInfo output_stage,

1611

const int a_offset, const int b_offset)

1612

{

1613

TensorShape dst_shape = lhs_shape;

1614

dst_shape[0] = rhs_shape[0];

1615

dst_shape[1] = lhs_shape[1];

1616

1617

// Create reference

1618

SimpleTensor<T> lhs{ lhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, a_offset) };

1619

SimpleTensor<T> rhs{ rhs_shape, data_type, 1, QuantizationInfo(1.0f / 255, b_offset) };

1620

SimpleTensor<int32_t> bias{ bias_shape, DataType::S32, 1 };

1621

SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };

1622

SimpleTensor<T> dst_final{ dst_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

dst = reference::gemmlowp_matrix_multiply_core<int32_t, T>(lhs, rhs, dst_shape, a_offset, b_offset);

1630

dst_final = reference::gemmlowp_quantize_down_scale_by_fixedpoint<int32_t, T>(dst, bias,

1631

output_stage.gemmlowp_multipliers, output_stage.gemmlowp_shifts, output_stage.gemmlowp_offset, output_stage.gemmlowp_min_bound, output_stage.gemmlowp_max_bound);

return dst_final;

}

bool gemm_validated = true;

1636

TensorType _target{};

1637

SimpleTensor<T> _reference{};

1638

};

1639

1640

template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

1641

class GEMMLowpMatrixMultiplyReshapedOnlyRHSMMULValidationFixture : public framework::Fixture

1642

{

1643

public:

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1644

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1645

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)

1646

{

1647

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1656

rhs_info.transpose = transpose_rhs;

1657

1658

// Set the tensor shapes for LHS and RHS matrices

1659

const TensorShape lhs_shape(k, m, batch_size);

1660

const TensorShape rhs_shape(n, k, batch_size);

1661

Ramy Elgammal

2022-09-08 11:30:08 +0100

[diff] [blame]

1662

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, data_type);

Freddie Liardet

2022-05-16 14:09:10 +0100

[diff] [blame]

1663

if(gemm_validated == true)

1664

{

1665

_reference = compute_reference(lhs_shape, rhs_shape, data_type);

}

}

protected:

template <typename U>

1671

void fill(U &&tensor, int i)

1672

{

1673

switch(tensor.data_type())

1674

{

1675

case DataType::QASYMM8:

1676

{

1677

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1678

std::uniform_int_distribution<> distribution(1, 254);

1679

library->fill(tensor, distribution, i);

1680

}

1681

break;

1682

case DataType::QASYMM8_SIGNED:

1683

{

1684

std::uniform_int_distribution<> distribution(-127, 126);

1685

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

}

}

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,

1694

const GEMMRHSMatrixInfo &rhs_info, DataType data_type)

1695

{

1696

// Create tensors

1697

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1698

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1699

TensorType rhs_reshaped;

1700

TensorType dst;

1701

1702

const unsigned int M = lhs_shape[1];

1703

const unsigned int N = rhs_shape[0];

1704

const unsigned int K = lhs_shape[0];

1705

1706

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.lhs_info = lhs_info;

1711

gemm_info.rhs_info = rhs_info;

1712

// The output tensor will be auto-initialized within the function

1713

1714

// Create and configure function

1715

ReshapeRHSOperatorType reshape_rhs;

1716

GEMMFunctionType gemm;

1717

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1718

1719

// If GEMM is not validated, do not try to run. The validation will check

1720

// if the technology supports this extension. If not, the test will be skipped.

1721

// If it supports, the test will fail anyway because target and reference

1722

// will not match.

1723

gemm_validated = bool(gemm.validate(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, nullptr, nullptr, nullptr));

1724

if(gemm_validated == true)

1725

{

1726

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info, nullptr, nullptr, nullptr);

1727

1728

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1729

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1730

1731

// Allocate tensors

1732

lhs.allocator()->allocate();

1733

rhs.allocator()->allocate();

1734

rhs_reshaped.allocator()->allocate();

1735

dst.allocator()->allocate();

1736

1737

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1738

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1739

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1740

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1741

1742

// Fill tensors

1743

fill(AccessorType(lhs), 0);

1744

fill(AccessorType(rhs), 1);

1745

1746

// Compute GEMM

1747

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1748

reshape_rhs.run(reshape_rhs_pack);

1749

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

gemm.run(gemm_pack);

}

return dst;

}

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type)

1757

{

1758

TensorShape dst_shape = lhs_shape;

1759

dst_shape[0] = rhs_shape[0];

1760

dst_shape[1] = lhs_shape[1];

1761

1762

if(data_type == DataType::QASYMM8)

1763

{

1764

// Create reference

1765

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1766

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

1767

SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

}

else

{

// Create reference

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1779

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

1780

SimpleTensor<int32_t> dst{ dst_shape, DataType::S32, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

}

}

bool gemm_validated = true;

1791

TensorType _target{};

1792

SimpleTensor<int32_t> _reference{};

1793

};

1794

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1795

template <typename TensorType, typename AccessorType, typename ReshapeRHSOperatorType, typename GEMMFunctionType>

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1796

class GEMMLowpMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1797

{

1798

public:

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1799

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0,

1800

unsigned int k0, unsigned int h0, bool interleave_rhs, bool transpose_rhs, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1801

{

1802

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1811

rhs_info.transpose = transpose_rhs;

1812

1813

// In case of GEMM3D, m is the product between m_w and m_h

1814

const unsigned int m = m_w * m_h;

1815

1816

// Set the tensor shapes for LHS and RHS matrices

1817

const TensorShape lhs_shape(k, m, batch_size);

1818

const TensorShape rhs_shape(n, k, batch_size);

1819

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1820

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h, data_type);

1821

_reference = compute_reference(lhs_shape, rhs_shape, m_h, data_type);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

}

protected:

template <typename U>

1826

void fill(U &&tensor, int i)

1827

{

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1828

switch(tensor.data_type())

1829

{

1830

case DataType::QASYMM8:

1831

{

1832

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1833

std::uniform_int_distribution<> distribution(1, 254);

1834

library->fill(tensor, distribution, i);

1835

}

1836

break;

1837

case DataType::QASYMM8_SIGNED:

1838

{

1839

std::uniform_int_distribution<> distribution(-127, 126);

1840

library->fill(tensor, distribution, i);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported data type");

1845

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1846

}

1847

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1848

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info,

1849

const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1850

{

1851

// Create tensors

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1852

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1853

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1854

TensorType rhs_reshaped;

1855

TensorType dst;

1856

1857

const unsigned int M = lhs_shape[1];

1858

const unsigned int N = rhs_shape[0];

1859

const unsigned int K = lhs_shape[0];

1860

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

1861

GEMMKernelInfo gemm_info;

gemm_info.m = M;

gemm_info.n = N;

gemm_info.k = K;

gemm_info.depth_output_gemm3d = m_h;

1866

gemm_info.lhs_info = lhs_info;

1867

gemm_info.rhs_info = rhs_info;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1868

// The output tensor will be auto-initialized within the function

1869

1870

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1871

ReshapeRHSOperatorType reshape_rhs;

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1872

GEMMFunctionType gemm;

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1873

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1874

gemm.configure(lhs.info(), rhs_reshaped.info(), dst.info(), gemm_info);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1875

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1876

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1877

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1878

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1879

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &dst });

1880

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1881

// Allocate tensors

1882

lhs.allocator()->allocate();

1883

rhs.allocator()->allocate();

1884

rhs_reshaped.allocator()->allocate();

1885

dst.allocator()->allocate();

1886

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1887

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1888

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1889

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1890

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1891

1892

// Fill tensors

1893

fill(AccessorType(lhs), 0);

1894

fill(AccessorType(rhs), 1);

1895

1896

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1897

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1898

reshape_rhs.run(reshape_rhs_pack);

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1899

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs_reshaped }, { ACL_DST, &dst } });

1900

gemm.run(gemm_pack);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

return dst;

}

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1905

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h, DataType data_type)

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1906

{

1907

TensorShape dst_shape = lhs_shape;

1908

dst_shape.set(0, rhs_shape[0]);

1909

dst_shape.set(1, lhs_shape[1] / m_h);

1910

dst_shape.set(2, m_h);

1911

dst_shape.set(3, lhs_shape[2]);

1912

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1913

if(data_type == DataType::QASYMM8)

1914

{

1915

// Create reference

1916

SimpleTensor<uint8_t> lhs{ lhs_shape, data_type, 1 };

1917

SimpleTensor<uint8_t> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1918

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1919

// Fill reference

1920

fill(lhs, 0);

1921

fill(rhs, 1);

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1922

Michele Di Giorgio

2019-11-27 16:17:30 +0000

[diff] [blame]

1923

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

}

else

{

// Create reference

SimpleTensor<int8_t> lhs{ lhs_shape, data_type, 1 };

1929

SimpleTensor<int8_t> rhs{ rhs_shape, data_type, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, int8_t>(lhs, rhs, dst_shape, 0, 0);

1936

}

Gian Marco Iodice

2019-03-11 16:07:12 +0000

[diff] [blame]

1937

}

1938

1939

TensorType _target{};

1940

SimpleTensor<int32_t> _reference{};

1941

};

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

1942

1943

template <typename TensorType, typename AccessorType, typename GEMMFunctionType>

1944

class GEMMLowpMatrixMultiplyNativeValidationFixture : public framework::Fixture

1945

{

1946

public:

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

1947

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0)

1948

{

1949

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1958

const TensorShape lhs_shape(k, m, batch_size);

1959

const TensorShape rhs_shape(n, k, batch_size);

1960

1961

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info);

1962

_reference = compute_reference(lhs_shape, rhs_shape);

}

protected:

template <typename U>

1967

void fill(U &&tensor, int i)

1968

{

1969

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

1970

std::uniform_int_distribution<> distribution(1, 254);

1971

library->fill(tensor, distribution, i);

1972

}

1973

1974

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info)

1975

{

1976

// Create tensors

1977

TensorType lhs = create_tensor<TensorType>(lhs_shape, DataType::QASYMM8, 1);

1978

TensorType rhs = create_tensor<TensorType>(rhs_shape, DataType::QASYMM8, 1);

1979

TensorType dst;

1980

1981

const unsigned int M = lhs_shape[1];

1982

const unsigned int N = rhs_shape[0];

1983

const unsigned int K = lhs_shape[0];

1984

1985

// The output tensor will be auto-initialized within the function

1986

1987

// Create and configure function

1988

GEMMFunctionType gemm;

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

1989

gemm.configure(lhs.info(), rhs.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K));

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

1990

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1991

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1992

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

1993

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1994

add_padding_x({ &lhs, &rhs, &dst });

1995

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

1996

// Allocate tensors

1997

lhs.allocator()->allocate();

1998

rhs.allocator()->allocate();

1999

dst.allocator()->allocate();

2000

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2001

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2002

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2003

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2004

2005

// Fill tensors

2006

fill(AccessorType(lhs), 0);

2007

fill(AccessorType(rhs), 1);

2008

2009

// Compute GEMM

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2010

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs }, { ACL_DST, &dst } });

2011

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

return dst;

}

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape)

2017

{

2018

TensorShape dst_shape = lhs_shape;

2019

dst_shape[0] = rhs_shape[0];

2020

dst_shape[1] = lhs_shape[1];

2021

2022

// Create reference

2023

SimpleTensor<uint8_t> lhs{ lhs_shape, DataType::QASYMM8, 1 };

2024

SimpleTensor<uint8_t> rhs{ rhs_shape, DataType::QASYMM8, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

2031

}

2032

2033

TensorType _target{};

2034

SimpleTensor<int32_t> _reference{};

2035

};

2036

2037

template <typename TensorType, typename AccessorType, typename GEMMFunctionType>

2038

class GEMMLowpMatrixMultiplyNative3DValidationFixture : public framework::Fixture

2039

{

2040

public:

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2041

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0)

2042

{

2043

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

2052

const unsigned int m = m_w * m_h;

2053

2054

// Set the tensor shapes for LHS and RHS matrices

2055

const TensorShape lhs_shape(k, m, batch_size);

2056

const TensorShape rhs_shape(n, k, batch_size);

2057

2058

_target = compute_target(lhs_shape, rhs_shape, lhs_info, rhs_info, m_h);

2059

_reference = compute_reference(lhs_shape, rhs_shape, m_h);

}

protected:

template <typename U>

2064

void fill(U &&tensor, int i)

2065

{

2066

// Between 1 and 254 in order to avoid having -128 and 128 for the DOT product path

2067

std::uniform_int_distribution<> distribution(1, 254);

2068

library->fill(tensor, distribution, i);

2069

}

2070

2071

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info, unsigned int m_h)

2072

{

2073

// Create tensors

2074

TensorType lhs = create_tensor<TensorType>(lhs_shape, DataType::QASYMM8, 1);

2075

TensorType rhs = create_tensor<TensorType>(rhs_shape, DataType::QASYMM8, 1);

2076

TensorType dst;

2077

2078

const unsigned int M = lhs_shape[1];

2079

const unsigned int N = rhs_shape[0];

2080

const unsigned int K = lhs_shape[0];

2081

2082

// The output tensor will be auto-initialized within the function

2083

2084

// Create and configure function

2085

GEMMFunctionType gemm;

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2086

gemm.configure(lhs.info(), rhs.info(), dst.info(), lhs_info, rhs_info, GEMMReshapeInfo(M, N, K, 1, 1, m_h));

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2087

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2088

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2089

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2090

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2091

add_padding_x({ &lhs, &rhs, &dst });

2092

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2093

// Allocate tensors

2094

lhs.allocator()->allocate();

2095

rhs.allocator()->allocate();

2096

dst.allocator()->allocate();

2097

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2098

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2099

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2100

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

2101

2102

// Fill tensors

2103

fill(AccessorType(lhs), 0);

2104

fill(AccessorType(rhs), 1);

2105

2106

// Compute GEMM

Georgios Pinitas

2021-06-25 12:13:49 +0100

[diff] [blame]

2107

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs }, { ACL_SRC_1, &rhs }, { ACL_DST, &dst } });

2108

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-03 17:28:17 +0100

[diff] [blame]

return dst;

}

SimpleTensor<int32_t> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, unsigned int m_h)

2114

{

2115

TensorShape dst_shape = lhs_shape;

2116

dst_shape.set(0, rhs_shape[0]);

2117

dst_shape.set(1, lhs_shape[1] / m_h);

2118

dst_shape.set(2, m_h);

2119

dst_shape.set(3, lhs_shape[2]);

2120

2121

// Create reference

2122

SimpleTensor<uint8_t> lhs{ lhs_shape, DataType::QASYMM8, 1 };

2123

SimpleTensor<uint8_t> rhs{ rhs_shape, DataType::QASYMM8, 1 };

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

return reference::gemmlowp_matrix_multiply_core<int32_t, uint8_t>(lhs, rhs, dst_shape, 0, 0);

2130

}

2131

2132

TensorType _target{};

2133

SimpleTensor<int32_t> _reference{};

2134

};

Pablo Tello

2017-09-29 11:30:12 +0100

[diff] [blame]

2135

} // namespace validation

2136

} // namespace test

2137

} // namespace arm_compute

SiCong Li