Blame - tests/validation/CL/GEMMMatrixMultiply.cpp - ml/ComputeLibrary

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, nullptr, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target);

144

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

145

}

146

147

// Unsupported SIZE_T data type

148

{

149

const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 1U), 1, DataType::SIZET);

150

const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 1U), 1, DataType::SIZET);

151

const auto out = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::SIZET);

152

constexpr float alpha = 1.3f;

153

constexpr float beta = 0.7f;

154

const bool is_interleaved_transposed = false;

155

const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, false);

156

const GPUTarget gpu_target = GPUTarget::MIDGARD;

157

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, nullptr, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target);

158

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

159

}

160

161

// Mixed precision with F32

162

{

163

const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 1U), 1, DataType::F32);

164

const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 1U), 1, DataType::F32);

165

const auto out = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F32);

166

constexpr float alpha = 1.3f;

167

constexpr float beta = 0.7f;

168

const bool is_interleaved_transposed = false;

169

const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, false);

170

const GPUTarget gpu_target = GPUTarget::MIDGARD;

171

const bool fp_mixed_precision = true;

172

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, nullptr, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);

173

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

174

}

175

176

// Max number of dimensions LHS matrix

177

{

178

const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 1U, 4U), 1, DataType::F32);

179

const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 1U), 1, DataType::F32);

180

const auto out = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F32);

181

constexpr float alpha = 1.3f;

182

constexpr float beta = 0.7f;

183

const bool is_interleaved_transposed = false;

184

const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, false);

185

const GPUTarget gpu_target = GPUTarget::MIDGARD;

186

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, nullptr, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target);

187

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

188

}

189

190

// Max number of dimensions RHS matrix

191

{

192

const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 4U), 1, DataType::F32);

193

const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 4U), 1, DataType::F32);

194

const auto out = TensorInfo(TensorShape(14U, 12U, 1U, 4U), 1, DataType::F32);

195

constexpr float alpha = 1.3f;

196

constexpr float beta = 0.7f;

197

const bool is_interleaved_transposed = false;

198

const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, false);

199

const GPUTarget gpu_target = GPUTarget::MIDGARD;

200

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, nullptr, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target);

201

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

}

// Broadcast bias
// Negative case: a full 14x12 bias is supplied while the last GEMMReshapeInfo
// argument is true; the check at the end requires validate() to report failure.
{
    const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 1U), 1, DataType::F16);
    const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 1U), 1, DataType::F16);
    // The correct shape should be bias = TensorInfo(TensorShape(14U, 1U, 1U, 1U), 1, DataType::F16);
    const auto bias = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F16);
    const auto out = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F16);
    constexpr float alpha = 1.3f;
    constexpr float beta = 0.7f;
    const bool is_interleaved_transposed = false;
    // NOTE(review): the trailing `true` is presumably the broadcast_bias flag, and the
    // leading 12, 14, 13 presumably m, n, k - confirm against the GEMMReshapeInfo constructor.
    const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, true);
    const GPUTarget gpu_target = GPUTarget::MIDGARD;
    const bool fp_mixed_precision = false;
    const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);
    // The case passes only when the returned status converts to false.
    ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);
}

220

221

// Invalid dimensions for the bias

222

{

223

const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 1U), 1, DataType::F32);

224

const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 1U), 1, DataType::F32);

225

// The correct shape should be bias = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F32);

226

const auto bias = TensorInfo(TensorShape(14U, 8U, 1U, 1U), 1, DataType::F32);

227

const auto out = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F32);

228

constexpr float alpha = 1.3f;

229

constexpr float beta = 0.7f;

230

const bool is_interleaved_transposed = false;

231

const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, false);

232

const GPUTarget gpu_target = GPUTarget::MIDGARD;

233

const bool fp_mixed_precision = false;

234

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);

235

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

236

}

237

238

// Invalid dimensions for the output

239

{

240

const auto lhs = TensorInfo(TensorShape(13U, 12U, 1U, 1U), 1, DataType::F32);

241

const auto rhs = TensorInfo(TensorShape(14U, 13U, 1U, 1U), 1, DataType::F32);

242

// The correct shape should be out = TensorInfo(TensorShape(14U, 12U, 1U, 1U), 1, DataType::F32);

243

const auto out = TensorInfo(TensorShape(14U, 7U, 1U, 1U), 1, DataType::F32);

244

constexpr float alpha = 1.3f;

245

constexpr float beta = 0.7f;

246

const bool is_interleaved_transposed = false;

247

const GEMMReshapeInfo reshape_info = GEMMReshapeInfo(12, 14, 13, 1, 1, 0, false, false);

248

const GPUTarget gpu_target = GPUTarget::MIDGARD;

249

const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, nullptr, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target);

250

ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);

}

}

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

254

// Open the floating-point suites; the FP32 cases are nested inside Float.
TEST_SUITE(Float)
TEST_SUITE(FP32)

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

256

257

// FP32 RunSmall: drives CLGEMMMatrixMultiplyNativeFixture<float> in every dataset mode
// (DatasetMode::ALL) over the datasets chained with combine() below. Mixed precision is
// pinned to false and the data type to F32; the remaining datasets are declared elsewhere
// in the file.
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_n_values,
                           k_values),
                           b_values),
                           alpha_values),
                           beta_values),
                           broadcast_bias_values),
                           framework::dataset::make("fp16_mixed_precision", false)),
                           act_values),
                           framework::dataset::make("DataType", DataType::F32)),
                           gpu_arch_values))
{
    // Validate output: compare the CL result against the reference using the F32
    // relative and absolute tolerances.
    // NOTE(review): the 0.f argument is presumably the tolerated mismatch ratio - confirm.
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

273

274

// FP32 RunSmall3D: drives CLGEMMMatrixMultiplyNative3DFixture<float> in every dataset mode
// (DatasetMode::ALL). Unlike RunSmall it takes separate m_w / m_h / n datasets instead of a
// single m_n dataset. Mixed precision is pinned to false and the data type to F32.
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyNative3DFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_w_values,
                           m_h_values),
                           n_values),
                           k_values),
                           b_values),
                           alpha_values),
                           beta_values),
                           broadcast_bias_values),
                           framework::dataset::make("fp16_mixed_precision", false)),
                           act_values),
                           framework::dataset::make("DataType", DataType::F32)),
                           gpu_arch_values))
{
    // Validate output: compare the CL result against the reference using the F32
    // relative and absolute tolerances.
    // NOTE(review): the 0.f argument is presumably the tolerated mismatch ratio - confirm.
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

292

293

TEST_SUITE_END() // FP32

294

295

TEST_SUITE(FP16)

296

// FP16 RunSmall: drives CLGEMMMatrixMultiplyNativeFixture<half> in every dataset mode
// (DatasetMode::ALL) over the datasets chained with combine() below. Here the mixed-precision
// setting comes from the fp16_mixed_precision_values dataset rather than a fixed value, and
// the data type is pinned to F16.
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyNativeFixture<half>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_n_values,
                           k_values),
                           b_values),
                           alpha_values),
                           beta_values),
                           broadcast_bias_values),
                           fp16_mixed_precision_values),
                           act_values),
                           framework::dataset::make("DataType", DataType::F16)),
                           gpu_arch_values))
{
    // Validate output: compare the CL result against the reference using the F16
    // relative tolerance and tolerance_num_f16.
    validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);
}

312

313

// FP16 RunSmall3D: drives CLGEMMMatrixMultiplyNative3DFixture<half> in every dataset mode
// (DatasetMode::ALL). It takes separate m_w / m_h / n datasets instead of a single m_n
// dataset; mixed precision comes from fp16_mixed_precision_values and the data type is F16.
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyNative3DFixture<half>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_w_values,
                           m_h_values),
                           n_values),
                           k_values),
                           b_values),
                           alpha_values),
                           beta_values),
                           broadcast_bias_values),
                           fp16_mixed_precision_values),
                           act_values),
                           framework::dataset::make("DataType", DataType::F16)),
                           gpu_arch_values))
{
    // Validate output: compare the CL result against the reference using the F16
    // relative tolerance and tolerance_num_f16.
    validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);
}

331

332

TEST_SUITE_END() // FP16

333

TEST_SUITE_END() // Float

334

TEST_SUITE_END() // GEMMMatrixMuliplty

335

TEST_SUITE_END() // CL

336

} // namespace validation

337

} // namespace test

338

} // namespace arm_compute