Blame - src/core/utils/quantization/AsymmHelpers.cpp - ml/ComputeLibrary

2023-04-11 17:16:27 +0100

[diff] [blame]

182

{

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

183

ARM_COMPUTE_ERROR_ON(data_type != DataType::QASYMM8 && data_type != DataType::QASYMM8_SIGNED);

184

185

const auto min_max = get_min_max(data_type);

186

187

int32_t type_min = std::get<0>(min_max).get<int32_t>();

188

int32_t type_max = std::get<1>(min_max).get<int32_t>();

189

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

190

const UniformQuantizationInfo q_unif = q_info.uniform();

191

192

if(act_info.enabled())

193

{

194

switch(act_info.activation())

195

{

196

case ActivationLayerInfo::ActivationFunction::RELU:

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

197

type_min = q_unif.offset;

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

198

break;

199

case ActivationLayerInfo::ActivationFunction::BOUNDED_RELU:

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

200

type_min = q_unif.offset;

201

type_max = (data_type == DataType::QASYMM8) ? quantize_qasymm8(act_info.a(), q_info) : quantize_qasymm8_signed(act_info.a(), q_info);

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

202

break;

203

case ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU:

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

204

type_min = (data_type == DataType::QASYMM8) ? quantize_qasymm8(act_info.b(), q_info) : quantize_qasymm8_signed(act_info.b(), q_info);

205

type_max = (data_type == DataType::QASYMM8) ? quantize_qasymm8(act_info.a(), q_info) : quantize_qasymm8_signed(act_info.a(), q_info);

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

206

break;

207

default:

208

ARM_COMPUTE_ERROR("Activation function not supported.");

break;

}

}

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

213

return std::make_tuple(type_min, type_max);

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

214

}

215

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

216

void compute_quantized_multipliers_and_shifts(const ITensorInfo *input,

217

const ITensorInfo *weights,

218

const ITensorInfo *output,

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

219

int32_t *output_multipliers_ptr,

220

int32_t *output_shifts_ptr)

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

221

{

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

222

const UniformQuantizationInfo iq_info = input->quantization_info().uniform();

223

const QuantizationInfo wq_info = weights->quantization_info();

224

const UniformQuantizationInfo oq_info = output->quantization_info().uniform();

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

225

Michele Di Giorgio

d02d5ed

2021-01-22 09:47:04 +0000

[diff] [blame]

226

const unsigned int num_filters = wq_info.scale().size();

227

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

228

for(unsigned int i = 0; i < num_filters; ++i)

229

{

Michalis Spyrou

e7be8a0

2019-12-12 16:16:09 +0000

[diff] [blame]

230

int32_t output_multiplier = 0;

231

int32_t output_shift = 0;

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

232

const float multiplier = iq_info.scale * wq_info.scale()[i] / oq_info.scale;

Michele Di Giorgio

14cbfb2

2019-10-23 10:53:10 +0100

[diff] [blame]

233

calculate_quantized_multiplier(multiplier, &output_multiplier, &output_shift);

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

234

235

output_multipliers_ptr[i] = output_multiplier;

236

output_shifts_ptr[i] = output_shift;

237

}

238

}

Sang-Hoon Park

396cb95

2020-03-26 14:02:37 +0000

[diff] [blame]

239

240

/** Doubling high multiplication with rounding and saturation.
 *
 * Computes (a * b + nudge) / 2^31 in 64-bit arithmetic, where the nudge is
 * 2^30 for a non-negative product and 1 - 2^30 for a negative one, so the
 * truncating division rounds instead of simply chopping.
 *
 * @param[in] a First operand.
 * @param[in] b Second operand.
 *
 * @return The rounded quotient, or the largest int32_t when both operands are
 *         the smallest int32_t (the only combination whose result does not fit).
 */
int32_t saturating_rounding_doubling_highmul(int32_t a, int32_t b)
{
    using limits = std::numeric_limits<int32_t>;

    // The single overflowing case: min * min.
    if(a == limits::min() && b == limits::min())
    {
        return limits::max();
    }

    const int64_t product = static_cast<int64_t>(a) * static_cast<int64_t>(b);

    // A zero operand or operands of equal sign give a non-negative product.
    const int32_t rounding_nudge = (product >= 0) ? (1 << 30) : (1 - (1 << 30));

    constexpr int64_t divisor = 1ll << 31;
    return static_cast<int32_t>((product + rounding_nudge) / divisor);
}

253

254

/** Divide by a power of two with rounding.
 *
 * The quotient is taken with a right shift; it is then bumped by one when the
 * discarded low bits exceed a threshold of half the low-bit mask (plus one
 * when @p x is negative).
 *
 * @param[in] x        Value to divide.
 * @param[in] exponent Power of two to divide by. Must be a valid shift count
 *                     for a 32-bit integer (0 leaves @p x unchanged).
 *
 * @return The rounded quotient.
 */
inline int32_t rounding_divide_by_pow2(int32_t x, int exponent)
{
    const int32_t low_bits_mask = (1 << exponent) - 1;
    const int32_t discarded     = x & low_bits_mask;

    // Negative inputs need a strictly larger remainder before rounding up.
    int32_t half = low_bits_mask >> 1;
    if(x < 0)
    {
        ++half;
    }

    int32_t quotient = x >> exponent;
    if(discarded > half)
    {
        ++quotient;
    }
    return quotient;
}

260

Sang-Hoon Park

2020-03-13 14:56:05 +0000

[diff] [blame]

261

int32_t multiply_by_quantized_multiplier(int32_t input, int32_t qmul, int32_t shift)

Sang-Hoon Park

396cb95

2020-03-26 14:02:37 +0000

[diff] [blame]

262

{

263

const auto left_shift = shift > 0 ? shift : 0;

264

const auto right_shift = shift > 0 ? 0 : -shift;

265

return rounding_divide_by_pow2(saturating_rounding_doubling_highmul(input * (1 << left_shift), qmul), right_shift);

266

}

267

268

int32_t saturating_rounding_multiply_by_pow2(int32_t exponent, int32_t v)

{

if(exponent == 0)

{

return v;

}

else if(exponent < 0)

275

{

276

return rounding_divide_by_pow2(v, -exponent);

}

else

{

constexpr auto min = std::numeric_limits<int32_t>::min();

281

constexpr auto max = std::numeric_limits<int32_t>::max();

282

const auto width = sizeof(int32_t) * 8;

283

284

const int32_t threshold = ((1 << (width - 1 - exponent)) - 1);

285

bool pos_mask = v > threshold;

286

bool neg_mask = v < -threshold;

287

int32_t result = v << exponent;

288

result = pos_mask ? max : result;

289

result = neg_mask ? min : result;

290

return result;

291

}

292

}

Sang-Hoon Park