Blame - src/core/utils/quantization/AsymmHelpers.cpp - ml/ComputeLibrary

2023-04-11 17:16:27 +0100

[diff] [blame]

183

{

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

184

ARM_COMPUTE_ERROR_ON(data_type != DataType::QASYMM8 && data_type != DataType::QASYMM8_SIGNED);

185

186

const auto min_max = get_min_max(data_type);

187

188

int32_t type_min = std::get<0>(min_max).get<int32_t>();

189

int32_t type_max = std::get<1>(min_max).get<int32_t>();

190

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

191

const UniformQuantizationInfo q_unif = q_info.uniform();

192

193

if(act_info.enabled())

194

{

195

switch(act_info.activation())

196

{

197

case ActivationLayerInfo::ActivationFunction::RELU:

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

198

type_min = q_unif.offset;

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

199

break;

200

case ActivationLayerInfo::ActivationFunction::BOUNDED_RELU:

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

201

type_min = q_unif.offset;

202

type_max = (data_type == DataType::QASYMM8) ? quantize_qasymm8(act_info.a(), q_info) : quantize_qasymm8_signed(act_info.a(), q_info);

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

203

break;

204

case ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU:

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

205

type_min = (data_type == DataType::QASYMM8) ? quantize_qasymm8(act_info.b(), q_info) : quantize_qasymm8_signed(act_info.b(), q_info);

206

type_max = (data_type == DataType::QASYMM8) ? quantize_qasymm8(act_info.a(), q_info) : quantize_qasymm8_signed(act_info.a(), q_info);

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

207

break;

208

default:

209

ARM_COMPUTE_ERROR("Activation function not supported.");

break;

}

}

Viet-Hoa Do

2023-04-26 15:38:45 +0100

[diff] [blame]

214

return std::make_tuple(type_min, type_max);

Viet-Hoa Do

2023-04-11 17:16:27 +0100

[diff] [blame]

215

}

216

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

217

void compute_quantized_multipliers_and_shifts(const ITensorInfo *input,

218

const ITensorInfo *weights,

219

const ITensorInfo *output,

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

220

int32_t *output_multipliers_ptr,

221

int32_t *output_shifts_ptr)

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

222

{

Vidhya Sudhan Loganathan

951b8a4

2019-11-04 14:42:08 +0000

[diff] [blame]

223

const UniformQuantizationInfo iq_info = input->quantization_info().uniform();

224

const QuantizationInfo wq_info = weights->quantization_info();

225

const UniformQuantizationInfo oq_info = output->quantization_info().uniform();

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

226

Michele Di Giorgio

d02d5ed

2021-01-22 09:47:04 +0000

[diff] [blame]

227

const unsigned int num_filters = wq_info.scale().size();

228

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

229

for(unsigned int i = 0; i < num_filters; ++i)

230

{

Michalis Spyrou

e7be8a0

2019-12-12 16:16:09 +0000

[diff] [blame]

231

int32_t output_multiplier = 0;

232

int32_t output_shift = 0;

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

233

const float multiplier = iq_info.scale * wq_info.scale()[i] / oq_info.scale;

Michele Di Giorgio

14cbfb2

2019-10-23 10:53:10 +0100

[diff] [blame]

234

calculate_quantized_multiplier(multiplier, &output_multiplier, &output_shift);

Michele Di Giorgio

2019-10-09 15:32:39 +0100

[diff] [blame]

235

236

output_multipliers_ptr[i] = output_multiplier;

237

output_shifts_ptr[i] = output_shift;

238

}

239

}

Sang-Hoon Park

396cb95

2020-03-26 14:02:37 +0000

[diff] [blame]

240

241

/** Return the high 32 bits of (2 * a * b), rounded to nearest and saturated.
 *
 * The product is formed in 64 bits, a rounding nudge is added, and the sum is
 * divided by 2^31 (truncating towards zero).
 *
 * @param[in] a First operand.
 * @param[in] b Second operand.
 *
 * @return The rounded result, or the largest int32_t value when both operands
 *         are the lowest int32_t value (the only case whose result does not fit).
 */
int32_t saturating_rounding_doubling_highmul(int32_t a, int32_t b)
{
    constexpr int32_t lowest = std::numeric_limits<int32_t>::min();

    // lowest * lowest * 2 == 2^63 is the single combination that overflows: saturate.
    if(a == lowest && b == lowest)
    {
        return std::numeric_limits<int32_t>::max();
    }

    const int64_t product = static_cast<int64_t>(a) * static_cast<int64_t>(b);

    // The nudge follows the sign of the product so the truncating division
    // below behaves as round-to-nearest. A zero product counts as non-negative.
    int64_t rounding_nudge = 1 - (int64_t{ 1 } << 30);
    if(product >= 0)
    {
        rounding_nudge = int64_t{ 1 } << 30;
    }

    return static_cast<int32_t>((product + rounding_nudge) / (int64_t{ 1 } << 31));
}

254

255

/** Divide a value by a power of two, rounding to nearest (ties away from zero).
 *
 * @param[in] x        Value to divide.
 * @param[in] exponent Power-of-two exponent of the divisor. Must be in the range [0, 31].
 *
 * @return x / 2^exponent rounded to the nearest integer.
 */
inline int32_t rounding_divide_by_pow2(int32_t x, int exponent)
{
    // Build the mask in 64 bits: (1 << 31) - 1 overflows when evaluated in 32-bit signed arithmetic.
    const int32_t mask = static_cast<int32_t>((int64_t{ 1 } << exponent) - 1);
    // For negative inputs the remainder must exceed the half-way point by one more
    // unit, which makes exact ties round away from zero.
    const int32_t threshold = (mask >> 1) + (x < 0 ? 1 : 0);
    return (x >> exponent) + ((x & mask) > threshold ? 1 : 0);
}

261

Sang-Hoon Park

2020-03-13 14:56:05 +0000

[diff] [blame]

262

int32_t multiply_by_quantized_multiplier(int32_t input, int32_t qmul, int32_t shift)

Sang-Hoon Park

396cb95

2020-03-26 14:02:37 +0000

[diff] [blame]

263

{

264

const auto left_shift = shift > 0 ? shift : 0;

265

const auto right_shift = shift > 0 ? 0 : -shift;

266

return rounding_divide_by_pow2(saturating_rounding_doubling_highmul(input * (1 << left_shift), qmul), right_shift);

267

}

268

269

int32_t saturating_rounding_multiply_by_pow2(int32_t exponent, int32_t v)

{

if(exponent == 0)

{

return v;

}

else if(exponent < 0)

276

{

277

return rounding_divide_by_pow2(v, -exponent);

}

else

{

constexpr auto min = std::numeric_limits<int32_t>::min();

282

constexpr auto max = std::numeric_limits<int32_t>::max();

283

const auto width = sizeof(int32_t) * 8;

284

285

const int32_t threshold = ((1 << (width - 1 - exponent)) - 1);

286

bool pos_mask = v > threshold;

287

bool neg_mask = v < -threshold;

288

int32_t result = v << exponent;

289

result = pos_mask ? max : result;

290

result = neg_mask ? min : result;

291

return result;

292

}

293

}

Sang-Hoon Park