chapters/type_conversion.adoc - tosa/specification - Gitiles

 //
 // This confidential and proprietary software may be used only as
 // authorised by a licensing agreement from ARM Limited
 // (C) COPYRIGHT 2020-2023 ARM Limited
 // ALL RIGHTS RESERVED
 // The entire notice above must be reproduced on all authorised
 // copies and copies may only be made to the extent permitted
 // by a licensing agreement from ARM Limited.

 === Type Conversion

 ==== CAST

 Casts a tensor from one data type to another.

 include::{generated}/operators/CAST.adoc[]

 [source,c++]
 ----
 // Element-wise conversion of every input element from in_t to out_t.
 // The branches are tested in order, so each later branch only sees the
 // type combinations not already handled by an earlier one.
 for_each(index in shape) {
     in_t in = tensor_read<in_t>(input, shape, index);
     out_t out;
     if (out_t == bool_t) {
         // Cast to bool: any non-zero input becomes true.
         out = (in != 0) ? true : false;
     } else if (in_t == bool_t) {
         // Cast from bool: true becomes 1, false becomes 0.
         out = (in) ? 1 : 0;
     } else if (out_t == fp16_t || out_t == bf16_t || out_t == fp32_t) {
         // Floating-point output type: convert via round_to_nearest_float.
         out = round_to_nearest_float(in);
     } else if (in_t == fp16_t || in_t == bf16_t || in_t == fp32_t) {
         // Floating-point input, non-float output: round to the nearest
         // integer, then clip to [minimum<out_t>, maximum<out_t>].
         out = apply_clip<out_t>(round_to_nearest_int(in), minimum<out_t>, maximum<out_t>);
     } else if (sizeof(out_t) >= sizeof(in_t)) {
         // out_t is at least as wide as in_t: sign-extend.
         out = sign_extend<out_t>(in);
     } else {
         // out_t is narrower than in_t: truncate.
         out = truncate(in);
     }
     tensor_write<out_t>(output, shape, index, out);
 }
 ----

 ==== RESCALE

 Rescale quantized values into a new domain. This function scales by factor: multiplier * 2^-shift^.

 include::{generated}/operators/RESCALE.adoc[]

 [source,c++]
 ----
 // Element-wise rescale: subtract the input zero point, apply the
 // (optionally per-channel) multiplier/shift scaling, add the output zero
 // point, then clip to the signed or unsigned range of out_t.
 for_each(index in shape) {
     // uint16 values can have zero_point 0 or 32768
     // int8/uint8 can have zero point within their valid range
     // No other types can have zero point != 0
     ERROR_IF(in_t != i8_t &&
              (in_t != i16_t || input_unsigned == False) && input_zp != 0);
     ERROR_IF(out_t != i8_t &&
              (out_t != i16_t || output_unsigned == False) && output_zp != 0);
     ERROR_IF(in_t == i16_t && input_unsigned == True && input_zp != 0 && input_zp != 32768);
     ERROR_IF(out_t == i16_t && output_unsigned == True && output_zp != 0 && output_zp != 32768);
     // 48-bit input is rejected when scale32 is set.
     ERROR_IF(scale32 && in_t == i48_t);
     // double_round is only accepted together with scale32.
     ERROR_IF(!scale32 && double_round);
     // Unsigned i16 input with i32 output, and i32 input with unsigned
     // i16 output, are rejected.
     ERROR_IF(in_t == i16_t && out_t == i32_t && input_unsigned);
     ERROR_IF(in_t == i32_t && out_t == i16_t && output_unsigned);

     in_t in_value = tensor_read<in_t>(input, shape, index);

     // Widen the input element and its zero point to 48 bits, using zero
     // or sign extension according to input_unsigned.
     int48_t value, extended_in_zp;
     if (input_unsigned) {
         value = zero_extend<int48_t>(in_value);
         extended_in_zp = zero_extend<int48_t>(input_zp);
     }
     else {
         // Extend the element that was read (in_value), not the still
         // uninitialized accumulator.
         value = sign_extend<int48_t>(in_value);
         extended_in_zp = sign_extend<int48_t>(input_zp);
     }

     value = value - extended_in_zp;
     // With per_channel set, the scale is selected by the index along the
     // last input dimension; otherwise entry 0 is used for every element.
     int c = (per_channel) ? index[rank(input) - 1] : 0;
     int32_t result = (scale32) ?
         apply_scale_32(value, multiplier[c], shift[c], double_round) :
         apply_scale_16(value, multiplier[c], shift[c]);

     // Declared before the branch so that it is in scope for tensor_write.
     out_t out;
     if (output_unsigned) {
         int32_t extended_out_zp = zero_extend<int32_t>(output_zp);
         result = apply_add_s<int32_t>(result, extended_out_zp);
         out = static_cast<out_t>(apply_clip<int32_t>(result,
                                                      minimum_u<out_t>,
                                                      maximum_u<out_t>));
     }
     else {
         int32_t extended_out_zp = sign_extend<int32_t>(output_zp);
         result = apply_add_s<int32_t>(result, extended_out_zp);
         out = static_cast<out_t>(apply_clip<int32_t>(result,
                                                      minimum_s<out_t>,
                                                      maximum_s<out_t>));
     }
     tensor_write<out_t>(output, shape, index, out);
 }
 ----
	//
	// This confidential and proprietary software may be used only as
	// authorised by a licensing agreement from ARM Limited
	// (C) COPYRIGHT 2020-2023 ARM Limited
	// ALL RIGHTS RESERVED
	// The entire notice above must be reproduced on all authorised
	// copies and copies may only be made to the extent permitted
	// by a licensing agreement from ARM Limited.

	=== Type Conversion

	==== CAST

	Casts a tensor from one data type to another.

	include::{generated}/operators/CAST.adoc[]

	[source,c++]
	----
	// Element-wise conversion of every input element from in_t to out_t.
	// The branches are tested in order, so each later branch only sees the
	// type combinations not already handled by an earlier one.
	for_each(index in shape) {
	    in_t in = tensor_read<in_t>(input, shape, index);
	    out_t out;
	    if (out_t == bool_t) {
	        // Cast to bool: any non-zero input becomes true.
	        out = (in != 0) ? true : false;
	    } else if (in_t == bool_t) {
	        // Cast from bool: true becomes 1, false becomes 0.
	        out = (in) ? 1 : 0;
	    } else if (out_t == fp16_t || out_t == bf16_t || out_t == fp32_t) {
	        // Floating-point output type: convert via round_to_nearest_float.
	        out = round_to_nearest_float(in);
	    } else if (in_t == fp16_t || in_t == bf16_t || in_t == fp32_t) {
	        // Floating-point input, non-float output: round to the nearest
	        // integer, then clip to [minimum<out_t>, maximum<out_t>].
	        out = apply_clip<out_t>(round_to_nearest_int(in), minimum<out_t>, maximum<out_t>);
	    } else if (sizeof(out_t) >= sizeof(in_t)) {
	        // out_t is at least as wide as in_t: sign-extend.
	        out = sign_extend<out_t>(in);
	    } else {
	        // out_t is narrower than in_t: truncate.
	        out = truncate(in);
	    }
	    tensor_write<out_t>(output, shape, index, out);
	}
	----

	==== RESCALE

	Rescale quantized values into a new domain. This function scales by factor: multiplier * 2^-shift^.

	include::{generated}/operators/RESCALE.adoc[]

	[source,c++]
	----
	// Element-wise rescale: subtract the input zero point, apply the
	// (optionally per-channel) multiplier/shift scaling, add the output zero
	// point, then clip to the signed or unsigned range of out_t.
	for_each(index in shape) {
	    // uint16 values can have zero_point 0 or 32768
	    // int8/uint8 can have zero point within their valid range
	    // No other types can have zero point != 0
	    ERROR_IF(in_t != i8_t &&
	             (in_t != i16_t || input_unsigned == False) && input_zp != 0);
	    ERROR_IF(out_t != i8_t &&
	             (out_t != i16_t || output_unsigned == False) && output_zp != 0);
	    ERROR_IF(in_t == i16_t && input_unsigned == True && input_zp != 0 && input_zp != 32768);
	    ERROR_IF(out_t == i16_t && output_unsigned == True && output_zp != 0 && output_zp != 32768);
	    // 48-bit input is rejected when scale32 is set.
	    ERROR_IF(scale32 && in_t == i48_t);
	    // double_round is only accepted together with scale32.
	    ERROR_IF(!scale32 && double_round);
	    // Unsigned i16 input with i32 output, and i32 input with unsigned
	    // i16 output, are rejected.
	    ERROR_IF(in_t == i16_t && out_t == i32_t && input_unsigned);
	    ERROR_IF(in_t == i32_t && out_t == i16_t && output_unsigned);

	    in_t in_value = tensor_read<in_t>(input, shape, index);

	    // Widen the input element and its zero point to 48 bits, using zero
	    // or sign extension according to input_unsigned.
	    int48_t value, extended_in_zp;
	    if (input_unsigned) {
	        value = zero_extend<int48_t>(in_value);
	        extended_in_zp = zero_extend<int48_t>(input_zp);
	    }
	    else {
	        // Extend the element that was read (in_value), not the still
	        // uninitialized accumulator.
	        value = sign_extend<int48_t>(in_value);
	        extended_in_zp = sign_extend<int48_t>(input_zp);
	    }

	    value = value - extended_in_zp;
	    // With per_channel set, the scale is selected by the index along the
	    // last input dimension; otherwise entry 0 is used for every element.
	    int c = (per_channel) ? index[rank(input) - 1] : 0;
	    int32_t result = (scale32) ?
	        apply_scale_32(value, multiplier[c], shift[c], double_round) :
	        apply_scale_16(value, multiplier[c], shift[c]);

	    // Declared before the branch so that it is in scope for tensor_write.
	    out_t out;
	    if (output_unsigned) {
	        int32_t extended_out_zp = zero_extend<int32_t>(output_zp);
	        result = apply_add_s<int32_t>(result, extended_out_zp);
	        out = static_cast<out_t>(apply_clip<int32_t>(result,
	                                                     minimum_u<out_t>,
	                                                     maximum_u<out_t>));
	    }
	    else {
	        int32_t extended_out_zp = sign_extend<int32_t>(output_zp);
	        result = apply_add_s<int32_t>(result, extended_out_zp);
	        out = static_cast<out_t>(apply_clip<int32_t>(result,
	                                                     minimum_s<out_t>,
	                                                     maximum_s<out_t>));
	    }
	    tensor_write<out_t>(output, shape, index, out);
	}
	----