Blame - src/core/CL/cl_kernels/scale_quantized.cl - ml/ComputeLibrary

2018-12-10 16:19:20 +0000

[diff] [blame]

88

#if defined(DEPTH_OUT)

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

89

/** Performs scale on an image interpolating with the BILINEAR method. (NHWC)

90

*

91

* @note Sampling policy to be used is passed as -DSAMPLING_POLICY_(TYPE) e.g. -DSAMPLING_POLICY_TOP_LEFT

92

* @note Scale value for QASYMM8 data type to be used is passed as -DSCALE=<VALUE> e.g. -DSCALE=0.5

93

* @note Offset value for QASYMM8 data type to be used is passed as -DOFFSET=<VALUE> e.g. -DOFFSET=1

94

* @note If border mode replicate is used, it should be passed as -DBORDER_MODE_REPLICATE

Michalis Spyrou

2018-12-10 16:19:20 +0000

[diff] [blame]

95

* @note Output tensor's depth should be given as a preprocessor argument using -DDEPTH_OUT=size. e.g. -DDEPTH_OUT=16

Manuel Bottini

2020-12-03 16:26:35 +0000

[diff] [blame]

96

* @note The value to be used at the edges of the image should be given as a preprocessor argument using -DCONSTANT_VALUE=value.

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

97

*

98

* @param[in] in_ptr Pointer to the source image. Supported data types: QASYMM8.

99

* @param[in] in_stride_x Stride of the source image in X dimension (in bytes)

100

* @param[in] in_step_x src_stride_x * number of elements along X processed per workitem(in bytes)

101

* @param[in] in_stride_y Stride of the source image in Y dimension (in bytes)

102

* @param[in] in_step_y src_stride_y * number of elements along Y processed per workitem(in bytes)

103

* @param[in] in_stride_z Stride of the source image in Z dimension (in bytes)

104

* @param[in] in_step_z src_stride_z * number of elements along Z processed per workitem(in bytes)

105

* @param[in] in_offset_first_element_in_bytes The offset of the first element in the source image

106

* @param[out] out_ptr Pointer to the destination image. Supported data types: same as @p in_ptr

107

* @param[in] out_stride_x Stride of the destination image in X dimension (in bytes)

108

* @param[in] out_step_x dst_stride_x * number of elements along X processed per workitem(in bytes)

109

* @param[in] out_stride_y Stride of the destination image in Y dimension (in bytes)

110

* @param[in] out_step_y dst_stride_y * number of elements along Y processed per workitem(in bytes)

111

* @param[in] out_stride_z Stride of the destination image in Z dimension (in bytes)

112

* @param[in] out_step_z dst_stride_z * number of elements along Z processed per workitem(in bytes)

113

* @param[in] out_offset_first_element_in_bytes The offset of the first element in the destination image

114

* @param[in] input_width Input image width

115

* @param[in] input_height Input image height

116

* @param[in] scale_x The scale factor along x dimension

117

* @param[in] scale_y The scale factor along y dimension

Manuel Bottini

2020-12-03 16:26:35 +0000

[diff] [blame]

118

* @param[in] constant_border_value Constant border value to use

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

119

*/

120

__kernel void scale_bilinear_quantized_nhwc(

Michalis Spyrou

2018-12-10 16:19:20 +0000

[diff] [blame]

121

TENSOR4D_DECLARATION(in),

122

TENSOR4D_DECLARATION(out),

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

123

const float input_width,

124

const float input_height,

125

const float scale_x,

126

const float scale_y)

127

{

Michalis Spyrou

2018-12-10 16:19:20 +0000

[diff] [blame]

128

Tensor4D in = CONVERT_TO_TENSOR4D_STRUCT_NO_STEP(in, 0);

129

Tensor4D out = CONVERT_TO_TENSOR4D_STRUCT(out, DEPTH_OUT);

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

130

131

#ifdef SAMPLING_POLICY_TOP_LEFT

132

const float new_x = get_global_id(1) * scale_x;

Michalis Spyrou

2018-12-10 16:19:20 +0000

[diff] [blame]

133

const float new_y = (get_global_id(2) % DEPTH_OUT) * scale_y;

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

134

#elif SAMPLING_POLICY_CENTER

135

const float new_x = (get_global_id(1) + 0.5f) * scale_x - 0.5f;

Michalis Spyrou

2018-12-10 16:19:20 +0000

[diff] [blame]

136

const float new_y = ((get_global_id(2) % DEPTH_OUT) + 0.5f) * scale_y - 0.5f;

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

137

#else /* SAMPLING_POLICY */

138

#error("Unsupported sampling policy");

139

#endif /* SAMPLING_POLICY */

140

Manuel Bottini

2020-12-03 16:26:35 +0000

[diff] [blame]

141

const float new_xf = floor(new_x);

142

const float new_yf = floor(new_y);

143

const float clamped_x = clamp(new_xf, 0.0f, input_width - 1);

144

const float clamped_x1 = clamp(new_xf + 1, 0.0f, input_width - 1);

145

const float clamped_y = clamp(new_yf, 0.0f, input_height - 1);

146

const float clamped_y1 = clamp(new_yf + 1, 0.0f, input_height - 1);

Michalis Spyrou

2018-09-12 13:35:38 +0100

[diff] [blame]

147

148

#ifndef BORDER_MODE_REPLICATE

Manuel Bottini