Blame - tests/validation/CPP/DepthwiseConvolution.cpp - ml/ComputeLibrary

2017-08-01 16:09:33 +0100

[diff] [blame]

54

{

55

// Create reference

56

SimpleTensor<T> dst{ dst_shape, src.data_type(), 1, src.fixed_point_position() };

57

58

// Compute reference

Jaroslaw Rzepecki

2017-10-13 11:13:58 +0100

[diff] [blame]

59

const int filter_width = weights.shape().x();

60

const int filter_height = weights.shape().y();

61

const int filter_plane = filter_width * filter_height;

62

const int input_width = src.shape().x();

63

const int input_height = src.shape().y();

64

const int input_depth = src.shape().z();

65

const int num_batches = src.shape().total_size() / (input_width * input_height * input_depth);

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

66

Jaroslaw Rzepecki

2017-10-13 11:13:58 +0100

[diff] [blame]

67

const int filter_half_width = filter_width / 2;

68

const int filter_half_height = filter_height / 2;

69

70

const int pad_left = std::min(static_cast<int>(conv_info.pad_left()), filter_half_width);

71

const int pad_top = std::min(static_cast<int>(conv_info.pad_top()), filter_half_height);

72

const int pad_right = std::min(static_cast<int>(conv_info.pad_right()), filter_half_width);

73

const int pad_bottom = std::min(static_cast<int>(conv_info.pad_bottom()), filter_half_height);

74

75

const int minimum_x = -pad_left + filter_half_width;

76

const int minimum_y = -pad_top + filter_half_height;

77

const int maximum_x = input_width + pad_left - filter_half_width + pad_right - filter_half_width;

78

const int maximum_y = input_height + pad_top - filter_half_height + pad_bottom - filter_half_height;

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

79

80

int out_pos = 0;

Giorgio Arena

2017-08-23 16:36:24 +0100

[diff] [blame]

81

for(int r = 0; r < num_batches; ++r)

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

82

{

Jaroslaw Rzepecki

2017-10-13 11:13:58 +0100

[diff] [blame]

83

for(int z = 0; z < input_depth; ++z)

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

84

{

Jaroslaw Rzepecki

2017-10-13 11:13:58 +0100

[diff] [blame]

85

for(int y = minimum_y; y < minimum_y + maximum_y; y += conv_info.stride().second)

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

86

{

Jaroslaw Rzepecki

2017-10-13 11:13:58 +0100

[diff] [blame]

87

for(int x = minimum_x; x < minimum_x + maximum_x; x += conv_info.stride().first)

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

88

{

Giorgio Arena

2017-08-23 16:36:24 +0100

[diff] [blame]

89

Coordinates coords(static_cast<int>(x), static_cast<int>(y), static_cast<int>(z), static_cast<int>(r));

90

size_t filter_offset = filter_plane * z;

91

92

T val = 0;

93

for(int j = y - filter_half_height; j <= static_cast<int>(y + filter_half_height); ++j)

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

94

{

Giorgio Arena

2017-08-23 16:36:24 +0100

[diff] [blame]

95

for(int i = x - filter_half_width; i <= static_cast<int>(x + filter_half_width); ++i)

{

coords.set(0, i);

coords.set(1, j);

val += *(weights.data() + filter_offset) * tensor_elem_at(src, coords, BorderMode::CONSTANT, 0.f);

100

++filter_offset;

101

}

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

102

}

Giorgio Arena

2017-08-23 16:36:24 +0100

[diff] [blame]

103

coords.set(0, x);

104

coords.set(1, y);

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

105

dst[out_pos++] = saturate_cast<T>(val + *static_cast<const TB *>(biases(Coordinates(z))));

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

106

}

Giorgio Arena

2017-08-01 16:09:33 +0100

[diff] [blame]

}

}

}

return dst;

}

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

114

template <>

115

SimpleTensor<uint8_t> depthwise_convolution(const SimpleTensor<uint8_t> &src, const SimpleTensor<uint8_t> &weights, const SimpleTensor<int32_t> &biases, const TensorShape &dst_shape,

116

const PadStrideInfo &conv_info)

117

{

118

// Create reference

119

SimpleTensor<uint8_t> dst{ dst_shape, src.data_type(), 1, src.fixed_point_position(), src.quantization_info() };

120

121

const int input_offset = -src.quantization_info().offset;

122

const float input_scale = src.quantization_info().scale;

123

const int weights_offset = -weights.quantization_info().offset;

124

const float weights_scale = weights.quantization_info().scale;

125

const int output_offset = dst.quantization_info().offset;

126

const float output_scale = dst.quantization_info().scale;

127

128

int output_multiplier;

129

int output_shift;

130

const float multiplier = input_scale * weights_scale / output_scale;

131

arm_compute::quantization::calculate_quantized_multiplier_less_than_one(multiplier, &output_multiplier, &output_shift);

132

133

// Compute reference

134

const int filter_width = weights.shape().x();

135

const int filter_height = weights.shape().y();

136

const int filter_plane = filter_width * filter_height;

137

const int input_width = src.shape().x();

138

const int input_height = src.shape().y();

139

const int input_depth = src.shape().z();

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

140

const int num_batches = src.shape().total_size() / (input_width * input_height * input_depth);

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

141

142

const int filter_half_size = filter_width / 2;

143

const int pad_x = std::min(filter_half_size, static_cast<int>(conv_info.pad().first));

144

const int pad_y = std::min(filter_half_size, static_cast<int>(conv_info.pad().second));

145

const int minimum_x = -pad_x + filter_half_size;

146

const int minimum_y = -pad_y + filter_half_size;

147

148

int out_pos = 0;

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

149

for(int r = 0; r < num_batches; ++r)

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

150

{

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

151

for(int z = 0; z < input_depth; ++z)

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

152

{

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

153

int32_t bias_val = *static_cast<const int32_t *>(biases(Coordinates(z)));

154

for(int y = minimum_y; y < input_height + pad_y - filter_half_size; y += conv_info.stride().second)

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

155

{

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

156

for(int x = minimum_x; x < input_width + pad_x - filter_half_size; x += conv_info.stride().first)

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

157

{

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

158

Coordinates coords(x, y, z);

159

int filter_offset = filter_plane * z;

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

160

Georgios Pinitas

2017-11-29 10:17:56 +0000

[diff] [blame^]

161

uint32_t val = 0;

162

for(int j = y - filter_half_size; j <= (y + filter_half_size); ++j)

163

{

164

for(int i = x - filter_half_size; i <= (x + filter_half_size); ++i)

{

coords.set(0, i);

coords.set(1, j);

auto in_val = tensor_elem_at<uint8_t>(src, coords, BorderMode::CONSTANT, 0);

169

uint8_t w_val = *(weights.data() + filter_offset);

170

val += (in_val + input_offset) * (w_val + weights_offset);

++filter_offset;

}

}

val += bias_val;

val = asymm_rounding_divide_by_pow2(asymm_int_mult(val, output_multiplier), output_shift);

176

val += output_offset;

177

val = std::max<int32_t>(val, 0);

178

val = std::min<int32_t>(val, 255);

179

180

// Store the result

181

dst[out_pos++] = val;

182

}

Dmitry Savenko

2017-11-20 22:00:08 +0700

[diff] [blame]

}

}

}

return dst;

}

Georgios Pinitas

2017-10-23 20:29:30 +0100

[diff] [blame]

190

// Explicit instantiation of depthwise_convolution for float source, weights and biases tensors.
template SimpleTensor<float> depthwise_convolution(const SimpleTensor<float> &src, const SimpleTensor<float> &weights, const SimpleTensor<float> &biases, const TensorShape &dst_shape,

191

const PadStrideInfo &conv_info);

Giorgio Arena