COMPMID-477 - Optimized CLDirectConvolution1x1 for Bifrost
	    - Fixed bug in CLDirectConvolution3x3 (bias is now loaded as a scalar float and widened to float4 before being added)

Change-Id: Iaf34ef44f0b7bc02e66f3eb4452ff7a90ef83523
Reviewed-on: http://mpd-gerrit.cambridge.arm.com/86725
Tested-by: Kaizen <jeremy.johnson+kaizengerrit@arm.com>
Reviewed-by: Georgios Pinitas <georgios.pinitas@arm.com>
Reviewed-by: Moritz Pflanzer <moritz.pflanzer@arm.com>
diff --git a/src/core/CL/cl_kernels/direct_convolution3x3.cl b/src/core/CL/cl_kernels/direct_convolution3x3.cl
index 26f24e1..1a228dd 100644
--- a/src/core/CL/cl_kernels/direct_convolution3x3.cl
+++ b/src/core/CL/cl_kernels/direct_convolution3x3.cl
@@ -288,11 +288,11 @@
 #ifdef HAS_BIAS
     Vector biases = CONVERT_TO_VECTOR_STRUCT_NO_STEP(biases);
 
-    float4 bias = (float4) * ((__global float *)(vector_offset(&biases, kernel_index)));
+    float bias = (float) * ((__global float *)(vector_offset(&biases, kernel_index)));
 
-    pixels0 += bias;
-    pixels1 += bias;
-    pixels2 += bias;
+    pixels0 += (float4)bias;
+    pixels1 += (float4)bias;
+    pixels2 += (float4)bias;
 #endif /* defined(HAS_BIAS) */
 
     vstore4(pixels0, 0, (__global float *)(dst.ptr + 0 * dst_stride_y));