MLBEDSW-2935: LUT fusing with preceding operator

Allows a LUT to be fused with the preceding operator regardless of the
input/output scale.

Change-Id: Ia378adbb3fe61d71299feb085f7313377e0efa39
Signed-off-by: Louis Verhaard <louis.verhaard@arm.com>
diff --git a/ethosu/vela/register_command_stream_generator.py b/ethosu/vela/register_command_stream_generator.py
index 0a35647..8f34e63 100644
--- a/ethosu/vela/register_command_stream_generator.py
+++ b/ethosu/vela/register_command_stream_generator.py
@@ -909,7 +909,11 @@
                 if tens is None:
                     continue
 
-                need_zero_point = (faf is not None) or (fmf == "ConcatSliceWrite") or fused_quantize
+                need_zero_point = (
+                    (faf is not None and forced_ofm_quantization is None)
+                    or (fmf == "ConcatSliceWrite")
+                    or fused_quantize
+                )
                 if (
                     (
                         primary_op.type in set(("AvgPool", "AvgPoolAct", "ResizeBilinear", "CLZ", "SHL"))