MLBEDSW-6271: MLCE: Layer-wise Utilization info from Vela

 - Added support to print per-operator SRAM usage and performance
   information
 - Added new CLI option --verbose-performance to control this feature

Signed-off-by: Tim Hall <tim.hall@arm.com>
Change-Id: I368599b410e5d441d9804871fc51b7a1049d85b3
diff --git a/ethosu/vela/architecture_features.py b/ethosu/vela/architecture_features.py
index 08ff260..679947f 100644
--- a/ethosu/vela/architecture_features.py
+++ b/ethosu/vela/architecture_features.py
@@ -301,6 +301,7 @@
 
         self.num_elem_wise_units = accel_config.elem_units
         self.num_macs_per_cycle = dpu_min_height * dpu_min_width * dpu_dot_product_width * dpu_min_ofm_channels
+        assert self.num_macs_per_cycle == accel_config.macs, f"{self.num_macs_per_cycle} != {accel_config.macs}"
         # Max value in address offsets
         self.max_address_offset = 1 << axi_port_address_width