Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 1 | /* |
Richard Burton | f32a86a | 2022-11-15 11:46:11 +0000 | [diff] [blame] | 2 | * SPDX-FileCopyrightText: Copyright 2022 Arm Limited and/or its affiliates <open-source-office@arm.com> |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 3 | * SPDX-License-Identifier: Apache-2.0 |
| 4 | * |
| 5 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 6 | * you may not use this file except in compliance with the License. |
| 7 | * You may obtain a copy of the License at |
| 8 | * |
| 9 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 10 | * |
| 11 | * Unless required by applicable law or agreed to in writing, software |
| 12 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 13 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 14 | * See the License for the specific language governing permissions and |
| 15 | * limitations under the License. |
| 16 | */ |
| 17 | #include "UseCaseHandler.hpp" |
| 18 | #include "InputFiles.hpp" |
| 19 | #include "YoloFastestModel.hpp" |
| 20 | #include "UseCaseCommonUtils.hpp" |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 21 | #include "DetectorPostProcessing.hpp" |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 22 | #include "DetectorPreProcessing.hpp" |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 23 | #include "hal.h" |
alexander | 31ae9f0 | 2022-02-10 16:15:54 +0000 | [diff] [blame] | 24 | #include "log_macros.h" |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 25 | |
alexander | 31ae9f0 | 2022-02-10 16:15:54 +0000 | [diff] [blame] | 26 | #include <cinttypes> |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 27 | |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 28 | namespace arm { |
| 29 | namespace app { |
| 30 | |
Isabella Gottardi | 3107aa2 | 2022-01-27 16:39:37 +0000 | [diff] [blame] | 31 | /** |
| 32 | * @brief Presents inference results using the data presentation |
| 33 | * object. |
Isabella Gottardi | 3107aa2 | 2022-01-27 16:39:37 +0000 | [diff] [blame] | 34 | * @param[in] results Vector of detection results to be displayed. |
| 35 | * @return true if successful, false otherwise. |
| 36 | **/ |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 37 | static bool PresentInferenceResult(const std::vector<object_detection::DetectionResult>& results); |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 38 | |
| 39 | /** |
| 40 | * @brief Draw boxes directly on the LCD for all detected objects. |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 41 | * @param[in] results Vector of detection results to be displayed. |
| 42 | * @param[in] imgStartX X coordinate where the image starts on the LCD. |
| 43 | * @param[in] imgStartY Y coordinate where the image starts on the LCD. |
| 44 | * @param[in] imgDownscaleFactor How much image has been downscaled on LCD. |
| 45 | **/ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 46 | static void DrawDetectionBoxes( |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 47 | const std::vector<object_detection::DetectionResult>& results, |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 48 | uint32_t imgStartX, |
| 49 | uint32_t imgStartY, |
| 50 | uint32_t imgDownscaleFactor); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 51 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 52 | /* Object detection inference handler. */ |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 53 | bool ObjectDetectionHandler(ApplicationContext& ctx, uint32_t imgIndex, bool runAll) |
| 54 | { |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 55 | auto& profiler = ctx.Get<Profiler&>("profiler"); |
| 56 | |
| 57 | constexpr uint32_t dataPsnImgDownscaleFactor = 1; |
| 58 | constexpr uint32_t dataPsnImgStartX = 10; |
| 59 | constexpr uint32_t dataPsnImgStartY = 35; |
| 60 | |
Richard Burton | 71f282e | 2022-12-01 12:31:23 +0000 | [diff] [blame] | 61 | constexpr uint32_t dataPsnTxtInfStartX = 20; |
| 62 | constexpr uint32_t dataPsnTxtInfStartY = 28; |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 63 | |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 64 | hal_lcd_clear(COLOR_BLACK); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 65 | |
| 66 | auto& model = ctx.Get<Model&>("model"); |
Isabella Gottardi | 3107aa2 | 2022-01-27 16:39:37 +0000 | [diff] [blame] | 67 | |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 68 | /* If the request has a valid size, set the image index. */ |
| 69 | if (imgIndex < NUMBER_OF_FILES) { |
| 70 | if (!SetAppCtxIfmIdx(ctx, imgIndex, "imgIndex")) { |
| 71 | return false; |
| 72 | } |
| 73 | } |
| 74 | if (!model.IsInited()) { |
| 75 | printf_err("Model is not initialised! Terminating processing.\n"); |
| 76 | return false; |
| 77 | } |
| 78 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 79 | auto initialImgIdx = ctx.Get<uint32_t>("imgIndex"); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 80 | |
| 81 | TfLiteTensor* inputTensor = model.GetInputTensor(0); |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 82 | TfLiteTensor* outputTensor0 = model.GetOutputTensor(0); |
| 83 | TfLiteTensor* outputTensor1 = model.GetOutputTensor(1); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 84 | |
| 85 | if (!inputTensor->dims) { |
| 86 | printf_err("Invalid input tensor dims\n"); |
| 87 | return false; |
| 88 | } else if (inputTensor->dims->size < 3) { |
| 89 | printf_err("Input tensor dimension should be >= 3\n"); |
| 90 | return false; |
| 91 | } |
| 92 | |
| 93 | TfLiteIntArray* inputShape = model.GetInputShape(0); |
| 94 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 95 | const int inputImgCols = inputShape->data[YoloFastestModel::ms_inputColsIdx]; |
| 96 | const int inputImgRows = inputShape->data[YoloFastestModel::ms_inputRowsIdx]; |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 97 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 98 | /* Set up pre and post-processing. */ |
| 99 | DetectorPreProcess preProcess = DetectorPreProcess(inputTensor, true, model.IsDataSigned()); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 100 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 101 | std::vector<object_detection::DetectionResult> results; |
Richard Burton | 6f6df09 | 2022-05-17 12:52:50 +0100 | [diff] [blame] | 102 | const object_detection::PostProcessParams postProcessParams { |
| 103 | inputImgRows, inputImgCols, object_detection::originalImageSize, |
| 104 | object_detection::anchor1, object_detection::anchor2 |
| 105 | }; |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 106 | DetectorPostProcess postProcess = DetectorPostProcess(outputTensor0, outputTensor1, |
Richard Burton | 6f6df09 | 2022-05-17 12:52:50 +0100 | [diff] [blame] | 107 | results, postProcessParams); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 108 | do { |
Matthew Sloyan | 0bc74e9 | 2022-05-10 13:21:01 +0100 | [diff] [blame] | 109 | /* Ensure there are no results leftover from previous inference when running all. */ |
| 110 | results.clear(); |
| 111 | |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 112 | /* Strings for presentation/logging. */ |
| 113 | std::string str_inf{"Running inference... "}; |
| 114 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 115 | const uint8_t* currImage = get_img_array(ctx.Get<uint32_t>("imgIndex")); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 116 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 117 | auto dstPtr = static_cast<uint8_t*>(inputTensor->data.uint8); |
Isabella Gottardi | 3107aa2 | 2022-01-27 16:39:37 +0000 | [diff] [blame] | 118 | const size_t copySz = inputTensor->bytes < IMAGE_DATA_SIZE ? |
| 119 | inputTensor->bytes : IMAGE_DATA_SIZE; |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 120 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 121 | /* Run the pre-processing, inference and post-processing. */ |
| 122 | if (!preProcess.DoPreProcess(currImage, copySz)) { |
| 123 | printf_err("Pre-processing failed."); |
| 124 | return false; |
| 125 | } |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 126 | |
Isabella Gottardi | e76a691 | 2022-02-16 10:42:32 +0000 | [diff] [blame] | 127 | /* Display image on the LCD. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 128 | hal_lcd_display_image( |
Liam Barry | 213a543 | 2022-05-09 17:06:19 +0100 | [diff] [blame] | 129 | (arm::app::object_detection::channelsImageDisplayed == 3) ? currImage : dstPtr, |
| 130 | inputImgCols, |
| 131 | inputImgRows, |
| 132 | arm::app::object_detection::channelsImageDisplayed, |
| 133 | dataPsnImgStartX, |
| 134 | dataPsnImgStartY, |
| 135 | dataPsnImgDownscaleFactor); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 136 | |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 137 | /* Display message on the LCD - inference running. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 138 | hal_lcd_display_text(str_inf.c_str(), str_inf.size(), |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 139 | dataPsnTxtInfStartX, dataPsnTxtInfStartY, false); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 140 | |
| 141 | /* Run inference over this image. */ |
| 142 | info("Running inference on image %" PRIu32 " => %s\n", ctx.Get<uint32_t>("imgIndex"), |
| 143 | get_filename(ctx.Get<uint32_t>("imgIndex"))); |
| 144 | |
| 145 | if (!RunInference(model, profiler)) { |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 146 | printf_err("Inference failed."); |
| 147 | return false; |
| 148 | } |
| 149 | |
| 150 | if (!postProcess.DoPostProcess()) { |
| 151 | printf_err("Post-processing failed."); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 152 | return false; |
| 153 | } |
| 154 | |
| 155 | /* Erase. */ |
| 156 | str_inf = std::string(str_inf.size(), ' '); |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 157 | hal_lcd_display_text(str_inf.c_str(), str_inf.size(), |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 158 | dataPsnTxtInfStartX, dataPsnTxtInfStartY, false); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 159 | |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 160 | /* Draw boxes. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 161 | DrawDetectionBoxes(results, dataPsnImgStartX, dataPsnImgStartY, dataPsnImgDownscaleFactor); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 162 | |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 163 | #if VERIFY_TEST_OUTPUT |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 164 | DumpTensor(modelOutput0); |
| 165 | DumpTensor(modelOutput1); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 166 | #endif /* VERIFY_TEST_OUTPUT */ |
| 167 | |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 168 | if (!PresentInferenceResult(results)) { |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 169 | return false; |
| 170 | } |
| 171 | |
| 172 | profiler.PrintProfilingResult(); |
| 173 | |
| 174 | IncrementAppCtxIfmIdx(ctx,"imgIndex"); |
| 175 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 176 | } while (runAll && ctx.Get<uint32_t>("imgIndex") != initialImgIdx); |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 177 | |
| 178 | return true; |
| 179 | } |
| 180 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 181 | static bool PresentInferenceResult(const std::vector<object_detection::DetectionResult>& results) |
Isabella Gottardi | 3107aa2 | 2022-01-27 16:39:37 +0000 | [diff] [blame] | 182 | { |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 183 | hal_lcd_set_text_color(COLOR_GREEN); |
Isabella Gottardi | 3107aa2 | 2022-01-27 16:39:37 +0000 | [diff] [blame] | 184 | |
| 185 | /* If profiling is enabled, and the time is valid. */ |
| 186 | info("Final results:\n"); |
| 187 | info("Total number of inferences: 1\n"); |
| 188 | |
| 189 | for (uint32_t i = 0; i < results.size(); ++i) { |
| 190 | info("%" PRIu32 ") (%f) -> %s {x=%d,y=%d,w=%d,h=%d}\n", i, |
| 191 | results[i].m_normalisedVal, "Detection box:", |
| 192 | results[i].m_x0, results[i].m_y0, results[i].m_w, results[i].m_h ); |
| 193 | } |
| 194 | |
| 195 | return true; |
| 196 | } |
| 197 | |
Richard Burton | ef90497 | 2022-04-27 17:24:36 +0100 | [diff] [blame] | 198 | static void DrawDetectionBoxes(const std::vector<object_detection::DetectionResult>& results, |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 199 | uint32_t imgStartX, |
| 200 | uint32_t imgStartY, |
| 201 | uint32_t imgDownscaleFactor) |
| 202 | { |
| 203 | uint32_t lineThickness = 1; |
| 204 | |
| 205 | for (const auto& result: results) { |
| 206 | /* Top line. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 207 | hal_lcd_display_box(imgStartX + result.m_x0/imgDownscaleFactor, |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 208 | imgStartY + result.m_y0/imgDownscaleFactor, |
| 209 | result.m_w/imgDownscaleFactor, lineThickness, COLOR_GREEN); |
| 210 | /* Bot line. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 211 | hal_lcd_display_box(imgStartX + result.m_x0/imgDownscaleFactor, |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 212 | imgStartY + (result.m_y0 + result.m_h)/imgDownscaleFactor - lineThickness, |
| 213 | result.m_w/imgDownscaleFactor, lineThickness, COLOR_GREEN); |
| 214 | |
| 215 | /* Left line. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 216 | hal_lcd_display_box(imgStartX + result.m_x0/imgDownscaleFactor, |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 217 | imgStartY + result.m_y0/imgDownscaleFactor, |
| 218 | lineThickness, result.m_h/imgDownscaleFactor, COLOR_GREEN); |
| 219 | /* Right line. */ |
Kshitij Sisodia | 68fdd11 | 2022-04-06 13:03:20 +0100 | [diff] [blame] | 220 | hal_lcd_display_box(imgStartX + (result.m_x0 + result.m_w)/imgDownscaleFactor - lineThickness, |
Richard Burton | 9c54990 | 2022-02-15 16:39:18 +0000 | [diff] [blame] | 221 | imgStartY + result.m_y0/imgDownscaleFactor, |
| 222 | lineThickness, result.m_h/imgDownscaleFactor, COLOR_GREEN); |
| 223 | } |
| 224 | } |
| 225 | |
Michael Levit | 06fcf75 | 2022-01-12 11:53:46 +0200 | [diff] [blame] | 226 | } /* namespace app */ |
| 227 | } /* namespace arm */ |