//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
#pragma once

#include "ProfilingEvent.hpp"

#include "armnn/ArmNN.hpp"
#include "armnn/IProfiler.hpp"

#include "WallClockTimer.hpp"

#include <chrono>
#include <ctime>
#include <iosfwd>
#include <map>
#include <memory>
#include <stack>
#include <string>
#include <type_traits>
#include <utility>
#include <vector>

#include <boost/core/ignore_unused.hpp>
22
telsoa014fcda012018-03-09 14:13:49 +000023namespace armnn
24{
25
telsoa014fcda012018-03-09 14:13:49 +000026// Simple single-threaded profiler.
27// Tracks events reported by BeginEvent()/EndEvent() and outputs detailed information and stats when
28// Profiler::AnalyzeEventsAndWriteResults() is called.
telsoa01c577f2c2018-08-31 09:22:23 +010029class Profiler final : public IProfiler
telsoa014fcda012018-03-09 14:13:49 +000030{
31public:
telsoa01c577f2c2018-08-31 09:22:23 +010032 Profiler();
33 ~Profiler();
34 using InstrumentPtr = std::unique_ptr<Instrument>;
35
telsoa014fcda012018-03-09 14:13:49 +000036 // Marks the beginning of a user-defined event.
telsoa01c577f2c2018-08-31 09:22:23 +010037 // No attempt will be made to copy the name string: it must be known at compile time.
38 Event* BeginEvent(Compute compute, const std::string& name, std::vector<InstrumentPtr>&& instruments);
telsoa014fcda012018-03-09 14:13:49 +000039
40 // Marks the end of a user-defined event.
telsoa01c577f2c2018-08-31 09:22:23 +010041 void EndEvent(Event* event);
42
43 // Enables/disables profiling.
44 void EnableProfiling(bool enableProfiling) override;
45
46 // Checks if profiling is enabled.
47 bool IsProfilingEnabled() override;
telsoa014fcda012018-03-09 14:13:49 +000048
49 // Increments the event tag, allowing grouping of events in a user-defined manner (e.g. per inference).
telsoa01c577f2c2018-08-31 09:22:23 +010050 void UpdateEventTag();
telsoa014fcda012018-03-09 14:13:49 +000051
52 // Analyzes the tracked events and writes the results to the given output stream.
53 // Please refer to the configuration variables in Profiling.cpp to customize the information written.
telsoa01c577f2c2018-08-31 09:22:23 +010054 void AnalyzeEventsAndWriteResults(std::ostream& outStream) const override;
telsoa014fcda012018-03-09 14:13:49 +000055
telsoa01c577f2c2018-08-31 09:22:23 +010056 // Print stats for events in JSON Format to the given output stream.
57 void Print(std::ostream& outStream) const override;
telsoa014fcda012018-03-09 14:13:49 +000058
telsoa01c577f2c2018-08-31 09:22:23 +010059 // Gets the color to render an event with, based on which device it denotes.
60 uint32_t GetEventColor(Compute compute) const;
telsoa014fcda012018-03-09 14:13:49 +000061
62private:
telsoa01c577f2c2018-08-31 09:22:23 +010063 using EventPtr = std::unique_ptr<Event>;
telsoa014fcda012018-03-09 14:13:49 +000064 struct Marker
65 {
66 std::size_t m_Id;
telsoa014fcda012018-03-09 14:13:49 +000067 };
68
69 struct ProfilingEventStats
70 {
71 double m_TotalMs;
72 double m_MinMs;
73 double m_MaxMs;
telsoa01c577f2c2018-08-31 09:22:23 +010074 uint32_t m_Count;
telsoa014fcda012018-03-09 14:13:49 +000075 };
76
telsoa014fcda012018-03-09 14:13:49 +000077 // Waits for a compute device to finish working to guarantee correct timings.
78 // Currently used exclusively when emitting profiling events denoting GPU work.
79 void WaitForDevice(Compute compute) const;
80
telsoa01c577f2c2018-08-31 09:22:23 +010081 template<typename EventIterType>
82 void AnalyzeEventSequenceAndWriteResults(EventIterType first, EventIterType last, std::ostream& outStream) const;
telsoa014fcda012018-03-09 14:13:49 +000083
84 std::map<std::string, ProfilingEventStats> CalculateProfilingEventStats() const;
telsoa01c577f2c2018-08-31 09:22:23 +010085 void PopulateInferences(std::vector<const Event*>& outInferences, int& outBaseLevel) const;
86 void PopulateDescendants(std::map<const Event*, std::vector<const Event*>>& outDescendantsMap) const;
telsoa014fcda012018-03-09 14:13:49 +000087
telsoa01c577f2c2018-08-31 09:22:23 +010088 std::stack<Event*> m_Parents;
89 std::vector<EventPtr> m_EventSequence;
90 bool m_ProfilingEnabled;
telsoa014fcda012018-03-09 14:13:49 +000091
telsoa01c577f2c2018-08-31 09:22:23 +010092private:
93 // Friend functions for unit testing, see ProfilerTests.cpp.
94 friend size_t GetProfilerEventSequenceSize(armnn::Profiler* profiler);
telsoa014fcda012018-03-09 14:13:49 +000095};
96
telsoa01c577f2c2018-08-31 09:22:23 +010097// Singleton profiler manager.
98// Keeps track of all the running profiler instances.
99class ProfilerManager
100{
101public:
102 // Register the given profiler as a thread local pointer.
103 void RegisterProfiler(Profiler* profiler);
104
105 // Gets the thread local pointer to the profiler.
106 Profiler* GetProfiler();
107
108 // Accesses the singleton.
109 static ProfilerManager& GetInstance();
110
111private:
112 // The constructor is kept private so that other instances of this class (other that the singleton's)
113 // can't be allocated.
114 ProfilerManager() {}
115};
116
117// Helper to easily add event markers to the codebase.
telsoa014fcda012018-03-09 14:13:49 +0000118class ScopedProfilingEvent
119{
120public:
telsoa01c577f2c2018-08-31 09:22:23 +0100121 using InstrumentPtr = std::unique_ptr<Instrument>;
122
123 template<typename... Args>
124 ScopedProfilingEvent(Compute compute, const std::string& name, Args... args)
125 : m_Event(nullptr)
126 , m_Profiler(ProfilerManager::GetInstance().GetProfiler())
telsoa014fcda012018-03-09 14:13:49 +0000127 {
telsoa01c577f2c2018-08-31 09:22:23 +0100128 if (m_Profiler && m_Profiler->IsProfilingEnabled())
129 {
130 std::vector<InstrumentPtr> instruments(0);
131 instruments.reserve(sizeof...(args)); //One allocation
132 ConstructNextInVector(instruments, args...);
133 m_Event = m_Profiler->BeginEvent(compute, name, std::move(instruments));
134 }
telsoa014fcda012018-03-09 14:13:49 +0000135 }
136
137 ~ScopedProfilingEvent()
138 {
telsoa01c577f2c2018-08-31 09:22:23 +0100139 if (m_Profiler && m_Event)
140 {
141 m_Profiler->EndEvent(m_Event);
142 }
telsoa014fcda012018-03-09 14:13:49 +0000143 }
144
145private:
telsoa01c577f2c2018-08-31 09:22:23 +0100146
147 void ConstructNextInVector(std::vector<InstrumentPtr>& instruments)
148 {
149 boost::ignore_unused(instruments);
150 }
151
152 template<typename Arg, typename... Args>
153 void ConstructNextInVector(std::vector<InstrumentPtr>& instruments, Arg arg, Args... args)
154 {
155 instruments.emplace_back(std::make_unique<Arg>(arg));
156 ConstructNextInVector(instruments, args...);
157 }
158
159 Event* m_Event; ///< Event to track
160 Profiler* m_Profiler; ///< Profiler used
telsoa014fcda012018-03-09 14:13:49 +0000161};
162
163} // namespace armnn
164
// Token-pasting helpers. Operands of ## are not macro-expanded, so pasting __LINE__ directly would
// produce the same literal identifier at every call site; routing it through a second macro lets
// __LINE__ expand to the actual line number first.
#define ARMNN_PROFILING_CONCAT_INNER(a, b) a##b
#define ARMNN_PROFILING_CONCAT(a, b) ARMNN_PROFILING_CONCAT_INNER(a, b)

// Declares a local armnn::ScopedProfilingEvent that lives until the end of the enclosing scope.
// Arguments are the compute device, the event name and then the instruments to attach.
// The variable name contains the line number, so several events may be declared in one scope as long
// as they are on different source lines. The expansion already ends with a semicolon.
#define ARMNN_SCOPED_PROFILING_EVENT_WITH_INSTRUMENTS(compute, /*name,*/ ...) \
    armnn::ScopedProfilingEvent ARMNN_PROFILING_CONCAT(e_, __LINE__)(compute, /*name,*/ __VA_ARGS__);

// Same as above, with a single armnn::WallClockTimer instrument attached.
#define ARMNN_SCOPED_PROFILING_EVENT(compute, name) \
    ARMNN_SCOPED_PROFILING_EVENT_WITH_INSTRUMENTS(compute, name, armnn::WallClockTimer())