Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 1 | //===-- TimeProfiler.cpp - Hierarchical Time Profiler ---------------------===// |
| 2 | // |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 9 | // This file implements hierarchical time profiler. |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
| 13 | #include "llvm/Support/TimeProfiler.h" |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 14 | #include "llvm/ADT/StringMap.h" |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 15 | #include "llvm/Support/CommandLine.h" |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 16 | #include "llvm/Support/FileSystem.h" |
Anton Afanasyev | 6547d51 | 2019-04-16 06:35:07 +0000 | [diff] [blame] | 17 | #include "llvm/Support/JSON.h" |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 18 | #include <cassert> |
| 19 | #include <chrono> |
| 20 | #include <string> |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 21 | #include <vector> |
| 22 | |
| 23 | using namespace std::chrono; |
| 24 | |
| 25 | namespace llvm { |
| 26 | |
| 27 | TimeTraceProfiler *TimeTraceProfilerInstance = nullptr; |
| 28 | |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 29 | typedef duration<steady_clock::rep, steady_clock::period> DurationType; |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 30 | typedef time_point<steady_clock> TimePointType; |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 31 | typedef std::pair<size_t, DurationType> CountAndDurationType; |
| 32 | typedef std::pair<std::string, CountAndDurationType> |
| 33 | NameAndCountAndDurationType; |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 34 | |
| 35 | struct Entry { |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 36 | TimePointType Start; |
| 37 | TimePointType End; |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 38 | std::string Name; |
| 39 | std::string Detail; |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 40 | |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 41 | Entry(TimePointType &&S, TimePointType &&E, std::string &&N, std::string &&Dt) |
| 42 | : Start(std::move(S)), End(std::move(E)), Name(std::move(N)), |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 43 | Detail(std::move(Dt)){}; |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 44 | |
| 45 | // Calculate timings for FlameGraph. Cast time points to microsecond precision |
| 46 | // rather than casting duration. This avoid truncation issues causing inner |
| 47 | // scopes overruning outer scopes. |
| 48 | steady_clock::rep getFlameGraphStartUs(TimePointType StartTime) const { |
| 49 | return (time_point_cast<microseconds>(Start) - |
| 50 | time_point_cast<microseconds>(StartTime)) |
| 51 | .count(); |
| 52 | } |
| 53 | |
| 54 | steady_clock::rep getFlameGraphDurUs() const { |
| 55 | return (time_point_cast<microseconds>(End) - |
| 56 | time_point_cast<microseconds>(Start)) |
| 57 | .count(); |
| 58 | } |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 59 | }; |
| 60 | |
| 61 | struct TimeTraceProfiler { |
| 62 | TimeTraceProfiler() { |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 63 | StartTime = steady_clock::now(); |
| 64 | } |
| 65 | |
| 66 | void begin(std::string Name, llvm::function_ref<std::string()> Detail) { |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 67 | Stack.emplace_back(steady_clock::now(), TimePointType(), std::move(Name), |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 68 | Detail()); |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 69 | } |
| 70 | |
| 71 | void end() { |
| 72 | assert(!Stack.empty() && "Must call begin() first"); |
| 73 | auto &E = Stack.back(); |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 74 | E.End = steady_clock::now(); |
| 75 | |
| 76 | // Check that end times monotonically increase. |
| 77 | assert((Entries.empty() || |
| 78 | (E.getFlameGraphStartUs(StartTime) + E.getFlameGraphDurUs() >= |
| 79 | Entries.back().getFlameGraphStartUs(StartTime) + |
| 80 | Entries.back().getFlameGraphDurUs())) && |
| 81 | "TimeProfiler scope ended earlier than previous scope"); |
| 82 | |
| 83 | // Calculate duration at full precision for overall counts. |
| 84 | DurationType Duration = E.End - E.Start; |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 85 | |
Anton Afanasyev | 3f3a257 | 2019-08-19 22:58:26 +0000 | [diff] [blame] | 86 | // Only include sections longer or equal to TimeTraceGranularity msec. |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 87 | if (duration_cast<microseconds>(Duration).count() >= TimeTraceGranularity) |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 88 | Entries.emplace_back(E); |
| 89 | |
| 90 | // Track total time taken by each "name", but only the topmost levels of |
| 91 | // them; e.g. if there's a template instantiation that instantiates other |
| 92 | // templates from within, we only want to add the topmost one. "topmost" |
| 93 | // happens to be the ones that don't have any currently open entries above |
| 94 | // itself. |
| 95 | if (std::find_if(++Stack.rbegin(), Stack.rend(), [&](const Entry &Val) { |
| 96 | return Val.Name == E.Name; |
| 97 | }) == Stack.rend()) { |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 98 | auto &CountAndTotal = CountAndTotalPerName[E.Name]; |
| 99 | CountAndTotal.first++; |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 100 | CountAndTotal.second += Duration; |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 101 | } |
| 102 | |
| 103 | Stack.pop_back(); |
| 104 | } |
| 105 | |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 106 | void Write(raw_pwrite_stream &OS) { |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 107 | assert(Stack.empty() && |
| 108 | "All profiler sections should be ended when calling Write"); |
Sam McCall | a7edcfb | 2019-04-25 12:51:42 +0000 | [diff] [blame] | 109 | json::OStream J(OS); |
| 110 | J.objectBegin(); |
| 111 | J.attributeBegin("traceEvents"); |
| 112 | J.arrayBegin(); |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 113 | |
| 114 | // Emit all events for the main flame graph. |
| 115 | for (const auto &E : Entries) { |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 116 | auto StartUs = E.getFlameGraphStartUs(StartTime); |
| 117 | auto DurUs = E.getFlameGraphDurUs(); |
Anton Afanasyev | 6547d51 | 2019-04-16 06:35:07 +0000 | [diff] [blame] | 118 | |
Sam McCall | a7edcfb | 2019-04-25 12:51:42 +0000 | [diff] [blame] | 119 | J.object([&]{ |
| 120 | J.attribute("pid", 1); |
| 121 | J.attribute("tid", 0); |
| 122 | J.attribute("ph", "X"); |
| 123 | J.attribute("ts", StartUs); |
| 124 | J.attribute("dur", DurUs); |
| 125 | J.attribute("name", E.Name); |
| 126 | J.attributeObject("args", [&] { J.attribute("detail", E.Detail); }); |
Anton Afanasyev | 6547d51 | 2019-04-16 06:35:07 +0000 | [diff] [blame] | 127 | }); |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 128 | } |
| 129 | |
| 130 | // Emit totals by section name as additional "thread" events, sorted from |
| 131 | // longest one. |
| 132 | int Tid = 1; |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 133 | std::vector<NameAndCountAndDurationType> SortedTotals; |
| 134 | SortedTotals.reserve(CountAndTotalPerName.size()); |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 135 | for (const auto &E : CountAndTotalPerName) |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 136 | SortedTotals.emplace_back(E.getKey(), E.getValue()); |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 137 | |
| 138 | llvm::sort(SortedTotals.begin(), SortedTotals.end(), |
| 139 | [](const NameAndCountAndDurationType &A, |
| 140 | const NameAndCountAndDurationType &B) { |
| 141 | return A.second.second > B.second.second; |
| 142 | }); |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 143 | for (const auto &E : SortedTotals) { |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 144 | auto DurUs = duration_cast<microseconds>(E.second.second).count(); |
| 145 | auto Count = CountAndTotalPerName[E.first].first; |
Anton Afanasyev | 6547d51 | 2019-04-16 06:35:07 +0000 | [diff] [blame] | 146 | |
Sam McCall | a7edcfb | 2019-04-25 12:51:42 +0000 | [diff] [blame] | 147 | J.object([&]{ |
| 148 | J.attribute("pid", 1); |
| 149 | J.attribute("tid", Tid); |
| 150 | J.attribute("ph", "X"); |
| 151 | J.attribute("ts", 0); |
| 152 | J.attribute("dur", DurUs); |
| 153 | J.attribute("name", "Total " + E.first); |
| 154 | J.attributeObject("args", [&] { |
| 155 | J.attribute("count", int64_t(Count)); |
| 156 | J.attribute("avg ms", int64_t(DurUs / Count / 1000)); |
| 157 | }); |
Anton Afanasyev | 6547d51 | 2019-04-16 06:35:07 +0000 | [diff] [blame] | 158 | }); |
| 159 | |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 160 | ++Tid; |
| 161 | } |
| 162 | |
| 163 | // Emit metadata event with process name. |
Sam McCall | a7edcfb | 2019-04-25 12:51:42 +0000 | [diff] [blame] | 164 | J.object([&] { |
| 165 | J.attribute("cat", ""); |
| 166 | J.attribute("pid", 1); |
| 167 | J.attribute("tid", 0); |
| 168 | J.attribute("ts", 0); |
| 169 | J.attribute("ph", "M"); |
| 170 | J.attribute("name", "process_name"); |
| 171 | J.attributeObject("args", [&] { J.attribute("name", "clang"); }); |
Anton Afanasyev | 6547d51 | 2019-04-16 06:35:07 +0000 | [diff] [blame] | 172 | }); |
| 173 | |
Sam McCall | a7edcfb | 2019-04-25 12:51:42 +0000 | [diff] [blame] | 174 | J.arrayEnd(); |
| 175 | J.attributeEnd(); |
| 176 | J.objectEnd(); |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 177 | } |
| 178 | |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 179 | SmallVector<Entry, 16> Stack; |
| 180 | SmallVector<Entry, 128> Entries; |
Anton Afanasyev | 03c3e0d | 2019-04-09 12:18:44 +0000 | [diff] [blame] | 181 | StringMap<CountAndDurationType> CountAndTotalPerName; |
Russell Gallop | c6fda60 | 2019-09-05 09:26:04 +0000 | [diff] [blame] | 182 | TimePointType StartTime; |
Anton Afanasyev | 4fdcabf | 2019-07-24 14:55:40 +0000 | [diff] [blame] | 183 | |
| 184 | // Minimum time granularity (in microseconds) |
| 185 | unsigned TimeTraceGranularity; |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 186 | }; |
| 187 | |
Anton Afanasyev | 4fdcabf | 2019-07-24 14:55:40 +0000 | [diff] [blame] | 188 | void timeTraceProfilerInitialize(unsigned TimeTraceGranularity) { |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 189 | assert(TimeTraceProfilerInstance == nullptr && |
| 190 | "Profiler should not be initialized"); |
| 191 | TimeTraceProfilerInstance = new TimeTraceProfiler(); |
Anton Afanasyev | 4fdcabf | 2019-07-24 14:55:40 +0000 | [diff] [blame] | 192 | TimeTraceProfilerInstance->TimeTraceGranularity = TimeTraceGranularity; |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 193 | } |
| 194 | |
| 195 | void timeTraceProfilerCleanup() { |
| 196 | delete TimeTraceProfilerInstance; |
| 197 | TimeTraceProfilerInstance = nullptr; |
| 198 | } |
| 199 | |
Anton Afanasyev | 2653672 | 2019-04-15 21:02:47 +0000 | [diff] [blame] | 200 | void timeTraceProfilerWrite(raw_pwrite_stream &OS) { |
Anton Afanasyev | d880de2 | 2019-03-30 08:42:48 +0000 | [diff] [blame] | 201 | assert(TimeTraceProfilerInstance != nullptr && |
| 202 | "Profiler object can't be null"); |
| 203 | TimeTraceProfilerInstance->Write(OS); |
| 204 | } |
| 205 | |
| 206 | void timeTraceProfilerBegin(StringRef Name, StringRef Detail) { |
| 207 | if (TimeTraceProfilerInstance != nullptr) |
| 208 | TimeTraceProfilerInstance->begin(Name, [&]() { return Detail; }); |
| 209 | } |
| 210 | |
| 211 | void timeTraceProfilerBegin(StringRef Name, |
| 212 | llvm::function_ref<std::string()> Detail) { |
| 213 | if (TimeTraceProfilerInstance != nullptr) |
| 214 | TimeTraceProfilerInstance->begin(Name, Detail); |
| 215 | } |
| 216 | |
| 217 | void timeTraceProfilerEnd() { |
| 218 | if (TimeTraceProfilerInstance != nullptr) |
| 219 | TimeTraceProfilerInstance->end(); |
| 220 | } |
| 221 | |
| 222 | } // namespace llvm |