|
|
@@ -0,0 +1,184 @@ |
|
|
//===-- TimeProfiler.cpp - Hierarchical Time Profiler ---------------------===// |
|
|
// |
|
|
// The LLVM Compiler Infrastructure |
|
|
// |
|
|
// This file is distributed under the University of Illinois Open Source |
|
|
// License. See LICENSE.TXT for details. |
|
|
// |
|
|
//===----------------------------------------------------------------------===// |
|
|
// |
|
|
/// \file Hierarchical time profiler implementation. |
|
|
// |
|
|
//===----------------------------------------------------------------------===// |
|
|
|
|
|
#include "llvm/Support/TimeProfiler.h" |
|
|
#include "llvm/ADT/StringExtras.h" |
|
|
#include "llvm/Support/FileSystem.h" |
|
|
#include <cassert> |
|
|
#include <chrono> |
|
|
#include <string> |
|
|
#include <unordered_map> |
|
|
#include <vector> |
|
|
|
|
|
using namespace std::chrono; |
|
|
|
|
|
namespace llvm { |
|
|
|
|
|
TimeTraceProfiler *TimeTraceProfilerInstance = nullptr; |
|
|
|
|
|
static std::string escapeString(StringRef Src) { |
|
|
std::string OS; |
|
|
for (const unsigned char &C : Src) { |
|
|
switch (C) { |
|
|
case '"': |
|
|
case '/': |
|
|
case '\\': |
|
|
case '\b': |
|
|
case '\f': |
|
|
case '\n': |
|
|
case '\r': |
|
|
case '\t': |
|
|
OS += '\\'; |
|
|
OS += C; |
|
|
break; |
|
|
default: |
|
|
if (isPrint(C)) { |
|
|
OS += C; |
|
|
} |
|
|
} |
|
|
} |
|
|
return OS; |
|
|
} |
|
|
|
|
|
typedef duration<steady_clock::rep, steady_clock::period> DurationType; |
|
|
typedef std::pair<std::string, DurationType> NameAndDuration; |
|
|
|
|
|
struct Entry { |
|
|
time_point<steady_clock> Start; |
|
|
DurationType Duration; |
|
|
std::string Name; |
|
|
std::string Detail; |
|
|
}; |
|
|
|
|
|
struct TimeTraceProfiler { |
|
|
TimeTraceProfiler() { |
|
|
Stack.reserve(8); |
|
|
Entries.reserve(128); |
|
|
StartTime = steady_clock::now(); |
|
|
} |
|
|
|
|
|
void begin(std::string Name, llvm::function_ref<std::string()> Detail) { |
|
|
Entry E = {steady_clock::now(), {}, Name, Detail()}; |
|
|
Stack.push_back(std::move(E)); |
|
|
} |
|
|
|
|
|
void end() { |
|
|
assert(!Stack.empty() && "Must call begin() first"); |
|
|
auto &E = Stack.back(); |
|
|
E.Duration = steady_clock::now() - E.Start; |
|
|
|
|
|
// Only include sections longer than 500us. |
|
|
if (duration_cast<microseconds>(E.Duration).count() > 500) |
|
|
Entries.emplace_back(E); |
|
|
|
|
|
// Track total time taken by each "name", but only the topmost levels of |
|
|
// them; e.g. if there's a template instantiation that instantiates other |
|
|
// templates from within, we only want to add the topmost one. "topmost" |
|
|
// happens to be the ones that don't have any currently open entries above |
|
|
// itself. |
|
|
if (std::find_if(++Stack.rbegin(), Stack.rend(), [&](const Entry &Val) { |
|
|
return Val.Name == E.Name; |
|
|
}) == Stack.rend()) { |
|
|
TotalPerName[E.Name] += E.Duration; |
|
|
CountPerName[E.Name]++; |
|
|
} |
|
|
|
|
|
Stack.pop_back(); |
|
|
} |
|
|
|
|
|
void Write(std::unique_ptr<raw_pwrite_stream> &OS) { |
|
|
assert(Stack.empty() && |
|
|
"All profiler sections should be ended when calling Write"); |
|
|
|
|
|
*OS << "{ \"traceEvents\": [\n"; |
|
|
|
|
|
// Emit all events for the main flame graph. |
|
|
for (const auto &E : Entries) { |
|
|
auto StartUs = duration_cast<microseconds>(E.Start - StartTime).count(); |
|
|
auto DurUs = duration_cast<microseconds>(E.Duration).count(); |
|
|
*OS << "{ \"pid\":1, \"tid\":0, \"ph\":\"X\", \"ts\":" << StartUs |
|
|
<< ", \"dur\":" << DurUs << ", \"name\":\"" << escapeString(E.Name) |
|
|
<< "\", \"args\":{ \"detail\":\"" << escapeString(E.Detail) |
|
|
<< "\"} },\n"; |
|
|
} |
|
|
|
|
|
// Emit totals by section name as additional "thread" events, sorted from |
|
|
// longest one. |
|
|
int Tid = 1; |
|
|
std::vector<NameAndDuration> SortedTotals; |
|
|
SortedTotals.reserve(TotalPerName.size()); |
|
|
for (const auto &E : TotalPerName) { |
|
|
SortedTotals.push_back(E); |
|
|
} |
|
|
std::sort(SortedTotals.begin(), SortedTotals.end(), |
|
|
[](const NameAndDuration &A, const NameAndDuration &B) { |
|
|
return A.second > B.second; |
|
|
}); |
|
|
for (const auto &E : SortedTotals) { |
|
|
auto DurUs = duration_cast<microseconds>(E.second).count(); |
|
|
*OS << "{ \"pid\":1, \"tid\":" << Tid << ", \"ph\":\"X\", \"ts\":" << 0 |
|
|
<< ", \"dur\":" << DurUs << ", \"name\":\"Total " |
|
|
<< escapeString(E.first) |
|
|
<< "\", \"args\":{ \"count\":" << CountPerName[E.first] |
|
|
<< ", \"avg ms\":" << (DurUs / CountPerName[E.first] / 1000) |
|
|
<< "} },\n"; |
|
|
++Tid; |
|
|
} |
|
|
|
|
|
// Emit metadata event with process name. |
|
|
*OS << "{ \"cat\":\"\", \"pid\":1, \"tid\":0, \"ts\":0, \"ph\":\"M\", " |
|
|
"\"name\":\"process_name\", \"args\":{ \"name\":\"clang\" } }\n"; |
|
|
*OS << "] }\n"; |
|
|
} |
|
|
|
|
|
std::vector<Entry> Stack; |
|
|
std::vector<Entry> Entries; |
|
|
std::unordered_map<std::string, DurationType> TotalPerName; |
|
|
std::unordered_map<std::string, size_t> CountPerName; |
|
|
time_point<steady_clock> StartTime; |
|
|
}; |
|
|
|
|
|
void timeTraceProfilerInitialize() { |
|
|
assert(TimeTraceProfilerInstance == nullptr && |
|
|
"Profiler should not be initialized"); |
|
|
TimeTraceProfilerInstance = new TimeTraceProfiler(); |
|
|
} |
|
|
|
|
|
void timeTraceProfilerCleanup() { |
|
|
delete TimeTraceProfilerInstance; |
|
|
TimeTraceProfilerInstance = nullptr; |
|
|
} |
|
|
|
|
|
void timeTraceProfilerWrite(std::unique_ptr<raw_pwrite_stream> &OS) { |
|
|
assert(TimeTraceProfilerInstance != nullptr && |
|
|
"Profiler object can't be null"); |
|
|
TimeTraceProfilerInstance->Write(OS); |
|
|
} |
|
|
|
|
|
void timeTraceProfilerBegin(StringRef Name, StringRef Detail) { |
|
|
if (TimeTraceProfilerInstance != nullptr) |
|
|
TimeTraceProfilerInstance->begin(Name, [&]() { return Detail; }); |
|
|
} |
|
|
|
|
|
void timeTraceProfilerBegin(StringRef Name, |
|
|
llvm::function_ref<std::string()> Detail) { |
|
|
if (TimeTraceProfilerInstance != nullptr) |
|
|
TimeTraceProfilerInstance->begin(Name, Detail); |
|
|
} |
|
|
|
|
|
void timeTraceProfilerEnd() { |
|
|
if (TimeTraceProfilerInstance != nullptr) |
|
|
TimeTraceProfilerInstance->end(); |
|
|
} |
|
|
|
|
|
} // namespace llvm |