diff options
author | Tamar Christina <tamar.christina@arm.com> | 2022-04-20 15:42:15 +0100 |
---|---|---|
committer | Tamar Christina <tamar.christina@arm.com> | 2022-04-20 15:42:15 +0100 |
commit | dcf5fc3f60846b5d2e436befb934493f5132ffd9 (patch) | |
tree | 3c240ac7e1e9a39c1a43e022655594986ef9d567 | |
parent | 8b2fbaf32118b1312ae5663fc28b13fc23a82d0e (diff) |
perf: Fix profile reading to correctly take segments into account.
LNT's perf parsing implementation has a very subtle bug horrible bug:
It's assuming that the text segment starts at the same address that
the program was loaded at. Or rather, it assumes the text segment is
at address 0.
This is usually not the case (and indeed LLD itself puts many non-exec
Segments before the first exec one)
Because of this no event is matched for certain binaries. Also the
code can wrongly try to attribute an event to the wrong MMAP because
it only checks the starting address. This means that the order of the
MMAPs matters and again as of a few days ago the order coming out of
LLD places the binary itself after most SOs including ld.so.
By checking only the start address we can attribute an event to an SO
instead of to the program since trivially shared libraries are
loaded before the program itself in the virtual memory space. This
would later fail to resolve but we'd lose the event.
This patch changes it to also check for the ending position.
-rw-r--r-- | lnt/testing/profile/cPerf.cpp | 73 |
1 files changed, 66 insertions, 7 deletions
diff --git a/lnt/testing/profile/cPerf.cpp b/lnt/testing/profile/cPerf.cpp index 82336e8..95f7b17 100644 --- a/lnt/testing/profile/cPerf.cpp +++ b/lnt/testing/profile/cPerf.cpp @@ -129,7 +129,7 @@ FILE *ForkAndExec(std::string Cmd) { if (fork() == 0) { dup2(P[1], 1); close(P[0]); - execl("/bin/sh", "sh", "-c", Cmd.c_str(), 0); + execl("/bin/sh", "sh", "-c", Cmd.c_str(), (char *)NULL); } else { close(P[1]); } @@ -364,6 +364,12 @@ struct Map { const char *Filename; }; +struct EventDesc { + uint64_t Start; + uint64_t End; + size_t MapId; +}; + struct Symbol { uint64_t Start; uint64_t End; @@ -382,6 +388,55 @@ public: SymTabOutput(std::string Objdump, std::string BinaryCacheRoot) : Objdump(Objdump), BinaryCacheRoot(BinaryCacheRoot) {} + uint64_t fetchExecSegment(Map *M) { + std::string Cmd = Objdump + " -p -C " + + BinaryCacheRoot + std::string(M->Filename) + +#ifdef _WIN32 + " 2> NUL"; +#else + " 2>/dev/null"; +#endif + auto Stream = ForkAndExec(Cmd); + + char *Line = nullptr, *PrevLine = nullptr; + size_t LineLen = 0; + uint64_t offset = 0; + while (true) { + if (PrevLine) + free (PrevLine); + if (Line) + PrevLine = strdup (Line); + ssize_t Len = getline(&Line, &LineLen, Stream); + if (Len == -1) + break; + + char* pos; + if ((pos = strstr (Line, "flags r-x")) == NULL + && (pos = strstr (Line, "flags rwx")) == NULL) + continue; + + /* Format is weird.. but we did find the section so punt. */ + if ((pos = strstr (PrevLine, "vaddr ")) == NULL) + break; + + pos += 6; + offset = strtoull (pos, NULL, 16); + break; + } + if (Line) + free(Line); + if (PrevLine) + free(PrevLine); + +#ifdef _WIN32 + _pclose(Stream); +#else + fclose(Stream); + wait(NULL); +#endif + return offset; + } + void fetchSymbols(Map *M) { std::string Cmd = Objdump + " -t -T -C " + BinaryCacheRoot + std::string(M->Filename) + @@ -473,6 +528,10 @@ public: void reset(Map *M) { clear(); // Fetch both dynamic and static symbols, sort and unique them. + uint64_t segmentStart = fetchExecSegment (M); + /* Adjust the symbol to a value relative to the start of the load address + to match up with registerNewMapping. */ + M->Adjust -= segmentStart; fetchSymbols(M); std::sort(begin(), end()); @@ -626,7 +685,7 @@ private: std::map<const char *, uint64_t> TotalEvents; std::map<uint64_t, std::map<const char *, uint64_t>> TotalEventsPerMap; std::vector<Map> Maps; - std::map<uint64_t, std::map<uint64_t, size_t>> CurrentMaps; + std::map<uint64_t, std::map<uint64_t, EventDesc>> CurrentMaps; PyObject *Functions, *TopLevelCounters; std::vector<PyObject*> Lines; @@ -800,7 +859,7 @@ void PerfReader::registerNewMapping(unsigned char *Buf, const char *Filename) { // FIXME: The code assumes perf_event_attr.sample_id_all is set. uint64_t Time = getTimeFromSampleId(EndOfEvent, EventLayouts.begin()->second); auto &CurrentMap = CurrentMaps[Time]; - CurrentMap.insert({E->start, MapID}); + CurrentMap.insert({E->start, { E->start, End, MapID}}); } unsigned char *PerfReader::readEvent(unsigned char *Buf) { @@ -841,9 +900,9 @@ unsigned char *PerfReader::readEvent(unsigned char *Buf) { continue; --NewI; - if (NewI->first > PC) + if (NewI->second.Start > PC || NewI->second.End < PC) continue; - MapID = NewI->second; + MapID = NewI->second.MapId; break; } if (MapID != ~0ULL) { @@ -961,11 +1020,11 @@ void PerfReader::emitMaps() { if (AllUnderThreshold) continue; - uint64_t Adjust = Maps[MapID].Adjust; - SymTabOutput Syms(Objdump, BinaryCacheRoot); Syms.reset(&Maps[MapID]); + uint64_t Adjust = Maps[MapID].Adjust; + // Accumulate the event totals for each symbol auto Sym = Syms.begin(); auto Event = MapEvents.begin(); |