#include "huge_page_deducer.h"

#include <limits>

#include "perf_data_utils.h"

#include "base/logging.h"

using PerfEvent = quipper::PerfDataProto::PerfEvent;
using MMapEvent = quipper::PerfDataProto::MMapEvent;

namespace quipper {
namespace {

// Filename perf reports for anonymous memory mappings.
const char kAnonFilename[] = "//anon";
const size_t kHugepageSize = 1 << 21;

// Returns true when |event| is an anonymous mapping, i.e. its filename is
// exactly kAnonFilename.
bool IsAnon(const MMapEvent& event) {
  return event.filename().compare(kAnonFilename) == 0;
}

// Returns true when |b| begins at the exact address where |a| ends and both
// mappings belong to the same pid.
bool IsContiguous(const MMapEvent& a, const MMapEvent& b) {
  if (a.pid() != b.pid()) {
    return false;
  }
  const auto end_of_a = a.start() + a.len();
  return end_of_a == b.start();
}

// Returns true when |a| and |b| may refer to the same file: either the
// filenames are identical, or at least one of the two is anonymous memory
// (and thus likely to be a --hugepage_text version of the same file).
bool IsEquivalentFile(const MMapEvent& a, const MMapEvent& b) {
  // perf attributes neighboring anonymous mappings under the argv[0]
  // filename rather than "//anon", so plain filename equality has to be
  // accepted in addition to the anonymous cases.
  if (IsAnon(a) || IsAnon(b)) {
    return true;
  }
  return a.filename() == b.filename();
}

// Replaces the filename (and its md5 prefix) of the MMapEvent carried by
// |event|, adjusting the event header size by the difference between the
// uint64-aligned lengths of the new and the old filename.
// |event| must contain an mmap_event.
void SetMmapFilename(PerfEvent* event, const string& new_filename,
                     uint64_t new_filename_md5_prefix) {
  CHECK(event->has_mmap_event());

  // Both lengths are taken before the filename is overwritten below.
  const auto aligned_new_len = GetUint64AlignedStringLength(new_filename);
  const auto aligned_old_len =
      GetUint64AlignedStringLength(event->mmap_event().filename());
  event->mutable_header()->set_size(event->header().size() + aligned_new_len -
                                    aligned_old_len);

  MMapEvent* target = event->mutable_mmap_event();
  target->set_filename(new_filename);
  target->set_filename_md5_prefix(new_filename_md5_prefix);
}

}  // namespace

namespace {

// MMapRange is a pair of indices [first, last] into a PerfEvents sequence
// delimiting a contiguous region of mmaps that all share the same filename
// and pgoff.
class MMapRange {
 public:
  // A default-constructed range is invalid (first > last).
  MMapRange() = default;

  // Builds a real range covering |first_index|..|last_index| inclusive.
  MMapRange(int first_index, int last_index)
      : first_(first_index), last_(last_index) {}

  // Number of bytes from the start of the first mmap to the end of the last.
  uint64 Len(const RepeatedPtrField<PerfEvent>& events) const {
    const MMapEvent& head = FirstMmap(events);
    const MMapEvent& tail = LastMmap(events);
    return tail.start() - head.start() + tail.len();
  }

  int FirstIndex() const { return first_; }
  int LastIndex() const { return last_; }

  // A range is valid as long as its bounds are not inverted.
  bool IsValid() const { return !(last_ < first_); }

  // The mmap event stored at the first index of the range.
  const MMapEvent& FirstMmap(const RepeatedPtrField<PerfEvent>& events) const {
    return events.Get(first_).mmap_event();
  }

  // The mmap event stored at the last index of the range.
  const MMapEvent& LastMmap(const RepeatedPtrField<PerfEvent>& events) const {
    return events.Get(last_).mmap_event();
  }

 private:
  int first_ = std::numeric_limits<int>::max();
  int last_ = std::numeric_limits<int>::min();
};

// Prints |r| as "[first,last]".
std::ostream& operator<<(std::ostream& os, const MMapRange& r) {
  return os << "[" << r.FirstIndex() << "," << r.LastIndex() << "]";
}

// MMapRange version of IsContiguous(MMapEvent, MMapEvent): the last mmap of
// |a| must be immediately followed by the first mmap of |b|.
bool IsContiguous(const RepeatedPtrField<PerfEvent>& events, const MMapRange& a,
                  const MMapRange& b) {
  const MMapEvent& tail_of_a = a.LastMmap(events);
  const MMapEvent& head_of_b = b.FirstMmap(events);
  return IsContiguous(tail_of_a, head_of_b);
}

// MMapRange version of IsEquivalentFile(MMapEvent, MMapEvent).
bool IsEquivalentFile(const RepeatedPtrField<PerfEvent>& events,
                      const MMapRange& a, const MMapRange& b) {
  // Every mmap inside a range shares one file, so comparing a single mmap
  // from |a| against a single mmap from |b| is assumed to be sufficient.
  const MMapEvent& tail_of_a = a.LastMmap(events);
  const MMapEvent& head_of_b = b.FirstMmap(events);
  return IsEquivalentFile(tail_of_a, head_of_b);
}

// FindRange returns a MMapRange of contiguous MmapEvents that:
// - either:
//   - contains 1 or more MmapEvents with pgoff == 0
//   - is a single MmapEvent with pgoff != 0
// - and:
//   - has the same filename for all entries
// Otherwise, if none can be found, an invalid range will be returned.
// The search begins at index |start|. Events that are not mmaps, and mmaps
// with a non-zero timestamp, are skipped: they neither start, extend, nor
// terminate a range.
MMapRange FindRange(const RepeatedPtrField<PerfEvent>& events, int start) {
  // Most recent mmap accepted into |range| (or the candidate that opens it).
  const MMapEvent* prev_mmap = nullptr;
  MMapRange range;
  for (int i = start; i < events.size(); i++) {
    const PerfEvent& event = events.Get(i);
    // Skip irrelevant events.
    if (!event.has_mmap_event()) {
      continue;
    }
    // Skip dynamic mmap() events. Hugepage deduction only works on mmaps as
    // synthesized by perf from /proc/${pid}/maps, which have timestamp==0.
    // Support for deducing hugepages from a sequence of mmap()/mremap() calls
    // would require additional deduction logic.
    if (event.timestamp() != 0) {
      continue;
    }
    const MMapEvent& mmap = event.mmap_event();
    if (prev_mmap == nullptr) {
      // First eligible mmap: it opens the range, whatever its pgoff is.
      range = MMapRange(i, i);
      prev_mmap = &mmap;
    }
    // Ranges match exactly: //anon,//anon, or file,file; If they use different
    // names, then deduction needs to consider them independently.
    if (prev_mmap->filename() != mmap.filename()) {
      break;
    }
    // If they're not virtually contiguous, they're not a single range.
    // The check only makes sense against a genuinely earlier mapping. The
    // opening mmap may sit at an index greater than |start| (when leading
    // events were skipped), so it is identified by address rather than by
    // comparing |i| with |start|; otherwise it would be compared against
    // itself and the range would be cut short after a single mapping.
    if (prev_mmap != &mmap && !IsContiguous(*prev_mmap, mmap)) {
      break;
    }
    // If this segment has a page offset, assume that it is *not* hugepage
    // backed, and thus does not need separate deduction.
    if (mmap.pgoff() != 0) {
      break;
    }
    // pgoff is known to be 0 at this point, so this check cannot fire; it is
    // retained as a statement of the expected invariant.
    CHECK(mmap.pgoff() == 0 || !IsAnon(mmap))
        << "Anonymous pages can't have pgoff set";
    prev_mmap = &mmap;
    range = MMapRange(range.FirstIndex(), i);
  }
  // Range has:
  // - single file
  // - virtually contiguous
  // - either: is multiple mappings *or* has pgoff=0
  return range;
}

// FindNextRange will return the next range after the given |prev_range| if
// there is one; otherwise it will return an invalid range.
MMapRange FindNextRange(const RepeatedPtrField<PerfEvent>& events, const MMapRange& prev_range) { MMapRange ret; if (prev_range.IsValid() && prev_range.LastIndex() < events.size()) { ret = FindRange(events, prev_range.LastIndex() + 1); } return ret; } // UpdateRangeFromNext will set the filename / pgoff of all mmaps within |range| // to be pgoff-contiguous with |next_range|, and match its file information. void UpdateRangeFromNext(const MMapRange& range, const MMapRange& next_range, RepeatedPtrField<PerfEvent>* events) { CHECK(range.LastIndex() < events->size()); CHECK(next_range.LastIndex() < events->size()); const MMapEvent& src = next_range.FirstMmap(*events); const uint64 start_pgoff = src.pgoff() - range.Len(*events); uint64 pgoff = start_pgoff; for (int i = range.FirstIndex(); i <= range.LastIndex(); i++) { if (!events->Get(i).has_mmap_event()) { continue; } PerfEvent* event = events->Mutable(i); MMapEvent* mmap = event->mutable_mmap_event(); // Replace "//anon" with a regular name if possible. if (IsAnon(*mmap)) { // ANDROID-CHANGED: protobuf-lite. CHECK_EQ(mmap->pgoff(), 0u) << "//anon should have offset=0 for mmap"; // << event->ShortDebugString(); SetMmapFilename(event, src.filename(), src.filename_md5_prefix()); } if (mmap->pgoff() == 0) { mmap->set_pgoff(pgoff); if (src.has_maj()) { mmap->set_maj(src.maj()); } if (src.has_min()) { mmap->set_min(src.min()); } if (src.has_ino()) { mmap->set_ino(src.ino()); } if (src.has_ino_generation()) { mmap->set_ino_generation(src.ino_generation()); } } pgoff += mmap->len(); } CHECK_EQ(pgoff, start_pgoff + range.Len(*events)); } } // namespace void DeduceHugePages(RepeatedPtrField<PerfEvent>* events) { // |prev_range|, if IsValid(), represents the preview mmap range seen (and // already processed / updated). MMapRange prev_range; // |range| contains the currently-being-processed mmap range, which will have // its hugepages ranges deduced. 
MMapRange range = FindRange(*events, 0); // |next_range| contains the next range to process, possibily containing // pgoff != 0 or !IsAnon(filename) from which the current range can be // updated. MMapRange next_range = FindNextRange(*events, range); for (; range.IsValid(); prev_range = range, range = next_range, next_range = FindNextRange(*events, range)) { const bool have_next = (next_range.IsValid() && IsContiguous(*events, range, next_range) && IsEquivalentFile(*events, range, next_range)); // If there's no mmap after this, then we assume that this is *not* viable // a hugepage_text mapping. This is true unless we're really unlucky. If: // - the binary is mapped such that the limit is hugepage aligned // (presumably 4Ki/2Mi chance == p=0.03125) // - and the entire binaryis hugepage_text mapped if (!have_next) { continue; } const bool have_prev = (prev_range.IsValid() && IsContiguous(*events, prev_range, range) && IsEquivalentFile(*events, prev_range, range) && IsEquivalentFile(*events, prev_range, next_range)); uint64 start_pgoff = 0; if (have_prev) { const auto& prev = prev_range.LastMmap(*events); start_pgoff = prev.pgoff() + prev.len(); } const auto& next = next_range.FirstMmap(*events); // prev.pgoff should be valid now, so let's double-check that // if next has a non-zero pgoff, that {prev,curr,next} will have // contiguous pgoff once updated. if (next.pgoff() >= range.Len(*events) && (next.pgoff() - range.Len(*events)) == start_pgoff) { UpdateRangeFromNext(range, next_range, events); } } } void CombineMappings(RepeatedPtrField<PerfEvent>* events) { // Combine mappings RepeatedPtrField<PerfEvent> new_events; new_events.Reserve(events->size()); // |prev| is the index of the last mmap_event in |new_events| (or // |new_events.size()| if no mmap_events have been inserted yet). 
int prev = 0; for (int i = 0; i < events->size(); ++i) { PerfEvent* event = events->Mutable(i); if (!event->has_mmap_event()) { new_events.Add()->Swap(event); continue; } const MMapEvent& mmap = event->mmap_event(); // Try to merge mmap with |new_events[prev]|. while (prev < new_events.size() && !new_events.Get(prev).has_mmap_event()) { prev++; } if (prev >= new_events.size()) { new_events.Add()->Swap(event); continue; } MMapEvent* prev_mmap = new_events.Mutable(prev)->mutable_mmap_event(); // Don't use IsEquivalentFile(); we don't want to combine //anon with // files if DeduceHugepages didn't already fix up the mappings. const bool file_match = prev_mmap->filename() == mmap.filename(); const bool pgoff_contiguous = file_match && (prev_mmap->pgoff() + prev_mmap->len() == mmap.pgoff()); const bool combine_mappings = IsContiguous(*prev_mmap, mmap) && pgoff_contiguous; if (!combine_mappings) { new_events.Add()->Swap(event); prev++; continue; } // Combine the lengths of the two mappings. prev_mmap->set_len(prev_mmap->len() + mmap.len()); } events->Swap(&new_events); } } // namespace quipper