1 //===-- Perf.cpp ----------------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "Perf.h"
10 
11 #include "Plugins/Process/POSIX/ProcessPOSIXLog.h"
12 #include "lldb/Host/linux/Support.h"
13 
14 #include "llvm/Support/FormatVariadic.h"
15 #include "llvm/Support/MathExtras.h"
16 #include "llvm/Support/MemoryBuffer.h"
17 
18 #include <linux/version.h>
19 #include <sys/ioctl.h>
20 #include <sys/mman.h>
21 #include <sys/syscall.h>
22 #include <unistd.h>
23 
24 using namespace lldb_private;
25 using namespace process_linux;
26 using namespace llvm;
27 
28 Expected<LinuxPerfZeroTscConversion>
29 lldb_private::process_linux::LoadPerfTscConversionParameters() {
30 #if LINUX_VERSION_CODE >= KERNEL_VERSION(3,12,0)
31   lldb::pid_t pid = getpid();
32   perf_event_attr attr;
33   memset(&attr, 0, sizeof(attr));
34   attr.size = sizeof(attr);
35   attr.type = PERF_TYPE_SOFTWARE;
36   attr.config = PERF_COUNT_SW_DUMMY;
37 
38   Expected<PerfEvent> perf_event = PerfEvent::Init(attr, pid);
39   if (!perf_event)
40     return perf_event.takeError();
41   if (Error mmap_err =
42           perf_event->MmapMetadataAndBuffers(/*num_data_pages=*/0,
43                                              /*num_aux_pages=*/0,
44                                              /*data_buffer_write=*/false))
45     return std::move(mmap_err);
46 
47   perf_event_mmap_page &mmap_metada = perf_event->GetMetadataPage();
48   if (mmap_metada.cap_user_time && mmap_metada.cap_user_time_zero) {
49     return LinuxPerfZeroTscConversion{
50         mmap_metada.time_mult, mmap_metada.time_shift, {mmap_metada.time_zero}};
51   } else {
52     auto err_cap =
53         !mmap_metada.cap_user_time ? "cap_user_time" : "cap_user_time_zero";
54     std::string err_msg =
55         llvm::formatv("Can't get TSC to real time conversion values. "
56                       "perf_event capability '{0}' not supported.",
57                       err_cap);
58     return llvm::createStringError(llvm::inconvertibleErrorCode(), err_msg);
59   }
60 #else
61   std::string err_msg = "PERF_COUNT_SW_DUMMY requires Linux 3.12";
62   return llvm::createStringError(llvm::inconvertibleErrorCode(), err_msg);
63 #endif
64 }
65 
66 void resource_handle::MmapDeleter::operator()(void *ptr) {
67   if (m_bytes && ptr != nullptr)
68     munmap(ptr, m_bytes);
69 }
70 
71 void resource_handle::FileDescriptorDeleter::operator()(long *ptr) {
72   if (ptr == nullptr)
73     return;
74   if (*ptr == -1)
75     return;
76   close(*ptr);
77   std::default_delete<long>()(ptr);
78 }
79 
80 llvm::Expected<PerfEvent> PerfEvent::Init(perf_event_attr &attr,
81                                           Optional<lldb::pid_t> pid,
82                                           Optional<lldb::cpu_id_t> cpu,
83                                           Optional<long> group_fd,
84                                           unsigned long flags) {
85   errno = 0;
86   long fd = syscall(SYS_perf_event_open, &attr, pid.value_or(-1),
87                     cpu.value_or(-1), group_fd.value_or(-1), flags);
88   if (fd == -1) {
89     std::string err_msg =
90         llvm::formatv("perf event syscall failed: {0}", std::strerror(errno));
91     return llvm::createStringError(llvm::inconvertibleErrorCode(), err_msg);
92   }
93   return PerfEvent(fd, !attr.disabled);
94 }
95 
96 llvm::Expected<PerfEvent> PerfEvent::Init(perf_event_attr &attr,
97                                           Optional<lldb::pid_t> pid,
98                                           Optional<lldb::cpu_id_t> cpu) {
99   return Init(attr, pid, cpu, -1, 0);
100 }
101 
102 llvm::Expected<resource_handle::MmapUP>
103 PerfEvent::DoMmap(void *addr, size_t length, int prot, int flags,
104                   long int offset, llvm::StringRef buffer_name) {
105   errno = 0;
106   auto mmap_result = ::mmap(addr, length, prot, flags, GetFd(), offset);
107 
108   if (mmap_result == MAP_FAILED) {
109     std::string err_msg =
110         llvm::formatv("perf event mmap allocation failed for {0}: {1}",
111                       buffer_name, std::strerror(errno));
112     return createStringError(inconvertibleErrorCode(), err_msg);
113   }
114   return resource_handle::MmapUP(mmap_result, length);
115 }
116 
117 llvm::Error PerfEvent::MmapMetadataAndDataBuffer(size_t num_data_pages,
118                                                  bool data_buffer_write) {
119   size_t mmap_size = (num_data_pages + 1) * getpagesize();
120   if (Expected<resource_handle::MmapUP> mmap_metadata_data = DoMmap(
121           nullptr, mmap_size, PROT_READ | (data_buffer_write ? PROT_WRITE : 0),
122           MAP_SHARED, 0, "metadata and data buffer")) {
123     m_metadata_data_base = std::move(mmap_metadata_data.get());
124     return Error::success();
125   } else
126     return mmap_metadata_data.takeError();
127 }
128 
129 llvm::Error PerfEvent::MmapAuxBuffer(size_t num_aux_pages) {
130   if (num_aux_pages == 0)
131     return Error::success();
132 
133   perf_event_mmap_page &metadata_page = GetMetadataPage();
134 
135   metadata_page.aux_offset =
136       metadata_page.data_offset + metadata_page.data_size;
137   metadata_page.aux_size = num_aux_pages * getpagesize();
138 
139   if (Expected<resource_handle::MmapUP> mmap_aux =
140           DoMmap(nullptr, metadata_page.aux_size, PROT_READ, MAP_SHARED,
141                  metadata_page.aux_offset, "aux buffer")) {
142     m_aux_base = std::move(mmap_aux.get());
143     return Error::success();
144   } else
145     return mmap_aux.takeError();
146 }
147 
148 llvm::Error PerfEvent::MmapMetadataAndBuffers(size_t num_data_pages,
149                                               size_t num_aux_pages,
150                                               bool data_buffer_write) {
151   if (num_data_pages != 0 && !isPowerOf2_64(num_data_pages))
152     return llvm::createStringError(
153         llvm::inconvertibleErrorCode(),
154         llvm::formatv("Number of data pages must be a power of 2, got: {0}",
155                       num_data_pages));
156   if (num_aux_pages != 0 && !isPowerOf2_64(num_aux_pages))
157     return llvm::createStringError(
158         llvm::inconvertibleErrorCode(),
159         llvm::formatv("Number of aux pages must be a power of 2, got: {0}",
160                       num_aux_pages));
161   if (Error err = MmapMetadataAndDataBuffer(num_data_pages, data_buffer_write))
162     return err;
163   if (Error err = MmapAuxBuffer(num_aux_pages))
164     return err;
165   return Error::success();
166 }
167 
168 long PerfEvent::GetFd() const { return *(m_fd.get()); }
169 
170 perf_event_mmap_page &PerfEvent::GetMetadataPage() const {
171   return *reinterpret_cast<perf_event_mmap_page *>(m_metadata_data_base.get());
172 }
173 
174 ArrayRef<uint8_t> PerfEvent::GetDataBuffer() const {
175   perf_event_mmap_page &mmap_metadata = GetMetadataPage();
176   return {reinterpret_cast<uint8_t *>(m_metadata_data_base.get()) +
177               mmap_metadata.data_offset,
178            static_cast<size_t>(mmap_metadata.data_size)};
179 }
180 
181 ArrayRef<uint8_t> PerfEvent::GetAuxBuffer() const {
182   perf_event_mmap_page &mmap_metadata = GetMetadataPage();
183   return {reinterpret_cast<uint8_t *>(m_aux_base.get()),
184            static_cast<size_t>(mmap_metadata.aux_size)};
185 }
186 
187 Expected<std::vector<uint8_t>> PerfEvent::GetReadOnlyDataBuffer() {
188   // The following code assumes that the protection level of the DATA page
189   // is PROT_READ. If PROT_WRITE is used, then reading would require that
190   // this piece of code updates some pointers. See more about data_tail
191   // in https://man7.org/linux/man-pages/man2/perf_event_open.2.html.
192 
193   bool was_enabled = m_enabled;
194   if (Error err = DisableWithIoctl())
195     return std::move(err);
196 
197   /**
198    * The data buffer and aux buffer have different implementations
199    * with respect to their definition of head pointer when using PROD_READ only.
200    * In the case of Aux data buffer the head always wraps around the aux buffer
201    * and we don't need to care about it, whereas the data_head keeps
202    * increasing and needs to be wrapped by modulus operator
203    */
204   perf_event_mmap_page &mmap_metadata = GetMetadataPage();
205 
206   ArrayRef<uint8_t> data = GetDataBuffer();
207   uint64_t data_head = mmap_metadata.data_head;
208   uint64_t data_size = mmap_metadata.data_size;
209   std::vector<uint8_t> output;
210   output.reserve(data.size());
211 
212   if (data_head > data_size) {
213     uint64_t actual_data_head = data_head % data_size;
214     // The buffer has wrapped, so we first the oldest chunk of data
215     output.insert(output.end(), data.begin() + actual_data_head, data.end());
216     // And we we read the most recent chunk of data
217     output.insert(output.end(), data.begin(), data.begin() + actual_data_head);
218   } else {
219     // There's been no wrapping, so we just read linearly
220     output.insert(output.end(), data.begin(), data.begin() + data_head);
221   }
222 
223   if (was_enabled) {
224     if (Error err = EnableWithIoctl())
225       return std::move(err);
226   }
227 
228   return output;
229 }
230 
231 Expected<std::vector<uint8_t>> PerfEvent::GetReadOnlyAuxBuffer() {
232   // The following code assumes that the protection level of the AUX page
233   // is PROT_READ. If PROT_WRITE is used, then reading would require that
234   // this piece of code updates some pointers. See more about aux_tail
235   // in https://man7.org/linux/man-pages/man2/perf_event_open.2.html.
236 
237   bool was_enabled = m_enabled;
238   if (Error err = DisableWithIoctl())
239     return std::move(err);
240 
241   perf_event_mmap_page &mmap_metadata = GetMetadataPage();
242 
243   ArrayRef<uint8_t> data = GetAuxBuffer();
244   uint64_t aux_head = mmap_metadata.aux_head;
245   std::vector<uint8_t> output;
246   output.reserve(data.size());
247 
248   /**
249    * When configured as ring buffer, the aux buffer keeps wrapping around
250    * the buffer and its not possible to detect how many times the buffer
251    * wrapped. Initially the buffer is filled with zeros,as shown below
252    * so in order to get complete buffer we first copy firstpartsize, followed
253    * by any left over part from beginning to aux_head
254    *
255    * aux_offset [d,d,d,d,d,d,d,d,0,0,0,0,0,0,0,0,0,0,0] aux_size
256    *                 aux_head->||<- firstpartsize  ->|
257    *
258    * */
259 
260   output.insert(output.end(), data.begin() + aux_head, data.end());
261   output.insert(output.end(), data.begin(), data.begin() + aux_head);
262 
263   if (was_enabled) {
264     if (Error err = EnableWithIoctl())
265       return std::move(err);
266   }
267 
268   return output;
269 }
270 
271 Error PerfEvent::DisableWithIoctl() {
272   if (!m_enabled)
273     return Error::success();
274 
275   if (ioctl(*m_fd, PERF_EVENT_IOC_DISABLE, PERF_IOC_FLAG_GROUP) < 0)
276     return createStringError(inconvertibleErrorCode(),
277                              "Can't disable perf event. %s",
278                              std::strerror(errno));
279 
280   m_enabled = false;
281   return Error::success();
282 }
283 
284 bool PerfEvent::IsEnabled() const { return m_enabled; }
285 
286 Error PerfEvent::EnableWithIoctl() {
287   if (m_enabled)
288     return Error::success();
289 
290   if (ioctl(*m_fd, PERF_EVENT_IOC_ENABLE, PERF_IOC_FLAG_GROUP) < 0)
291     return createStringError(inconvertibleErrorCode(),
292                              "Can't enable perf event. %s",
293                              std::strerror(errno));
294 
295   m_enabled = true;
296   return Error::success();
297 }
298 
299 size_t PerfEvent::GetEffectiveDataBufferSize() const {
300   perf_event_mmap_page &mmap_metadata = GetMetadataPage();
301   if (mmap_metadata.data_head < mmap_metadata.data_size)
302     return mmap_metadata.data_head;
303   else
304     return mmap_metadata.data_size; // The buffer has wrapped.
305 }
306 
307 Expected<PerfEvent>
308 lldb_private::process_linux::CreateContextSwitchTracePerfEvent(
309     lldb::cpu_id_t cpu_id, const PerfEvent *parent_perf_event) {
310   Log *log = GetLog(POSIXLog::Trace);
311 #ifndef PERF_ATTR_SIZE_VER5
312   return createStringError(inconvertibleErrorCode(),
313                            "Intel PT Linux perf event not supported");
314 #else
315   perf_event_attr attr;
316   memset(&attr, 0, sizeof(attr));
317   attr.size = sizeof(attr);
318   attr.sample_type = PERF_SAMPLE_TID | PERF_SAMPLE_TIME;
319   attr.type = PERF_TYPE_SOFTWARE;
320   attr.context_switch = 1;
321   attr.exclude_kernel = 1;
322   attr.sample_id_all = 1;
323   attr.exclude_hv = 1;
324   attr.disabled = parent_perf_event ? !parent_perf_event->IsEnabled() : false;
325 
326   // The given perf configuration will produce context switch records of 32
327   // bytes each. Assuming that every context switch will be emitted twice (one
328   // for context switch ins and another one for context switch outs), and that a
329   // context switch will happen at least every half a millisecond per core, we
330   // need 500 * 32 bytes (~16 KB) for a trace of one second, which is much more
331   // than what a regular intel pt trace can get. Pessimistically we pick as
332   // 32KiB for the size of our context switch trace.
333 
334   uint64_t data_buffer_size = 32768;
335   uint64_t data_buffer_numpages = data_buffer_size / getpagesize();
336 
337   LLDB_LOG(log, "Will create context switch trace buffer of size {0}",
338            data_buffer_size);
339 
340   Optional<long> group_fd;
341   if (parent_perf_event)
342     group_fd = parent_perf_event->GetFd();
343 
344   if (Expected<PerfEvent> perf_event =
345           PerfEvent::Init(attr, /*pid=*/None, cpu_id, group_fd, /*flags=*/0)) {
346     if (Error mmap_err = perf_event->MmapMetadataAndBuffers(
347             data_buffer_numpages, 0, /*data_buffer_write=*/false)) {
348       return std::move(mmap_err);
349     }
350     return perf_event;
351   } else {
352     return perf_event.takeError();
353   }
354 #endif
355 }
356