109d62154SDaniel Borkmann #ifndef _TOOLS_LINUX_RING_BUFFER_H_
209d62154SDaniel Borkmann #define _TOOLS_LINUX_RING_BUFFER_H_
309d62154SDaniel Borkmann 
409d62154SDaniel Borkmann #include <asm/barrier.h>
5db9a5fd0SJiri Olsa #include <linux/perf_event.h>
609d62154SDaniel Borkmann 
/*
 * Contract with kernel for walking the perf ring buffer from
 * user space requires the following barrier pairing (quote
 * from kernel/events/ring_buffer.c):
 *
 *   Since the mmap() consumer (userspace) can run on a
 *   different CPU:
 *
 *   kernel                             user
 *
 *   if (LOAD ->data_tail) {            LOAD ->data_head
 *                      (A)             smp_rmb()       (C)
 *      STORE $data                     LOAD $data
 *      smp_wmb()       (B)             smp_mb()        (D)
 *      STORE ->data_head               STORE ->data_tail
 *   }
 *
 *   Where A pairs with D, and B pairs with C.
 *
 *   In our case A is a control dependency that separates the
 *   load of the ->data_tail and the stores of $data. In case
 *   ->data_tail indicates there is no room in the buffer to
 *   store $data we do not.
 *
 *   D needs to be a full barrier since it separates the data
 *   READ from the tail WRITE.
 *
 *   For B a WMB is sufficient since it separates two WRITEs,
 *   and for C an RMB is sufficient since it separates two READs.
 *
 * Note, instead of B, C, D we could also use smp_store_release()
 * in B and D as well as smp_load_acquire() in C.
 *
 * However, this optimization does not make sense for all kernel
 * supported architectures since for a fair number it would
 * resolve into READ_ONCE() + smp_mb() pair for smp_load_acquire(),
 * and smp_mb() + WRITE_ONCE() pair for smp_store_release().
 *
 * Thus for those smp_wmb() in B and smp_rmb() in C would still
 * be less expensive. For the case of D this has either the same
 * cost or is less expensive, for example, due to TSO x86 can
 * avoid the CPU barrier entirely.
 */
5009d62154SDaniel Borkmann 
ring_buffer_read_head(struct perf_event_mmap_page * base)5109d62154SDaniel Borkmann static inline u64 ring_buffer_read_head(struct perf_event_mmap_page *base)
5209d62154SDaniel Borkmann {
5309d62154SDaniel Borkmann /*
5409d62154SDaniel Borkmann  * Architectures where smp_load_acquire() does not fallback to
5509d62154SDaniel Borkmann  * READ_ONCE() + smp_mb() pair.
5609d62154SDaniel Borkmann  */
5709d62154SDaniel Borkmann #if defined(__x86_64__) || defined(__aarch64__) || defined(__powerpc64__) || \
58*aa5736dcSCharlie Jenkins     defined(__ia64__) || defined(__sparc__) && defined(__arch64__) || defined(__riscv)
5909d62154SDaniel Borkmann 	return smp_load_acquire(&base->data_head);
6009d62154SDaniel Borkmann #else
6109d62154SDaniel Borkmann 	u64 head = READ_ONCE(base->data_head);
6209d62154SDaniel Borkmann 
6309d62154SDaniel Borkmann 	smp_rmb();
6409d62154SDaniel Borkmann 	return head;
6509d62154SDaniel Borkmann #endif
6609d62154SDaniel Borkmann }
6709d62154SDaniel Borkmann 
/*
 * Store @tail into ->data_tail of the perf mmap control page @base.
 *
 * This is the user-space side of barrier (D) in the kernel/user pairing:
 * smp_store_release() orders the caller's preceding reads of ring data
 * before the tail store becomes visible.
 */
static inline void ring_buffer_write_tail(struct perf_event_mmap_page *base,
					  u64 tail)
{
	smp_store_release(&base->data_tail, tail);
}
7309d62154SDaniel Borkmann 
7409d62154SDaniel Borkmann #endif /* _TOOLS_LINUX_RING_BUFFER_H_ */
75