#!/usr/bin/python # @lint-avoid-python-3-compatibility-imports # # readahead Show performance of read-ahead cache # For Linux, uses BCC, eBPF # # Copyright (c) 2020 Suchakra Sharma # Licensed under the Apache License, Version 2.0 (the "License") # This was originally created for the BPF Performance Tools book # published by Addison Wesley. ISBN-13: 9780136554820 # When copying or porting, include this comment. # # 20-Aug-2020 Suchakra Sharma Ported from bpftrace to BCC from __future__ import print_function from bcc import BPF from time import sleep import ctypes as ct import argparse # arguments examples = """examples: ./readahead -d 20 # monitor for 10 seconds and generate stats """ parser = argparse.ArgumentParser( description="Monitor performance of read ahead cache", formatter_class=argparse.RawDescriptionHelpFormatter, epilog=examples) parser.add_argument("-d", "--duration", type=int, help="total duration to monitor for, in seconds") args = parser.parse_args() if not args.duration: args.duration = 99999999 # BPF program program = """ #include #include BPF_HASH(flag, u32, u8); // used to track if we are in do_page_cache_readahead() BPF_HASH(birth, struct page*, u64); // used to track timestamps of cache alloc'ed page BPF_ARRAY(pages); // increment/decrement readahead pages BPF_HISTOGRAM(dist); int entry__do_page_cache_readahead(struct pt_regs *ctx) { u32 pid; u8 one = 1; pid = bpf_get_current_pid_tgid(); flag.update(&pid, &one); return 0; } int exit__do_page_cache_readahead(struct pt_regs *ctx) { u32 pid; u8 zero = 0; pid = bpf_get_current_pid_tgid(); flag.update(&pid, &zero); return 0; } int exit__page_cache_alloc(struct pt_regs *ctx) { u32 pid; u64 ts; struct page *retval = (struct page*) PT_REGS_RC(ctx); u32 zero = 0; // static key for accessing pages[0] pid = bpf_get_current_pid_tgid(); u8 *f = flag.lookup(&pid); if (f != NULL && *f == 1) { ts = bpf_ktime_get_ns(); birth.update(&retval, &ts); u64 *count = pages.lookup(&zero); if (count) (*count)++; // increment read ahead pages count } return 0; } int entry_mark_page_accessed(struct pt_regs *ctx) { u64 ts, delta; struct page *arg0 = (struct page *) PT_REGS_PARM1(ctx); u32 zero = 0; // static key for accessing pages[0] u64 *bts = birth.lookup(&arg0); if (bts != NULL) { delta = bpf_ktime_get_ns() - *bts; dist.increment(bpf_log2l(delta/1000000)); u64 *count = pages.lookup(&zero); if (count) (*count)--; // decrement read ahead pages count birth.delete(&arg0); // remove the entry from hashmap } return 0; } """ b = BPF(text=program) b.attach_kprobe(event="__do_page_cache_readahead", fn_name="entry__do_page_cache_readahead") b.attach_kretprobe(event="__do_page_cache_readahead", fn_name="exit__do_page_cache_readahead") b.attach_kretprobe(event="__page_cache_alloc", fn_name="exit__page_cache_alloc") b.attach_kprobe(event="mark_page_accessed", fn_name="entry_mark_page_accessed") # header print("Tracing... Hit Ctrl-C to end.") # print def print_stats(): print() print("Read-ahead unused pages: %d" % (b["pages"][ct.c_ulong(0)].value)) print("Histogram of read-ahead used page age (ms):") print("") b["dist"].print_log2_hist("age (ms)") b["dist"].clear() b["pages"].clear() while True: try: sleep(args.duration) print_stats() except KeyboardInterrupt: print_stats() break