184 lines
5.0 KiB
Python
Executable File
184 lines
5.0 KiB
Python
Executable File
#!/usr/bin/python
|
|
# @lint-avoid-python-3-compatibility-imports
|
|
#
|
|
# readahead Show performance of read-ahead cache
|
|
# For Linux, uses BCC, eBPF
|
|
#
|
|
# Copyright (c) 2020 Suchakra Sharma <mail@suchakra.in>
|
|
# Licensed under the Apache License, Version 2.0 (the "License")
|
|
# This was originally created for the BPF Performance Tools book
|
|
# published by Addison Wesley. ISBN-13: 9780136554820
|
|
# When copying or porting, include this comment.
|
|
#
|
|
# 20-Aug-2020 Suchakra Sharma Ported from bpftrace to BCC
|
|
# 17-Sep-2021 Hengqi Chen Migrated to kfunc
|
|
|
|
from __future__ import print_function
|
|
from bcc import BPF
|
|
from time import sleep
|
|
import ctypes as ct
|
|
import argparse
|
|
|
|
# arguments
examples = """examples:
    ./readahead -d 20 # monitor for 20 seconds and generate stats
"""

# Command line: a single optional -d/--duration, given in whole seconds.
parser = argparse.ArgumentParser(
    description="Monitor performance of read ahead cache",
    formatter_class=argparse.RawDescriptionHelpFormatter,
    epilog=examples)
parser.add_argument("-d", "--duration", type=int,
    help="total duration to monitor for, in seconds")
args = parser.parse_args()
# The duration is handed to sleep(), which raises ValueError for a negative
# value; reject it here with a normal usage error instead of a traceback.
if args.duration is not None and args.duration < 0:
    parser.error("duration must be a non-negative number of seconds")
if not args.duration:
    # No -d given (or -d 0): use a very large timeout so the tool
    # effectively runs until interrupted.
    args.duration = 99999999
|
|
|
|
# BPF program
# Declarations shared by both probe flavours below (bpf_text_kprobe and
# bpf_text_kfunc); one of the two is appended to this text before it is
# handed to BPF() for compilation.
bpf_text = """
#include <uapi/linux/ptrace.h>
#include <linux/mm_types.h>

BPF_HASH(flag, u32, u8); // used to track if we are in do_page_cache_readahead()
BPF_HASH(birth, struct page*, u64); // used to track timestamps of cache alloc'ed page
BPF_ARRAY(pages); // increment/decrement readahead pages
BPF_HISTOGRAM(dist);
"""
|
|
|
|
# kprobe/kretprobe flavour of the probes. The four functions are attached by
# name with attach_kprobe()/attach_kretprobe() further down in this script:
#   entry/exit__do_page_cache_readahead  mark the current thread as being
#                                        inside the read-ahead function
#   exit__page_cache_alloc               timestamp pages allocated while the
#                                        mark is set and count them
#   entry_mark_page_accessed             on first access of such a page,
#                                        record its age (ms) and uncount it
bpf_text_kprobe = """
int entry__do_page_cache_readahead(struct pt_regs *ctx) {
    u32 pid;
    u8 one = 1;
    pid = bpf_get_current_pid_tgid();
    flag.update(&pid, &one);
    return 0;
}

int exit__do_page_cache_readahead(struct pt_regs *ctx) {
    u32 pid;
    pid = bpf_get_current_pid_tgid();
    // Remove the entry rather than storing 0: otherwise the hash keeps one
    // stale element per thread that ever did read-ahead and can fill up.
    flag.delete(&pid);
    return 0;
}

int exit__page_cache_alloc(struct pt_regs *ctx) {
    u32 pid;
    u64 ts;
    struct page *retval = (struct page*) PT_REGS_RC(ctx);
    u32 zero = 0; // static key for accessing pages[0]
    pid = bpf_get_current_pid_tgid();
    u8 *f = flag.lookup(&pid);
    if (f != NULL && *f == 1) {
        ts = bpf_ktime_get_ns();
        birth.update(&retval, &ts);
        pages.atomic_increment(zero);
    }
    return 0;
}

int entry_mark_page_accessed(struct pt_regs *ctx) {
    u64 delta;
    struct page *arg0 = (struct page *) PT_REGS_PARM1(ctx);
    u32 zero = 0; // static key for accessing pages[0]
    u64 *bts = birth.lookup(&arg0);
    if (bts != NULL) {
        delta = bpf_ktime_get_ns() - *bts;
        dist.atomic_increment(bpf_log2l(delta/1000000));
        pages.atomic_increment(zero, -1);
        birth.delete(&arg0); // remove the entry from hashmap
    }
    return 0;
}
"""
|
|
|
|
# kfunc/kretfunc flavour of the same four probes. The RA_FUNC placeholder
# (it appears exactly twice) is substituted with the name of the kernel
# read-ahead function before this text is appended to bpf_text.
bpf_text_kfunc = """
KFUNC_PROBE(RA_FUNC)
{
    u32 pid = bpf_get_current_pid_tgid();
    u8 one = 1;

    flag.update(&pid, &one);
    return 0;
}

KRETFUNC_PROBE(RA_FUNC)
{
    u32 pid = bpf_get_current_pid_tgid();

    // Remove the entry rather than storing 0: otherwise the hash keeps one
    // stale element per thread that ever did read-ahead and can fill up.
    flag.delete(&pid);
    return 0;
}

KRETFUNC_PROBE(__page_cache_alloc, gfp_t gfp, struct page *retval)
{
    u64 ts;
    u32 zero = 0; // static key for accessing pages[0]
    u32 pid = bpf_get_current_pid_tgid();
    u8 *f = flag.lookup(&pid);

    if (f != NULL && *f == 1) {
        ts = bpf_ktime_get_ns();
        birth.update(&retval, &ts);
        pages.atomic_increment(zero);
    }
    return 0;
}

KFUNC_PROBE(mark_page_accessed, struct page *arg0)
{
    u64 delta;
    u32 zero = 0; // static key for accessing pages[0]
    u64 *bts = birth.lookup(&arg0);

    if (bts != NULL) {
        delta = bpf_ktime_get_ns() - *bts;
        dist.atomic_increment(bpf_log2l(delta/1000000));
        pages.atomic_increment(zero, -1);
        birth.delete(&arg0); // remove the entry from hashmap
    }
    return 0;
}
"""
|
|
|
|
# Build and load the BPF program. In both flavours the read-ahead function
# to trace is __do_page_cache_readahead when get_kprobe_functions() reports
# it, and do_page_cache_ra otherwise.
if BPF.support_kfunc():
    # kfunc flavour: the target name is baked into the program text, so no
    # explicit attach calls are made here.
    ra_func = ("__do_page_cache_readahead"
               if BPF.get_kprobe_functions(b"__do_page_cache_readahead")
               else "do_page_cache_ra")
    bpf_text = bpf_text + bpf_text_kfunc.replace("RA_FUNC", ra_func)
    b = BPF(text=bpf_text)
else:
    # kprobe flavour: compile first, then attach each handler by name.
    bpf_text = bpf_text + bpf_text_kprobe
    b = BPF(text=bpf_text)
    ra_event = ("__do_page_cache_readahead"
                if BPF.get_kprobe_functions(b"__do_page_cache_readahead")
                else "do_page_cache_ra")
    probes = (
        (b.attach_kprobe, ra_event, "entry__do_page_cache_readahead"),
        (b.attach_kretprobe, ra_event, "exit__do_page_cache_readahead"),
        (b.attach_kretprobe, "__page_cache_alloc", "exit__page_cache_alloc"),
        (b.attach_kprobe, "mark_page_accessed", "entry_mark_page_accessed"),
    )
    for attach, event, handler in probes:
        attach(event=event, fn_name=handler)

# header
print("Tracing... Hit Ctrl-C to end.")
|
|
|
|
# print
|
|
def print_stats():
    """Print the current read-ahead statistics, then reset them.

    Writes the value stored in slot 0 of the "pages" map (labelled
    "Read-ahead unused pages") followed by the "dist" log2 histogram
    (labelled "age (ms)"), and finally clears both maps.
    """
    print()
    unused_pages = b["pages"][ct.c_ulong(0)].value
    print("Read-ahead unused pages: %d" % (unused_pages))
    print("Histogram of read-ahead used page age (ms):")
    print("")
    age_hist = b["dist"]
    age_hist.print_log2_hist("age (ms)")
    # reset both maps once they have been reported
    age_hist.clear()
    b["pages"].clear()
|
|
|
|
# Trace for the requested duration, or until Ctrl-C, then report once and
# exit. -d is documented as the *total* duration to monitor for, so the
# statistics are printed a single time instead of once per interval forever.
try:
    sleep(args.duration)
except KeyboardInterrupt:
    # Ctrl-C just ends the wait early; the report below is still printed.
    pass
print_stats()
|