1#!/usr/bin/env python 2# 3# llcstat.py Summarize cache references and cache misses by PID. 4# Cache reference and cache miss are corresponding events defined in 5# uapi/linux/perf_event.h, it varies to different architecture. 6# On x86-64, they mean LLC references and LLC misses. 7# 8# For Linux, uses BCC, eBPF. Embedded C. 9# 10# SEE ALSO: perf top -e cache-misses -e cache-references -a -ns pid,cpu,comm 11# 12# REQUIRES: Linux 4.9+ (BPF_PROG_TYPE_PERF_EVENT support). 13# 14# Copyright (c) 2016 Facebook, Inc. 15# Licensed under the Apache License, Version 2.0 (the "License") 16# 17# 19-Oct-2016 Teng Qin Created this. 18 19from __future__ import print_function 20import argparse 21from bcc import BPF, PerfType, PerfHWConfig 22import signal 23from time import sleep 24 25parser = argparse.ArgumentParser( 26 description="Summarize cache references and misses by PID", 27 formatter_class=argparse.RawDescriptionHelpFormatter) 28parser.add_argument( 29 "-c", "--sample_period", type=int, default=100, 30 help="Sample one in this many number of cache reference / miss events") 31parser.add_argument( 32 "duration", nargs="?", default=10, help="Duration, in seconds, to run") 33parser.add_argument("--ebpf", action="store_true", 34 help=argparse.SUPPRESS) 35args = parser.parse_args() 36 37# load BPF program 38bpf_text=""" 39#include <linux/ptrace.h> 40#include <uapi/linux/bpf_perf_event.h> 41 42struct key_t { 43 int cpu; 44 int pid; 45 char name[TASK_COMM_LEN]; 46}; 47 48BPF_HASH(ref_count, struct key_t); 49BPF_HASH(miss_count, struct key_t); 50 51static inline __attribute__((always_inline)) void get_key(struct key_t* key) { 52 key->cpu = bpf_get_smp_processor_id(); 53 key->pid = bpf_get_current_pid_tgid(); 54 bpf_get_current_comm(&(key->name), sizeof(key->name)); 55} 56 57int on_cache_miss(struct bpf_perf_event_data *ctx) { 58 struct key_t key = {}; 59 get_key(&key); 60 61 miss_count.increment(key, ctx->sample_period); 62 63 return 0; 64} 65 66int on_cache_ref(struct bpf_perf_event_data *ctx) { 67 struct key_t key = {}; 68 get_key(&key); 69 70 ref_count.increment(key, ctx->sample_period); 71 72 return 0; 73} 74""" 75 76if args.ebpf: 77 print(bpf_text) 78 exit() 79 80b = BPF(text=bpf_text) 81try: 82 b.attach_perf_event( 83 ev_type=PerfType.HARDWARE, ev_config=PerfHWConfig.CACHE_MISSES, 84 fn_name="on_cache_miss", sample_period=args.sample_period) 85 b.attach_perf_event( 86 ev_type=PerfType.HARDWARE, ev_config=PerfHWConfig.CACHE_REFERENCES, 87 fn_name="on_cache_ref", sample_period=args.sample_period) 88except Exception: 89 print("Failed to attach to a hardware event. Is this a virtual machine?") 90 exit() 91 92print("Running for {} seconds or hit Ctrl-C to end.".format(args.duration)) 93 94try: 95 sleep(float(args.duration)) 96except KeyboardInterrupt: 97 signal.signal(signal.SIGINT, lambda signal, frame: print()) 98 99miss_count = {} 100for (k, v) in b.get_table('miss_count').items(): 101 miss_count[(k.pid, k.cpu, k.name)] = v.value 102 103print('PID NAME CPU REFERENCE MISS HIT%') 104tot_ref = 0 105tot_miss = 0 106for (k, v) in b.get_table('ref_count').items(): 107 try: 108 miss = miss_count[(k.pid, k.cpu, k.name)] 109 except KeyError: 110 miss = 0 111 tot_ref += v.value 112 tot_miss += miss 113 # This happens on some PIDs due to missed counts caused by sampling 114 hit = (v.value - miss) if (v.value >= miss) else 0 115 print('{:<8d} {:<16s} {:<4d} {:>12d} {:>12d} {:>6.2f}%'.format( 116 k.pid, k.name.decode('utf-8', 'replace'), k.cpu, v.value, miss, 117 (float(hit) / float(v.value)) * 100.0)) 118print('Total References: {} Total Misses: {} Hit Rate: {:.2f}%'.format( 119 tot_ref, tot_miss, (float(tot_ref - tot_miss) / float(tot_ref)) * 100.0)) 120