#!/usr/bin/env python
# @lint-avoid-python-3-compatibility-imports
#
# softirqs  Summarize soft IRQ (interrupt) event time.
#           For Linux, uses BCC, eBPF.
#
# USAGE: softirqs [-h] [-T] [-N] [-C] [-d] [-c CPU] [interval] [count]
#
# Copyright (c) 2015 Brendan Gregg.
# Licensed under the Apache License, Version 2.0 (the "License")
#
# 20-Oct-2015   Brendan Gregg     Created this.
# 03-Apr-2017   Sasha Goldshtein  Migrated to kernel tracepoints.
# 07-Mar-2022   Rocky Xing        Added CPU filter support.
# 24-Mar-2022   Rocky Xing        Added event counting support.

from __future__ import print_function
from bcc import BPF
from time import sleep, strftime
import argparse
import sys

# arguments
examples = """examples:
    ./softirqs            # sum soft irq event time
    ./softirqs -C         # show the number of soft irq events
    ./softirqs -d         # show soft irq event time as histograms
    ./softirqs 1 10       # print 1 second summaries, 10 times
    ./softirqs -NT 1      # 1s summaries, nanoseconds, and timestamps
    ./softirqs -c 1       # sum soft irq event time on CPU 1 only
"""
parser = argparse.ArgumentParser(
    description="Summarize soft irq event time as histograms.",
    formatter_class=argparse.RawDescriptionHelpFormatter,
    epilog=examples)
parser.add_argument("-T", "--timestamp", action="store_true",
    help="include timestamp on output")
parser.add_argument("-N", "--nanoseconds", action="store_true",
    help="output in nanoseconds")
parser.add_argument("-C", "--events", action="store_true",
    help="show the number of soft irq events")
parser.add_argument("-d", "--dist", action="store_true",
    help="show distributions as histograms")
parser.add_argument("-c", "--cpu", type=int,
    help="trace this CPU only")
parser.add_argument("interval", nargs="?", default=99999999,
    help="output interval, in seconds")
parser.add_argument("count", nargs="?", default=99999999,
    help="number of outputs")
# hidden option: print the generated BPF program and exit
parser.add_argument("--ebpf", action="store_true",
    help=argparse.SUPPRESS)
args = parser.parse_args()
countdown = int(args.count)
if args.events and (args.dist or args.nanoseconds):
    print("The --events option can't be used with time-based options")
    # invalid usage: report failure to the caller instead of status 0
    sys.exit(1)

# factor: divisor applied to the nanosecond values before they are reported
# label:  unit name shown in the output header
if args.events:
    factor = 1
    label = "count"
elif args.nanoseconds:
    factor = 1
    label = "nsecs"
else:
    factor = 1000
    label = "usecs"
debug = 0

# define BPF program
# Common part: "start" remembers the entry timestamp and vector per
# (pid, cpu); "dist" accumulates the results per (vector, slot).
bpf_text = """
#include <uapi/linux/ptrace.h>

typedef struct entry_key {
    u32 pid;
    u32 cpu;
} entry_key_t;

typedef struct irq_key {
    u32 vec;
    u64 slot;
} irq_key_t;

typedef struct account_val {
    u64 ts;
    u32 vec;
} account_val_t;

BPF_HASH(start, entry_key_t, account_val_t);
BPF_HISTOGRAM(dist, irq_key_t);
"""

# -C mode: count softirq_entry events per vector
bpf_text_count = """
TRACEPOINT_PROBE(irq, softirq_entry)
{
    u32 cpu = bpf_get_smp_processor_id();

    FILTER_CPU

    irq_key_t key = { .slot = 0 /* ignore */ };
    key.vec = args->vec;

    dist.atomic_increment(key);

    return 0;
}
"""

# time mode: record a timestamp on entry, account the delta on exit
bpf_text_time = """
TRACEPOINT_PROBE(irq, softirq_entry)
{
    account_val_t val = {};
    entry_key_t key = {};
    u32 cpu = bpf_get_smp_processor_id();

    FILTER_CPU

    key.pid = bpf_get_current_pid_tgid();
    key.cpu = cpu;
    val.ts = bpf_ktime_get_ns();
    val.vec = args->vec;

    start.update(&key, &val);

    return 0;
}

TRACEPOINT_PROBE(irq, softirq_exit)
{
    u64 delta;
    u32 vec;
    account_val_t *valp;
    irq_key_t key = {0};
    entry_key_t entry_key = {};
    u32 cpu = bpf_get_smp_processor_id();

    FILTER_CPU

    entry_key.pid = bpf_get_current_pid_tgid();
    entry_key.cpu = cpu;

    // fetch timestamp and calculate delta
    valp = start.lookup(&entry_key);
    if (valp == 0) {
        return 0;   // missed start
    }
    delta = bpf_ktime_get_ns() - valp->ts;
    vec = valp->vec;

    // store as sum or histogram
    STORE

    start.delete(&entry_key);
    return 0;
}
"""

if args.events:
    bpf_text += bpf_text_count
else:
    bpf_text += bpf_text_time

# code substitutions
# STORE only occurs in the time-mode program; both variants key on the
# local "vec", which was copied from valp->vec just above the placeholder.
if args.dist:
    bpf_text = bpf_text.replace('STORE',
        'key.vec = vec; key.slot = bpf_log2l(delta / %d); ' % factor +
        'dist.atomic_increment(key);')
else:
    bpf_text = bpf_text.replace('STORE',
        'key.vec = vec; ' +
        'dist.atomic_increment(key, delta);')
if args.cpu is not None:
    bpf_text = bpf_text.replace('FILTER_CPU',
        'if (cpu != %d) { return 0; }' % int(args.cpu))
else:
    bpf_text = bpf_text.replace('FILTER_CPU', '')
if debug or args.ebpf:
    print(bpf_text)
    if args.ebpf:
        sys.exit()

# load BPF program
b = BPF(text=bpf_text)

# copied from softirq_to_name() in kernel/softirq.c
# may need updates if new softirq handlers are added
SOFTIRQ_NAMES = ("hi", "timer", "net_tx", "net_rx", "block", "irq_poll",
                 "tasklet", "sched", "hrtimer", "rcu")

def vec_to_name(vec):
    """Return the name of soft IRQ vector number vec.

    Vector numbers that are not in SOFTIRQ_NAMES are returned as their
    decimal string, so an unknown vector does not abort the output.
    """
    if 0 <= vec < len(SOFTIRQ_NAMES):
        return SOFTIRQ_NAMES[vec]
    return str(vec)

if args.events:
    print("Tracing soft irq events... Hit Ctrl-C to end.")
else:
    print("Tracing soft irq event time... Hit Ctrl-C to end.")

# output
exiting = 0 if args.interval else 1
interval = int(args.interval)
dist = b.get_table("dist")
while True:
    try:
        sleep(interval)
    except KeyboardInterrupt:
        # print one last summary below, then leave the loop
        exiting = 1

    print()
    if args.timestamp:
        print("%-8s\n" % strftime("%H:%M:%S"), end="")

    if args.dist:
        dist.print_log2_hist(label, "softirq", section_print_fn=vec_to_name)
    else:
        print("%-16s %11s" % ("SOFTIRQ", "TOTAL_" + label))
        # ascending by accumulated value
        for k, v in sorted(dist.items(), key=lambda kv: kv[1].value):
            print("%-16s %11d" % (vec_to_name(k.vec), v.value / factor))
    dist.clear()

    sys.stdout.flush()

    countdown -= 1
    if exiting or countdown == 0:
        sys.exit()