blob: ae45275d8946a88f5805c49503f1112570c5a62f [file] [log] [blame]
#!/usr/bin/python
#
# biolatpcts.py IO latency percentile calculation example
#
# Copyright (C) 2020 Tejun Heo <tj@kernel.org>
# Copyright (C) 2020 Facebook
from __future__ import print_function
from bcc import BPF
from time import sleep
# Embedded BPF C program; it is handed to bcc via BPF(text=bpf_source).
#
# The program declares three per-CPU arrays of 100 u64 slots each and a raw
# tracepoint probe on block_rq_complete that fills them:
#   lat_100ms - slot = latency / 100ms; incremented for every measured request
#   lat_1ms   - slot = latency / 1ms;   only for requests in lat_100ms slot 0
#   lat_10us  - slot = latency / 10us;  only for requests in lat_1ms slot 0
# Latency is bpf_ktime_get_ns() minus rq->io_start_time_ns. Requests whose
# io_start_time_ns is zero are skipped, and every slot index is capped at 99.
# NOTE(review): cmd_flags and base are declared in the probe but appear unused.
bpf_source = """
#include <linux/blk_types.h>
#include <linux/blk-mq.h>
#include <linux/blkdev.h>
#include <linux/time64.h>
BPF_PERCPU_ARRAY(lat_100ms, u64, 100);
BPF_PERCPU_ARRAY(lat_1ms, u64, 100);
BPF_PERCPU_ARRAY(lat_10us, u64, 100);
RAW_TRACEPOINT_PROBE(block_rq_complete)
{
// TP_PROTO(struct request *rq, blk_status_t error, unsigned int nr_bytes)
struct request *rq = (void *)ctx->args[0];
unsigned int cmd_flags;
u64 dur;
size_t base, slot;
if (!rq->io_start_time_ns)
return 0;
dur = bpf_ktime_get_ns() - rq->io_start_time_ns;
slot = min_t(size_t, div_u64(dur, 100 * NSEC_PER_MSEC), 99);
lat_100ms.increment(slot);
if (slot)
return 0;
slot = min_t(size_t, div_u64(dur, NSEC_PER_MSEC), 99);
lat_1ms.increment(slot);
if (slot)
return 0;
slot = min_t(size_t, div_u64(dur, 10 * NSEC_PER_USEC), 99);
lat_10us.increment(slot);
return 0;
}
"""
# Hand the embedded C program to bcc.
bpf = BPF(text=bpf_source)

# Handles to the three histograms declared in bpf_source.
cur_lat_100ms, cur_lat_1ms, cur_lat_10us = (
    bpf[table] for table in ('lat_100ms', 'lat_1ms', 'lat_10us'))

# Per-slot values read from each histogram at the previous sample.
last_lat_100ms, last_lat_1ms, last_lat_10us = ([0] * 100 for _ in range(3))

# Per-slot increase observed between the two most recent samples.
lat_100ms, lat_1ms, lat_10us = ([0] * 100 for _ in range(3))
def find_pct(req, total, slots, idx, counted):
    """Scan a histogram downwards until the requested percentile is covered.

    Starting with the slot just below ``idx``, walk ``slots`` towards index 0
    and add every non-empty slot to ``counted``.  The scan stops at the first
    slot where the running count covers at least ``100 - req`` percent of
    ``total``.

    Args:
        req: Requested percentile, e.g. ``99`` or ``99.0``.
        total: Total number of samples the percentile refers to.
        slots: Indexable sequence of per-slot sample counts.
        idx: Exclusive upper bound of the scan; the first slot examined is
            ``idx - 1``.
        counted: Samples already accounted for above ``idx``.

    Returns:
        A ``(idx, counted)`` tuple: the slot index where the scan stopped and
        the updated running count.  ``idx`` is 0 both when slot 0 satisfied
        the request and when the scan ran out of slots.
    """
    while idx > 0:
        idx -= 1
        if slots[idx] > 0:
            counted += slots[idx]
            # Cross-multiplied form of (counted / total) * 100 >= 100 - req.
            # Avoiding the division keeps exact boundaries exact (29 / 100 *
            # 100 is 28.999999999999996 in floating point) and does not
            # truncate to zero under Python 2 integer division.
            if counted * 100 >= (100 - req) * total:
                break
    return (idx, counted)


def calc_lat_pct(req_pcts, total, lat_100ms, lat_1ms, lat_10us):
    """Compute latency percentiles from three nested histograms.

    The histograms are walked from the highest latency downwards.  The 100ms
    histogram is consulted first; when a percentile falls into its slot 0 the
    walk descends into the 1ms histogram, and likewise from there into the
    10us histogram.  The walk position and running count carry over from one
    requested percentile to the next, so ``req_pcts`` is expected in
    ascending order.

    Args:
        req_pcts: Requested percentiles in ascending order.
        total: Total number of samples.
        lat_100ms: 100 per-slot counts at 100ms granularity.
        lat_1ms: 100 per-slot counts at 1ms granularity.
        lat_10us: 100 per-slot counts at 10us granularity.

    Returns:
        A list parallel to ``req_pcts`` holding, for each percentile, the
        midpoint of the slot it falls into, in microseconds.  All zeros when
        ``total`` is 0.
    """
    pcts = [0] * len(req_pcts)

    if total == 0:
        return pcts

    # (slot width in microseconds, slot counts), coarsest first.
    data = [(100 * 1000, lat_100ms), (1000, lat_1ms), (10, lat_10us)]
    data_sel = 0
    idx = 100
    counted = 0
    placed = False  # True once (gran, idx) refers to a slot already found

    for pct_idx in reversed(range(len(req_pcts))):
        req = float(req_pcts[pct_idx])

        # A lower percentile can land in the very slot found for the previous
        # one.  find_pct() always moves below idx first, so only scan further
        # when the samples counted so far do not cover this request yet.
        if not (placed and counted * 100 >= (100 - req) * total):
            while True:
                (gran, slots) = data[data_sel]
                (idx, counted) = find_pct(req, total, slots, idx, counted)
                if idx > 0 or data_sel == len(data) - 1:
                    break
                # Slot 0 is broken down further by the next finer histogram,
                # so take only its samples back out.  Samples from higher
                # slots passed on the way down stay counted.
                if slots[0] > 0:
                    counted -= slots[0]
                data_sel += 1
                idx = 100

        pcts[pct_idx] = gran * idx + gran / 2
        placed = True

    return pcts
print('Block I/O latency percentile example. See tools/biolatpcts.py for the full utility.')

# One row per histogram: (BPF table, values at the previous sample, delta list).
histograms = (
    (cur_lat_100ms, last_lat_100ms, lat_100ms),
    (cur_lat_1ms, last_lat_1ms, lat_1ms),
    (cur_lat_10us, last_lat_10us, lat_10us),
)

# Every three seconds, turn the table values into per-interval deltas and
# print the percentiles computed from them.
while True:
    sleep(3)

    for slot in range(100):
        for table, previous, delta in histograms:
            current = table.sum(slot).value
            # Never report a negative delta.
            delta[slot] = max(current - previous[slot], 0)
            previous[slot] = current

    # The interval's sample total is the sum of the 100ms deltas.
    lat_total = sum(lat_100ms)

    target_pcts = [50, 75, 90, 99]
    pcts = calc_lat_pct(target_pcts, lat_total, lat_100ms, lat_1ms, lat_10us)
    for target, latency in zip(target_pcts, pcts):
        print('p{}={}us '.format(target, int(latency)), end='')
    print()