[PATCH] iommu/arm-smmu-v3: add tracepoints for cmdq_issue_cmdlist

Song Bao Hua (Barry Song) song.bao.hua at hisilicon.com
Fri Aug 28 03:55:18 EDT 2020



> -----Original Message-----
> From: Jean-Philippe Brucker [mailto:jean-philippe at linaro.org]
> Sent: Friday, August 28, 2020 7:41 PM
> To: Song Bao Hua (Barry Song) <song.bao.hua at hisilicon.com>
> Cc: iommu at lists.linux-foundation.org; linux-arm-kernel at lists.infradead.org;
> robin.murphy at arm.com; will at kernel.org; Linuxarm <linuxarm at huawei.com>
> Subject: Re: [PATCH] iommu/arm-smmu-v3: add tracepoints for
> cmdq_issue_cmdlist
> 
> Hi,
> 
> On Thu, Aug 27, 2020 at 09:33:51PM +1200, Barry Song wrote:
> > cmdq_issue_cmdlist() is the hotspot that uses a lot of time. This
> > patch adds tracepoints for it to help debug.
> >
> > Signed-off-by: Barry Song <song.bao.hua at hisilicon.com>
> > ---
> >  * can furthermore develop an eBPF program to benchmark using this
> > trace
> 
> Have you tried using kprobe and kretprobe instead of tracepoints?
> Any noticeable performance drop?

Yes. Please read this email thread:
"kprobe overhead and OPTPROBES implementation on ARM64"
https://www.spinics.net/lists/arm-kernel/msg828788.html

> 
> Thanks,
> Jean
> 
> >
> >   cmdlistlat.c:
> > #include <uapi/linux/ptrace.h>
> >
> > BPF_HASH(start, u32);
> > BPF_HISTOGRAM(dist);
> >
> > TRACEPOINT_PROBE(arm_smmu_v3, issue_cmdlist_entry) {
> >         u32 pid;
> >         u64 ts, *val;
> >
> >         pid = bpf_get_current_pid_tgid();
> >         ts = bpf_ktime_get_ns();
> >         start.update(&pid, &ts);
> >         return 0;
> > }
> >
> > TRACEPOINT_PROBE(arm_smmu_v3, issue_cmdlist_exit) {
> >         u32 pid;
> >         u64 *tsp, delta;
> >
> >         pid = bpf_get_current_pid_tgid();
> >         tsp = start.lookup(&pid);
> >
> >         if (tsp != 0) {
> >                 delta = bpf_ktime_get_ns() - *tsp;
> >                 dist.increment(bpf_log2l(delta));
> >                 start.delete(&pid);
> >         }
> >
> >         return 0;
> > }
> >
> >  cmdlistlat.py:
> > #!/usr/bin/python3
> > #
> > from __future__ import print_function
> > from bcc import BPF
> > from ctypes import c_ushort, c_int, c_ulonglong
> > from time import sleep
> > from sys import argv
> >
> > def usage():
> >         print("USAGE: %s [interval [count]]" % argv[0])
> >         exit()
> >
> > # arguments
> > interval = 5
> > count = -1
> > if len(argv) > 1:
> >         try:
> >                 interval = int(argv[1])
> >                 if interval == 0:
> >                         raise
> >                 if len(argv) > 2:
> >                         count = int(argv[2])
> >         except: # also catches -h, --help
> >                 usage()
> >
> > # load BPF program
> > b = BPF(src_file = "cmdlistlat.c")
> >
> > # header
> > print("Tracing... Hit Ctrl-C to end.")
> >
> > # output
> > loop = 0
> > do_exit = 0
> > while (1):
> >         if count > 0:
> >                 loop += 1
> >                 if loop > count:
> >                         exit()
> >         try:
> >                 sleep(interval)
> >         except KeyboardInterrupt:
> >                 pass; do_exit = 1
> >
> >         print()
> >         b["dist"].print_log2_hist("nsecs")
> >         b["dist"].clear()
> >         if do_exit:
> >                 exit()
> >
> >
> >  drivers/iommu/arm/arm-smmu-v3/Makefile        |  1 +
> >  .../iommu/arm/arm-smmu-v3/arm-smmu-v3-trace.h | 48 +++++++++++++++++++
> >  drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3.c   |  8 ++++
> >  3 files changed, 57 insertions(+)
> >  create mode 100644 drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3-trace.h
> >
> > diff --git a/drivers/iommu/arm/arm-smmu-v3/Makefile
> > b/drivers/iommu/arm/arm-smmu-v3/Makefile
> > index 569e24e9f162..dba1087f91f3 100644
> > --- a/drivers/iommu/arm/arm-smmu-v3/Makefile
> > +++ b/drivers/iommu/arm/arm-smmu-v3/Makefile
> > @@ -1,2 +1,3 @@
> >  # SPDX-License-Identifier: GPL-2.0
> > +ccflags-y += -I$(src)                   # needed for trace events
> >  obj-$(CONFIG_ARM_SMMU_V3) += arm-smmu-v3.o
> > diff --git a/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3-trace.h
> > b/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3-trace.h
> > new file mode 100644
> > index 000000000000..29ab96706124
> > --- /dev/null
> > +++ b/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3-trace.h
> > @@ -0,0 +1,48 @@
> > +/* SPDX-License-Identifier: GPL-2.0-only */
> > +/*
> > + * Copyright (C) 2020 Hisilicon Limited.
> > + */
> > +
> > +#undef TRACE_SYSTEM
> > +#define TRACE_SYSTEM arm_smmu_v3
> > +
> > +#if !defined(_ARM_SMMU_V3_TRACE_H) || defined(TRACE_HEADER_MULTI_READ)
> > +#define _ARM_SMMU_V3_TRACE_H
> > +
> > +#include <linux/tracepoint.h>
> > +
> > +struct device;
> > +
> > +DECLARE_EVENT_CLASS(issue_cmdlist_class,
> > +	TP_PROTO(struct device *dev, int n, bool sync),
> > +	TP_ARGS(dev, n, sync),
> > +
> > +	TP_STRUCT__entry(
> > +		__string(device, dev_name(dev))
> > +		__field(int, n)
> > +		__field(bool, sync)
> > +	),
> > +	TP_fast_assign(
> > +		__assign_str(device, dev_name(dev));
> > +		__entry->n = n;
> > +		__entry->sync = sync;
> > +	),
> > +	TP_printk("%s cmd number=%d sync=%d",
> > +			__get_str(device), __entry->n, __entry->sync) );
> > +
> > +#define DEFINE_ISSUE_CMDLIST_EVENT(name)       \
> > +DEFINE_EVENT(issue_cmdlist_class, name,        \
> > +	TP_PROTO(struct device *dev, int n, bool sync), \
> > +	TP_ARGS(dev, n, sync))
> > +
> > +DEFINE_ISSUE_CMDLIST_EVENT(issue_cmdlist_entry);
> > +DEFINE_ISSUE_CMDLIST_EVENT(issue_cmdlist_exit);
> > +
> > +#endif /* _ARM_SMMU_V3_TRACE_H */
> > +
> > +#undef TRACE_INCLUDE_PATH
> > +#undef TRACE_INCLUDE_FILE
> > +#define TRACE_INCLUDE_PATH .
> > +#define TRACE_INCLUDE_FILE arm-smmu-v3-trace
> > +#include <trace/define_trace.h>
> > diff --git a/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3.c
> > b/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3.c
> > index 7332251dd8cd..e2d7d5f1d234 100644
> > --- a/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3.c
> > +++ b/drivers/iommu/arm/arm-smmu-v3/arm-smmu-v3.c
> > @@ -33,6 +33,8 @@
> >
> >  #include <linux/amba/bus.h>
> >
> > +#include "arm-smmu-v3-trace.h"
> > +
> >  /* MMIO registers */
> >  #define ARM_SMMU_IDR0			0x0
> >  #define IDR0_ST_LVL			GENMASK(28, 27)
> > @@ -1389,6 +1391,8 @@ static int arm_smmu_cmdq_issue_cmdlist(struct arm_smmu_device *smmu,
> >  	}, head = llq;
> >  	int ret = 0;
> >
> > +	trace_issue_cmdlist_entry(smmu->dev, n, sync);
> > +
> >  	/* 1. Allocate some space in the queue */
> >  	local_irq_save(flags);
> >  	llq.val = READ_ONCE(cmdq->q.llq.val);
> > @@ -1493,6 +1497,7 @@ static int arm_smmu_cmdq_issue_cmdlist(struct arm_smmu_device *smmu,
> >  	}
> >
> >  	local_irq_restore(flags);
> > +	trace_issue_cmdlist_exit(smmu->dev, n, sync);
> >  	return ret;
> >  }
> >
> > @@ -4166,6 +4171,9 @@ static struct platform_driver arm_smmu_driver = {
> >  };
> >  module_platform_driver(arm_smmu_driver);
> >
> > +#define CREATE_TRACE_POINTS
> > +#include "arm-smmu-v3-trace.h"
> > +
> >  MODULE_DESCRIPTION("IOMMU API for ARM architected SMMUv3 implementations");
> >  MODULE_AUTHOR("Will Deacon <will at kernel.org>");
> >  MODULE_ALIAS("platform:arm-smmu-v3");
> > --
> > 2.27.0




More information about the linux-arm-kernel mailing list