[RFC PATCH 1/5] Application: reads perf cycle counter using perf_event_open syscall
Yogesh Tillu
yogesh.tillu at linaro.org
Mon Nov 3 07:04:01 PST 2014
This patch adds an application that reads the perf cycle counter using the
perf_event_open syscall.
Signed-off-by: Yogesh Tillu <yogesh.tillu at linaro.org>
---
app_readcounter.c | 83 +++++++++++++++++++++++++++++++++++++++++++++++++++++
1 file changed, 83 insertions(+)
create mode 100644 app_readcounter.c
diff --git a/app_readcounter.c b/app_readcounter.c
new file mode 100644
index 0000000..5363dd4
--- /dev/null
+++ b/app_readcounter.c
@@ -0,0 +1,83 @@
+/*
+Application to Read perf cycle counter using perf_event_open syscall
+
+To run: pass a number (the array length) to size the busy loop
+e.g.: $./app_readcounter 64
+
+*/
+#define _GNU_SOURCE
+#include <limits.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <unistd.h>
+#include <sys/types.h>
+#include <sys/syscall.h>
+#include <linux/perf_event.h>
+
+/* File descriptor of the perf cycle-counter event; -1 until init() opens it. */
+static int fddev = -1;
+
+/*
+ * Open a hardware CPU-cycle counter before main() runs (constructor
+ * attribute) and store its descriptor in fddev.
+ *
+ * perf_event_open is invoked with pid = 0, cpu = -1, group_fd = -1 and
+ * flags = 0. On failure fddev stays negative and a diagnostic is printed,
+ * so that a zero reading from cpucycles() can be explained.
+ */
+__attribute__((constructor)) static void
+init(void)
+{
+    /* Static storage guarantees every field not set below is zero. */
+    static struct perf_event_attr attr;
+
+    attr.type = PERF_TYPE_HARDWARE;
+    attr.size = sizeof(attr);
+    attr.config = PERF_COUNT_HW_CPU_CYCLES;
+
+    /* syscall() returns long; the value is a file descriptor or -1. */
+    fddev = (int)syscall(__NR_perf_event_open, &attr, 0, -1, -1, 0);
+    if (fddev < 0)
+        perror("perf_event_open");
+}
+
+/*
+ * Release the counter descriptor at program exit (destructor attribute).
+ * Skips close() when fddev does not hold a valid descriptor.
+ */
+__attribute__((destructor)) static void
+fini(void)
+{
+    if (fddev >= 0) {
+        close(fddev);
+        fddev = -1;
+    }
+}
+
+/*
+ * Read the current value of the counter behind fddev.
+ *
+ * Returns the counter value, or 0 if the read fails or is short (including
+ * when fddev is not a valid descriptor).
+ */
+static inline long long
+cpucycles(void)
+{
+    long long result = 0;
+    ssize_t nread = read(fddev, &result, sizeof(result));
+
+    /*
+     * Compare in the signed domain: against a size_t, read()'s -1 would be
+     * converted to a huge unsigned value and never look "too small".
+     */
+    if (nread != (ssize_t)sizeof(result))
+        return 0;
+    return result;
+}
+
+/*
+ * Workload for the measurement: for every index where a[] exceeds b[],
+ * add a[idx] + 5 to an unsigned running total, and return that total
+ * converted to int. Kept static inline so it can be inlined at the call site.
+ */
+static inline int
+loop(int* __restrict__ a, int* __restrict__ b, int n)
+{
+    unsigned total = 0;
+    int idx = 0;
+
+    while (idx < n) {
+        if (b[idx] < a[idx]) {
+            total += (unsigned)(a[idx] + 5);
+        }
+        ++idx;
+    }
+    return (int)total;
+}
+
+/*
+ * Measure the counter delta across one call to loop() over two arrays of
+ * av[1] ints.
+ *
+ * Usage: app_readcounter <len>, with 0 <= len <= INT_MAX - 128 so that the
+ * fill values i + 128 cannot overflow an int.
+ *
+ * Returns 0 on success, EXIT_FAILURE on bad arguments or allocation failure.
+ */
+int
+main(int ac, char **av)
+{
+    const char *prog = (ac > 0 && av[0] != NULL) ? av[0] : "app_readcounter";
+    long long time_start = 0;
+    long long time_end = 0;
+    int *a = NULL;
+    int *b = NULL;
+    char *end = NULL;
+    long parsed = 0;
+    int len = 0;
+    int i, sum = 0;
+
+    if (ac != 2) {
+        fprintf(stderr, "usage: %s <len>\n", prog);
+        return EXIT_FAILURE;
+    }
+
+    /* strtol instead of atoi so garbage and out-of-range input is rejected. */
+    parsed = strtol(av[1], &end, 10);
+    if (end == av[1] || *end != '\0' || parsed < 0 || parsed > INT_MAX - 128) {
+        fprintf(stderr, "%s: invalid length '%s' (expected 0..%d)\n",
+                prog, av[1], INT_MAX - 128);
+        return EXIT_FAILURE;
+    }
+    len = (int)parsed;
+    printf("%s: len = %d\n", prog, len);
+
+    /* calloc checks the count * size multiplication for overflow. */
+    a = calloc((size_t)len, sizeof(*a));
+    b = calloc((size_t)len, sizeof(*b));
+    /* A zero-length request may legitimately return NULL. */
+    if (len > 0 && (a == NULL || b == NULL)) {
+        fprintf(stderr, "%s: cannot allocate two arrays of %d ints\n", prog, len);
+        free(a);
+        free(b);
+        return EXIT_FAILURE;
+    }
+
+    /* a[i] > b[i] for every i, so loop() takes its branch on each element. */
+    for (i = 0; i < len; ++i) {
+        a[i] = i+128;
+        b[i] = i+64;
+    }
+
+    printf("%s: beginning loop\n", prog);
+    time_start = cpucycles();
+    sum = loop(a, b, len);
+    time_end = cpucycles();
+    /* The delta is a signed long long, so it is printed with %lld. */
+    printf("%s: done. sum = %d; time delta = %lld\n", prog, sum, time_end - time_start);
+
+    free(a);
+    free(b);
+    return 0;
+}
--
1.7.9.5
More information about the linux-arm-kernel
mailing list