Thread (18 messages) 18 messages, 3 authors, 2020-09-04

Re: [PATCH v2 5/9] libperf: Add support for user space counter access

From: Rob Herring <robh@kernel.org>
Date: 2020-09-02 17:00:27
Also in: lkml

On Mon, Aug 31, 2020 at 3:11 AM Jiri Olsa [off-list ref] wrote:
On Fri, Aug 28, 2020 at 02:56:10PM -0600, Rob Herring wrote:

SNIP
quoted
+int perf_mmap__read_self(struct perf_mmap *map, struct perf_counts_values *count)
+{
+     struct perf_event_mmap_page *pc = map->base;
+     u32 seq, idx, time_mult = 0, time_shift = 0;
+     u64 cnt, cyc = 0, time_offset = 0, time_cycles = 0, time_mask = ~0ULL;
+
+     BUG_ON(!pc);
+
+     if (!pc->cap_user_rdpmc)
+             return -1;
+
+     do {
+             seq = READ_ONCE(pc->lock);
+             barrier();
+
+             count->ena = READ_ONCE(pc->time_enabled);
+             count->run = READ_ONCE(pc->time_running);
+
+             if (pc->cap_user_time && count->ena != count->run) {
+                     cyc = read_timestamp();
+                     time_mult = READ_ONCE(pc->time_mult);
+                     time_shift = READ_ONCE(pc->time_shift);
+                     time_offset = READ_ONCE(pc->time_offset);
+
+                     if (pc->cap_user_time_short) {
+                             time_cycles = READ_ONCE(pc->time_cycles);
+                             time_mask = READ_ONCE(pc->time_mask);
+                     }
+             }
+
+             idx = READ_ONCE(pc->index);
+             cnt = READ_ONCE(pc->offset);
+             if (pc->cap_user_rdpmc && idx) {
no need to check pc->cap_user_rdpmc again
I was thinking cap_user_rdpmc could change, but I guess idx will
always be 0 in that case.
quoted
+static int test_stat_user_read(int event)
+{
+     struct perf_counts_values counts = { .val = 0 };
+     struct perf_thread_map *threads;
+     struct perf_evsel *evsel;
+     struct perf_event_mmap_page *pc;
+     struct perf_event_attr attr = {
+             .type   = PERF_TYPE_HARDWARE,
+             .config = event,
+     };
+     int err, i;
+
+     threads = perf_thread_map__new_dummy();
+     __T("failed to create threads", threads);
+
+     perf_thread_map__set_pid(threads, 0, 0);
+
+     evsel = perf_evsel__new(&attr);
+     __T("failed to create evsel", evsel);
+
+     err = perf_evsel__open(evsel, NULL, threads);
+     __T("failed to open evsel", err == 0);
+
+     pc = perf_evsel__mmap(evsel);
+     __T("failed to mmap evsel", pc);
+
+#if defined(__i386__) || defined(__x86_64__) || defined(__aarch64__)
+     __T("userspace counter access not supported", pc->cap_user_rdpmc);
+     __T("userspace counter access not enabled", pc->index);
+     __T("userspace counter width not set", pc->pmc_width >= 32);
+#endif
+
+     perf_evsel__read(evsel, 0, 0, &counts);
+     __T("failed to read value for evsel", counts.val != 0);
+
+     fputs("\n", stderr);
+     for (i = 0; i < 5; i++) {
+             volatile int count = 0x10000 << i;
+             __u64 start, end, last = 0;
+
+             fprintf(stderr, "\tloop = %u, ", count);
we should add support to display verbose output for tests,
because right now this breaks the output:

- running test-cpumap.c...OK
- running test-threadmap.c...OK
- running test-evlist.c...OK
- running test-evsel.c...
        loop = 65536, count = 328035
        loop = 131072, count = 655715
        loop = 262144, count = 1311075
        loop = 524288, count = 2627060
        loop = 1048576, count = 5253540

        loop = 65536, count = 327594
        loop = 131072, count = 659930
        loop = 262144, count = 1378892
        loop = 524288, count = 2664341
        loop = 1048576, count = 5365682
OK

but we can do it in separate change later
Would you like me to just comment this out then for now?

Rob

_______________________________________________
linux-arm-kernel mailing list
linux-arm-kernel@lists.infradead.org
http://lists.infradead.org/mailman/listinfo/linux-arm-kernel
Keyboard shortcuts
hback out one level
jnext message in thread
kprevious message in thread
ldrill in
Escclose help / fold thread tree
?toggle this help