1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0+
2*4882a593Smuzhiyun
3*4882a593Smuzhiyun /*
4*4882a593Smuzhiyun * Copyright 2018 IBM Corporation.
5*4882a593Smuzhiyun */
6*4882a593Smuzhiyun
7*4882a593Smuzhiyun #define __SANE_USERSPACE_TYPES__
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <sys/types.h>
10*4882a593Smuzhiyun #include <stdint.h>
11*4882a593Smuzhiyun #include <malloc.h>
12*4882a593Smuzhiyun #include <unistd.h>
13*4882a593Smuzhiyun #include <signal.h>
14*4882a593Smuzhiyun #include <stdlib.h>
15*4882a593Smuzhiyun #include <string.h>
16*4882a593Smuzhiyun #include <stdio.h>
17*4882a593Smuzhiyun #include "utils.h"
18*4882a593Smuzhiyun #include "flush_utils.h"
19*4882a593Smuzhiyun
entry_flush_test(void)20*4882a593Smuzhiyun int entry_flush_test(void)
21*4882a593Smuzhiyun {
22*4882a593Smuzhiyun char *p;
23*4882a593Smuzhiyun int repetitions = 10;
24*4882a593Smuzhiyun int fd, passes = 0, iter, rc = 0;
25*4882a593Smuzhiyun struct perf_event_read v;
26*4882a593Smuzhiyun __u64 l1d_misses_total = 0;
27*4882a593Smuzhiyun unsigned long iterations = 100000, zero_size = 24 * 1024;
28*4882a593Smuzhiyun unsigned long l1d_misses_expected;
29*4882a593Smuzhiyun int rfi_flush_orig;
30*4882a593Smuzhiyun int entry_flush, entry_flush_orig;
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun SKIP_IF(geteuid() != 0);
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun // The PMU event we use only works on Power7 or later
35*4882a593Smuzhiyun SKIP_IF(!have_hwcap(PPC_FEATURE_ARCH_2_06));
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun if (read_debugfs_file("powerpc/rfi_flush", &rfi_flush_orig) < 0) {
38*4882a593Smuzhiyun perror("Unable to read powerpc/rfi_flush debugfs file");
39*4882a593Smuzhiyun SKIP_IF(1);
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun if (read_debugfs_file("powerpc/entry_flush", &entry_flush_orig) < 0) {
43*4882a593Smuzhiyun perror("Unable to read powerpc/entry_flush debugfs file");
44*4882a593Smuzhiyun SKIP_IF(1);
45*4882a593Smuzhiyun }
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun if (rfi_flush_orig != 0) {
48*4882a593Smuzhiyun if (write_debugfs_file("powerpc/rfi_flush", 0) < 0) {
49*4882a593Smuzhiyun perror("error writing to powerpc/rfi_flush debugfs file");
50*4882a593Smuzhiyun FAIL_IF(1);
51*4882a593Smuzhiyun }
52*4882a593Smuzhiyun }
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun entry_flush = entry_flush_orig;
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun fd = perf_event_open_counter(PERF_TYPE_HW_CACHE, PERF_L1D_READ_MISS_CONFIG, -1);
57*4882a593Smuzhiyun FAIL_IF(fd < 0);
58*4882a593Smuzhiyun
59*4882a593Smuzhiyun p = (char *)memalign(zero_size, CACHELINE_SIZE);
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun FAIL_IF(perf_event_enable(fd));
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun // disable L1 prefetching
64*4882a593Smuzhiyun set_dscr(1);
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun iter = repetitions;
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun /*
69*4882a593Smuzhiyun * We expect to see l1d miss for each cacheline access when entry_flush
70*4882a593Smuzhiyun * is set. Allow a small variation on this.
71*4882a593Smuzhiyun */
72*4882a593Smuzhiyun l1d_misses_expected = iterations * (zero_size / CACHELINE_SIZE - 2);
73*4882a593Smuzhiyun
74*4882a593Smuzhiyun again:
75*4882a593Smuzhiyun FAIL_IF(perf_event_reset(fd));
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun syscall_loop(p, iterations, zero_size);
78*4882a593Smuzhiyun
79*4882a593Smuzhiyun FAIL_IF(read(fd, &v, sizeof(v)) != sizeof(v));
80*4882a593Smuzhiyun
81*4882a593Smuzhiyun if (entry_flush && v.l1d_misses >= l1d_misses_expected)
82*4882a593Smuzhiyun passes++;
83*4882a593Smuzhiyun else if (!entry_flush && v.l1d_misses < (l1d_misses_expected / 2))
84*4882a593Smuzhiyun passes++;
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun l1d_misses_total += v.l1d_misses;
87*4882a593Smuzhiyun
88*4882a593Smuzhiyun while (--iter)
89*4882a593Smuzhiyun goto again;
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun if (passes < repetitions) {
92*4882a593Smuzhiyun printf("FAIL (L1D misses with entry_flush=%d: %llu %c %lu) [%d/%d failures]\n",
93*4882a593Smuzhiyun entry_flush, l1d_misses_total, entry_flush ? '<' : '>',
94*4882a593Smuzhiyun entry_flush ? repetitions * l1d_misses_expected :
95*4882a593Smuzhiyun repetitions * l1d_misses_expected / 2,
96*4882a593Smuzhiyun repetitions - passes, repetitions);
97*4882a593Smuzhiyun rc = 1;
98*4882a593Smuzhiyun } else {
99*4882a593Smuzhiyun printf("PASS (L1D misses with entry_flush=%d: %llu %c %lu) [%d/%d pass]\n",
100*4882a593Smuzhiyun entry_flush, l1d_misses_total, entry_flush ? '>' : '<',
101*4882a593Smuzhiyun entry_flush ? repetitions * l1d_misses_expected :
102*4882a593Smuzhiyun repetitions * l1d_misses_expected / 2,
103*4882a593Smuzhiyun passes, repetitions);
104*4882a593Smuzhiyun }
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun if (entry_flush == entry_flush_orig) {
107*4882a593Smuzhiyun entry_flush = !entry_flush_orig;
108*4882a593Smuzhiyun if (write_debugfs_file("powerpc/entry_flush", entry_flush) < 0) {
109*4882a593Smuzhiyun perror("error writing to powerpc/entry_flush debugfs file");
110*4882a593Smuzhiyun return 1;
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun iter = repetitions;
113*4882a593Smuzhiyun l1d_misses_total = 0;
114*4882a593Smuzhiyun passes = 0;
115*4882a593Smuzhiyun goto again;
116*4882a593Smuzhiyun }
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun perf_event_disable(fd);
119*4882a593Smuzhiyun close(fd);
120*4882a593Smuzhiyun
121*4882a593Smuzhiyun set_dscr(0);
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun if (write_debugfs_file("powerpc/rfi_flush", rfi_flush_orig) < 0) {
124*4882a593Smuzhiyun perror("unable to restore original value of powerpc/rfi_flush debugfs file");
125*4882a593Smuzhiyun return 1;
126*4882a593Smuzhiyun }
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun if (write_debugfs_file("powerpc/entry_flush", entry_flush_orig) < 0) {
129*4882a593Smuzhiyun perror("unable to restore original value of powerpc/entry_flush debugfs file");
130*4882a593Smuzhiyun return 1;
131*4882a593Smuzhiyun }
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun return rc;
134*4882a593Smuzhiyun }
135*4882a593Smuzhiyun
main(int argc,char * argv[])136*4882a593Smuzhiyun int main(int argc, char *argv[])
137*4882a593Smuzhiyun {
138*4882a593Smuzhiyun return test_harness(entry_flush_test, "entry_flush_test");
139*4882a593Smuzhiyun }
140