1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * Performance counter support for e500 family processors.
4  *
5  * Copyright 2008-2009 Paul Mackerras, IBM Corporation.
6  * Copyright 2010 Freescale Semiconductor, Inc.
7  */
8 #include <linux/string.h>
9 #include <linux/perf_event.h>
10 #include <asm/reg.h>
11 #include <asm/cputable.h>
12 
13 /*
14  * Map of generic hardware event types to hardware events
15  * Zero if unsupported
16  */
17 static int e500_generic_events[] = {
18 	[PERF_COUNT_HW_CPU_CYCLES] = 1,
19 	[PERF_COUNT_HW_INSTRUCTIONS] = 2,
20 	[PERF_COUNT_HW_CACHE_MISSES] = 41, /* Data L1 cache reloads */
21 	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = 12,
22 	[PERF_COUNT_HW_BRANCH_MISSES] = 15,
23 	[PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = 18,
24 	[PERF_COUNT_HW_STALLED_CYCLES_BACKEND] = 19,
25 };
26 
27 #define C(x)	PERF_COUNT_HW_CACHE_##x
28 
29 /*
30  * Table of generalized cache-related events.
31  * 0 means not supported, -1 means nonsensical, other values
32  * are event codes.
33  */
34 static int e500_cache_events[C(MAX)][C(OP_MAX)][C(RESULT_MAX)] = {
35 	/*
36 	 * D-cache misses are not split into read/write/prefetch;
37 	 * use raw event 41.
38 	 */
39 	[C(L1D)] = {		/* 	RESULT_ACCESS	RESULT_MISS */
40 		[C(OP_READ)] = {	27,		0	},
41 		[C(OP_WRITE)] = {	28,		0	},
42 		[C(OP_PREFETCH)] = {	29,		0	},
43 	},
44 	[C(L1I)] = {		/* 	RESULT_ACCESS	RESULT_MISS */
45 		[C(OP_READ)] = {	2,		60	},
46 		[C(OP_WRITE)] = {	-1,		-1	},
47 		[C(OP_PREFETCH)] = {	0,		0	},
48 	},
49 	/*
50 	 * Assuming LL means L2, it's not a good match for this model.
51 	 * It allocates only on L1 castout or explicit prefetch, and
52 	 * does not have separate read/write events (but it does have
53 	 * separate instruction/data events).
54 	 */
55 	[C(LL)] = {		/* 	RESULT_ACCESS	RESULT_MISS */
56 		[C(OP_READ)] = {	0,		0	},
57 		[C(OP_WRITE)] = {	0,		0	},
58 		[C(OP_PREFETCH)] = {	0,		0	},
59 	},
60 	/*
61 	 * There are data/instruction MMU misses, but that's a miss on
62 	 * the chip's internal level-one TLB which is probably not
63 	 * what the user wants.  Instead, unified level-two TLB misses
64 	 * are reported here.
65 	 */
66 	[C(DTLB)] = {		/* 	RESULT_ACCESS	RESULT_MISS */
67 		[C(OP_READ)] = {	26,		66	},
68 		[C(OP_WRITE)] = {	-1,		-1	},
69 		[C(OP_PREFETCH)] = {	-1,		-1	},
70 	},
71 	[C(BPU)] = {		/* 	RESULT_ACCESS	RESULT_MISS */
72 		[C(OP_READ)] = {	12,		15 	},
73 		[C(OP_WRITE)] = {	-1,		-1	},
74 		[C(OP_PREFETCH)] = {	-1,		-1	},
75 	},
76 	[C(NODE)] = {		/* 	RESULT_ACCESS	RESULT_MISS */
77 		[C(OP_READ)] = {	-1,		-1 	},
78 		[C(OP_WRITE)] = {	-1,		-1	},
79 		[C(OP_PREFETCH)] = {	-1,		-1	},
80 	},
81 };
82 
83 static int num_events = 128;
84 
85 /* Upper half of event id is PMLCb, for threshold events */
e500_xlate_event(u64 event_id)86 static u64 e500_xlate_event(u64 event_id)
87 {
88 	u32 event_low = (u32)event_id;
89 	u64 ret;
90 
91 	if (event_low >= num_events)
92 		return 0;
93 
94 	ret = FSL_EMB_EVENT_VALID;
95 
96 	if (event_low >= 76 && event_low <= 81) {
97 		ret |= FSL_EMB_EVENT_RESTRICTED;
98 		ret |= event_id &
99 		       (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH);
100 	} else if (event_id &
101 	           (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH)) {
102 		/* Threshold requested on non-threshold event */
103 		return 0;
104 	}
105 
106 	return ret;
107 }
108 
109 static struct fsl_emb_pmu e500_pmu = {
110 	.name			= "e500 family",
111 	.n_counter		= 4,
112 	.n_restricted		= 2,
113 	.xlate_event		= e500_xlate_event,
114 	.n_generic		= ARRAY_SIZE(e500_generic_events),
115 	.generic_events		= e500_generic_events,
116 	.cache_events		= &e500_cache_events,
117 };
118 
init_e500_pmu(void)119 static int init_e500_pmu(void)
120 {
121 	if (!cur_cpu_spec->oprofile_cpu_type)
122 		return -ENODEV;
123 
124 	if (!strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e500mc"))
125 		num_events = 256;
126 	else if (strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e500"))
127 		return -ENODEV;
128 
129 	return register_fsl_emb_pmu(&e500_pmu);
130 }
131 
132 early_initcall(init_e500_pmu);
133