Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
torvalds
GitHub Repository: torvalds/linux
Path: blob/master/arch/powerpc/perf/isa207-common.h
26442 views
1
/* SPDX-License-Identifier: GPL-2.0-or-later */
2
/*
3
* Copyright 2009 Paul Mackerras, IBM Corporation.
4
* Copyright 2013 Michael Ellerman, IBM Corporation.
5
* Copyright 2016 Madhavan Srinivasan, IBM Corporation.
6
*/
7
8
#ifndef _LINUX_POWERPC_PERF_ISA207_COMMON_H_
9
#define _LINUX_POWERPC_PERF_ISA207_COMMON_H_
10
11
#include <linux/kernel.h>
12
#include <linux/perf_event.h>
13
#include <asm/firmware.h>
14
#include <asm/cputable.h>
15
16
#include "internal.h"
17
18
#define EVENT_EBB_MASK 1ull
19
#define EVENT_EBB_SHIFT PERF_EVENT_CONFIG_EBB_SHIFT
20
#define EVENT_BHRB_MASK 1ull
21
#define EVENT_BHRB_SHIFT 62
22
#define EVENT_WANTS_BHRB (EVENT_BHRB_MASK << EVENT_BHRB_SHIFT)
23
#define EVENT_IFM_MASK 3ull
24
#define EVENT_IFM_SHIFT 60
25
#define EVENT_THR_CMP_SHIFT 40 /* Threshold CMP value */
26
#define EVENT_THR_CMP_MASK 0x3ff
27
#define EVENT_THR_CTL_SHIFT 32 /* Threshold control value (start/stop) */
28
#define EVENT_THR_CTL_MASK 0xffull
29
#define EVENT_THR_SEL_SHIFT 29 /* Threshold select value */
30
#define EVENT_THR_SEL_MASK 0x7
31
#define EVENT_THRESH_SHIFT 29 /* All threshold bits */
32
#define EVENT_THRESH_MASK 0x1fffffull
33
#define EVENT_SAMPLE_SHIFT 24 /* Sampling mode & eligibility */
34
#define EVENT_SAMPLE_MASK 0x1f
35
#define EVENT_CACHE_SEL_SHIFT 20 /* L2/L3 cache select */
36
#define EVENT_CACHE_SEL_MASK 0xf
37
#define EVENT_IS_L1 (4 << EVENT_CACHE_SEL_SHIFT)
38
#define EVENT_PMC_SHIFT 16 /* PMC number (1-based) */
39
#define EVENT_PMC_MASK 0xf
40
#define EVENT_UNIT_SHIFT 12 /* Unit */
41
#define EVENT_UNIT_MASK 0xf
42
#define EVENT_COMBINE_SHIFT 11 /* Combine bit */
43
#define EVENT_COMBINE_MASK 0x1
44
#define EVENT_COMBINE(v) (((v) >> EVENT_COMBINE_SHIFT) & EVENT_COMBINE_MASK)
45
#define EVENT_MARKED_SHIFT 8 /* Marked bit */
46
#define EVENT_MARKED_MASK 0x1
47
#define EVENT_IS_MARKED (EVENT_MARKED_MASK << EVENT_MARKED_SHIFT)
48
#define EVENT_PSEL_MASK 0xff /* PMCxSEL value */
49
50
/* Bits defined by Linux */
51
#define EVENT_LINUX_MASK \
52
((EVENT_EBB_MASK << EVENT_EBB_SHIFT) | \
53
(EVENT_BHRB_MASK << EVENT_BHRB_SHIFT) | \
54
(EVENT_IFM_MASK << EVENT_IFM_SHIFT))
55
56
#define EVENT_VALID_MASK \
57
((EVENT_THRESH_MASK << EVENT_THRESH_SHIFT) | \
58
(EVENT_SAMPLE_MASK << EVENT_SAMPLE_SHIFT) | \
59
(EVENT_CACHE_SEL_MASK << EVENT_CACHE_SEL_SHIFT) | \
60
(EVENT_PMC_MASK << EVENT_PMC_SHIFT) | \
61
(EVENT_UNIT_MASK << EVENT_UNIT_SHIFT) | \
62
(EVENT_COMBINE_MASK << EVENT_COMBINE_SHIFT) | \
63
(EVENT_MARKED_MASK << EVENT_MARKED_SHIFT) | \
64
EVENT_LINUX_MASK | \
65
EVENT_PSEL_MASK)
66
67
#define ONLY_PLM \
68
(PERF_SAMPLE_BRANCH_USER |\
69
PERF_SAMPLE_BRANCH_KERNEL |\
70
PERF_SAMPLE_BRANCH_HV)
71
72
/* Contants to support power9 raw encoding format */
73
#define p9_EVENT_COMBINE_SHIFT 10 /* Combine bit */
74
#define p9_EVENT_COMBINE_MASK 0x3ull
75
#define p9_EVENT_COMBINE(v) (((v) >> p9_EVENT_COMBINE_SHIFT) & p9_EVENT_COMBINE_MASK)
76
#define p9_SDAR_MODE_SHIFT 50
77
#define p9_SDAR_MODE_MASK 0x3ull
78
#define p9_SDAR_MODE(v) (((v) >> p9_SDAR_MODE_SHIFT) & p9_SDAR_MODE_MASK)
79
80
#define p9_EVENT_VALID_MASK \
81
((p9_SDAR_MODE_MASK << p9_SDAR_MODE_SHIFT | \
82
(EVENT_THRESH_MASK << EVENT_THRESH_SHIFT) | \
83
(EVENT_SAMPLE_MASK << EVENT_SAMPLE_SHIFT) | \
84
(EVENT_CACHE_SEL_MASK << EVENT_CACHE_SEL_SHIFT) | \
85
(EVENT_PMC_MASK << EVENT_PMC_SHIFT) | \
86
(EVENT_UNIT_MASK << EVENT_UNIT_SHIFT) | \
87
(p9_EVENT_COMBINE_MASK << p9_EVENT_COMBINE_SHIFT) | \
88
(EVENT_MARKED_MASK << EVENT_MARKED_SHIFT) | \
89
EVENT_LINUX_MASK | \
90
EVENT_PSEL_MASK))
91
92
/* Contants to support power10 raw encoding format */
93
#define p10_SDAR_MODE_SHIFT 22
94
#define p10_SDAR_MODE_MASK 0x3ull
95
#define p10_SDAR_MODE(v) (((v) >> p10_SDAR_MODE_SHIFT) & \
96
p10_SDAR_MODE_MASK)
97
#define p10_EVENT_L2L3_SEL_MASK 0x1f
98
#define p10_L2L3_SEL_SHIFT 3
99
#define p10_L2L3_EVENT_SHIFT 40
100
#define p10_EVENT_THRESH_MASK 0xffffull
101
#define p10_EVENT_CACHE_SEL_MASK 0x3ull
102
#define p10_EVENT_MMCR3_MASK 0x7fffull
103
#define p10_EVENT_MMCR3_SHIFT 45
104
#define p10_EVENT_RADIX_SCOPE_QUAL_SHIFT 9
105
#define p10_EVENT_RADIX_SCOPE_QUAL_MASK 0x1
106
#define p10_MMCR1_RADIX_SCOPE_QUAL_SHIFT 45
107
108
/* Event Threshold Compare bit constant for power10 in config1 attribute */
109
#define p10_EVENT_THR_CMP_SHIFT 0
110
#define p10_EVENT_THR_CMP_MASK 0x3FFFFull
111
112
#define p10_EVENT_VALID_MASK \
113
((p10_SDAR_MODE_MASK << p10_SDAR_MODE_SHIFT | \
114
(p10_EVENT_THRESH_MASK << EVENT_THRESH_SHIFT) | \
115
(EVENT_SAMPLE_MASK << EVENT_SAMPLE_SHIFT) | \
116
(p10_EVENT_CACHE_SEL_MASK << EVENT_CACHE_SEL_SHIFT) | \
117
(EVENT_PMC_MASK << EVENT_PMC_SHIFT) | \
118
(EVENT_UNIT_MASK << EVENT_UNIT_SHIFT) | \
119
(p9_EVENT_COMBINE_MASK << p9_EVENT_COMBINE_SHIFT) | \
120
(p10_EVENT_MMCR3_MASK << p10_EVENT_MMCR3_SHIFT) | \
121
(EVENT_MARKED_MASK << EVENT_MARKED_SHIFT) | \
122
(p10_EVENT_RADIX_SCOPE_QUAL_MASK << p10_EVENT_RADIX_SCOPE_QUAL_SHIFT) | \
123
EVENT_LINUX_MASK | \
124
EVENT_PSEL_MASK))
125
/*
126
* Layout of constraint bits:
127
*
128
* 60 56 52 48 44 40 36 32
129
* | - - - - | - - - - | - - - - | - - - - | - - - - | - - - - | - - - - | - - - - |
130
* [ fab_match ] [ thresh_cmp ] [ thresh_ctl ] [ ]
131
* | |
132
* [ thresh_cmp bits for p10] thresh_sel -*
133
*
134
* 28 24 20 16 12 8 4 0
135
* | - - - - | - - - - | - - - - | - - - - | - - - - | - - - - | - - - - | - - - - |
136
* [ ] | [ ] | [ sample ] [ ] [6] [5] [4] [3] [2] [1]
137
* | | | | |
138
* BHRB IFM -* | | |*radix_scope | Count of events for each PMC.
139
* EBB -* | | p1, p2, p3, p4, p5, p6.
140
* L1 I/D qualifier -* |
141
* nc - number of counters -*
142
*
143
* The PMC fields P1..P6, and NC, are adder fields. As we accumulate constraints
144
* we want the low bit of each field to be added to any existing value.
145
*
146
* Everything else is a value field.
147
*/
148
149
#define CNST_FAB_MATCH_VAL(v) (((v) & EVENT_THR_CTL_MASK) << 56)
150
#define CNST_FAB_MATCH_MASK CNST_FAB_MATCH_VAL(EVENT_THR_CTL_MASK)
151
152
/* We just throw all the threshold bits into the constraint */
153
#define CNST_THRESH_VAL(v) (((v) & EVENT_THRESH_MASK) << 32)
154
#define CNST_THRESH_MASK CNST_THRESH_VAL(EVENT_THRESH_MASK)
155
156
#define CNST_THRESH_CTL_SEL_VAL(v) (((v) & 0x7ffull) << 32)
157
#define CNST_THRESH_CTL_SEL_MASK CNST_THRESH_CTL_SEL_VAL(0x7ff)
158
159
#define p10_CNST_THRESH_CMP_VAL(v) (((v) & 0x7ffull) << 43)
160
#define p10_CNST_THRESH_CMP_MASK p10_CNST_THRESH_CMP_VAL(0x7ff)
161
162
#define CNST_EBB_VAL(v) (((v) & EVENT_EBB_MASK) << 24)
163
#define CNST_EBB_MASK CNST_EBB_VAL(EVENT_EBB_MASK)
164
165
#define CNST_IFM_VAL(v) (((v) & EVENT_IFM_MASK) << 25)
166
#define CNST_IFM_MASK CNST_IFM_VAL(EVENT_IFM_MASK)
167
168
#define CNST_L1_QUAL_VAL(v) (((v) & 3) << 22)
169
#define CNST_L1_QUAL_MASK CNST_L1_QUAL_VAL(3)
170
171
#define CNST_SAMPLE_VAL(v) (((v) & EVENT_SAMPLE_MASK) << 16)
172
#define CNST_SAMPLE_MASK CNST_SAMPLE_VAL(EVENT_SAMPLE_MASK)
173
174
#define CNST_CACHE_GROUP_VAL(v) (((v) & 0xffull) << 55)
175
#define CNST_CACHE_GROUP_MASK CNST_CACHE_GROUP_VAL(0xff)
176
#define CNST_CACHE_PMC4_VAL (1ull << 54)
177
#define CNST_CACHE_PMC4_MASK CNST_CACHE_PMC4_VAL
178
179
#define CNST_L2L3_GROUP_VAL(v) (((v) & 0x1full) << 55)
180
#define CNST_L2L3_GROUP_MASK CNST_L2L3_GROUP_VAL(0x1f)
181
182
#define CNST_RADIX_SCOPE_GROUP_VAL(v) (((v) & 0x1ull) << 21)
183
#define CNST_RADIX_SCOPE_GROUP_MASK CNST_RADIX_SCOPE_GROUP_VAL(1)
184
185
/*
186
* For NC we are counting up to 4 events. This requires three bits, and we need
187
* the fifth event to overflow and set the 4th bit. To achieve that we bias the
188
* fields by 3 in test_adder.
189
*/
190
#define CNST_NC_SHIFT 12
191
#define CNST_NC_VAL (1 << CNST_NC_SHIFT)
192
#define CNST_NC_MASK (8 << CNST_NC_SHIFT)
193
#define ISA207_TEST_ADDER (3 << CNST_NC_SHIFT)
194
195
/*
196
* For the per-PMC fields we have two bits. The low bit is added, so if two
197
* events ask for the same PMC the sum will overflow, setting the high bit,
198
* indicating an error. So our mask sets the high bit.
199
*/
200
#define CNST_PMC_SHIFT(pmc) ((pmc - 1) * 2)
201
#define CNST_PMC_VAL(pmc) (1 << CNST_PMC_SHIFT(pmc))
202
#define CNST_PMC_MASK(pmc) (2 << CNST_PMC_SHIFT(pmc))
203
204
/* Our add_fields is defined as: */
205
#define ISA207_ADD_FIELDS \
206
CNST_PMC_VAL(1) | CNST_PMC_VAL(2) | CNST_PMC_VAL(3) | \
207
CNST_PMC_VAL(4) | CNST_PMC_VAL(5) | CNST_PMC_VAL(6) | CNST_NC_VAL
208
209
/* Bits in MMCR1 for PowerISA v2.07 */
210
#define MMCR1_UNIT_SHIFT(pmc) (60 - (4 * ((pmc) - 1)))
211
#define MMCR1_COMBINE_SHIFT(pmc) (35 - ((pmc) - 1))
212
#define MMCR1_PMCSEL_SHIFT(pmc) (24 - (((pmc) - 1)) * 8)
213
#define MMCR1_FAB_SHIFT 36
214
#define MMCR1_DC_IC_QUAL_MASK 0x3
215
#define MMCR1_DC_IC_QUAL_SHIFT 46
216
217
/* MMCR1 Combine bits macro for power9 */
218
#define p9_MMCR1_COMBINE_SHIFT(pmc) (38 - ((pmc - 1) * 2))
219
220
/* Bits in MMCRA for PowerISA v2.07 */
221
#define MMCRA_SAMP_MODE_SHIFT 1
222
#define MMCRA_SAMP_ELIG_SHIFT 4
223
#define MMCRA_SAMP_ELIG_MASK 7
224
#define MMCRA_THR_CTL_SHIFT 8
225
#define MMCRA_THR_SEL_SHIFT 16
226
#define MMCRA_THR_CMP_SHIFT 32
227
#define MMCRA_SDAR_MODE_SHIFT 42
228
#define MMCRA_SDAR_MODE_TLB (1ull << MMCRA_SDAR_MODE_SHIFT)
229
#define MMCRA_SDAR_MODE_NO_UPDATES ~(0x3ull << MMCRA_SDAR_MODE_SHIFT)
230
#define MMCRA_SDAR_MODE_DCACHE (2ull << MMCRA_SDAR_MODE_SHIFT)
231
#define MMCRA_IFM_SHIFT 30
232
#define MMCRA_THR_CTR_MANT_SHIFT 19
233
#define MMCRA_THR_CTR_MANT_MASK 0x7Ful
234
#define MMCRA_THR_CTR_MANT(v) (((v) >> MMCRA_THR_CTR_MANT_SHIFT) &\
235
MMCRA_THR_CTR_MANT_MASK)
236
237
#define MMCRA_THR_CTR_EXP_SHIFT 27
238
#define MMCRA_THR_CTR_EXP_MASK 0x7ul
239
#define MMCRA_THR_CTR_EXP(v) (((v) >> MMCRA_THR_CTR_EXP_SHIFT) &\
240
MMCRA_THR_CTR_EXP_MASK)
241
242
#define P10_MMCRA_THR_CTR_MANT_MASK 0xFFul
243
#define P10_MMCRA_THR_CTR_MANT(v) (((v) >> MMCRA_THR_CTR_MANT_SHIFT) &\
244
P10_MMCRA_THR_CTR_MANT_MASK)
245
246
/* MMCRA Threshold Compare bit constant for power9 */
247
#define p9_MMCRA_THR_CMP_SHIFT 45
248
249
/* Bits in MMCR2 for PowerISA v2.07 */
250
#define MMCR2_FCS(pmc) (1ull << (63 - (((pmc) - 1) * 9)))
251
#define MMCR2_FCP(pmc) (1ull << (62 - (((pmc) - 1) * 9)))
252
#define MMCR2_FCWAIT(pmc) (1ull << (58 - (((pmc) - 1) * 9)))
253
#define MMCR2_FCH(pmc) (1ull << (57 - (((pmc) - 1) * 9)))
254
255
#define MAX_ALT 2
256
#define MAX_PMU_COUNTERS 6
257
258
/* Bits in MMCR3 for PowerISA v3.10 */
259
#define MMCR3_SHIFT(pmc) (49 - (15 * ((pmc) - 1)))
260
261
#define ISA207_SIER_TYPE_SHIFT 15
262
#define ISA207_SIER_TYPE_MASK (0x7ull << ISA207_SIER_TYPE_SHIFT)
263
264
#define ISA207_SIER_LDST_SHIFT 1
265
#define ISA207_SIER_LDST_MASK (0x7ull << ISA207_SIER_LDST_SHIFT)
266
267
#define ISA207_SIER_DATA_SRC_SHIFT 53
268
#define ISA207_SIER_DATA_SRC_MASK (0x7ull << ISA207_SIER_DATA_SRC_SHIFT)
269
270
/* Bits in SIER2/SIER3 for Power10 */
271
#define P10_SIER2_FINISH_CYC(sier2) (((sier2) >> (63 - 37)) & 0x7fful)
272
#define P10_SIER2_DISPATCH_CYC(sier2) (((sier2) >> (63 - 13)) & 0x7fful)
273
274
#define P(a, b) PERF_MEM_S(a, b)
275
#define PH(a, b) (P(LVL, HIT) | P(a, b))
276
#define PM(a, b) (P(LVL, MISS) | P(a, b))
277
#define LEVEL(x) P(LVLNUM, x)
278
#define REM P(REMOTE, REMOTE)
279
280
int isa207_get_constraint(u64 event, unsigned long *maskp, unsigned long *valp, u64 event_config1);
281
int isa207_compute_mmcr(u64 event[], int n_ev,
282
unsigned int hwc[], struct mmcr_regs *mmcr,
283
struct perf_event *pevents[], u32 flags);
284
void isa207_disable_pmc(unsigned int pmc, struct mmcr_regs *mmcr);
285
int isa207_get_alternatives(u64 event, u64 alt[], int size, unsigned int flags,
286
const unsigned int ev_alt[][MAX_ALT]);
287
void isa207_get_mem_data_src(union perf_mem_data_src *dsrc, u32 flags,
288
struct pt_regs *regs);
289
void isa207_get_mem_weight(u64 *weight, u64 type);
290
291
int isa3XX_check_attr_config(struct perf_event *ev);
292
293
#endif
294
295