#include "perf_event_intel_uncore.h"

static struct intel_uncore_type *empty_uncore[] = { NULL, };
static struct intel_uncore_type **msr_uncores = empty_uncore;
static struct intel_uncore_type **pci_uncores = empty_uncore;
/* pci bus to socket mapping */
static int pcibus_to_physid[256] = { [0 ... 255] = -1, };

static DEFINE_RAW_SPINLOCK(uncore_box_lock);

/* mask of cpus that collect uncore events */
static cpumask_t uncore_cpu_mask;

/* constraint for the fixed counter */
static struct event_constraint constraint_fixed =
	EVENT_CONSTRAINT(~0ULL, 1 << UNCORE_PMC_IDX_FIXED, ~0ULL);
static struct event_constraint constraint_empty =
	EVENT_CONSTRAINT(0, 0, 0);
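
/*
 * Extract the i-th n-bit wide field from x.  The constraint code below
 * packs several small per-field reference counts into a single atomic_t
 * and uses this helper to read an individual field back out.
 */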
#define __BITS_VALUE(x, i, n)	((typeof(x))(((x) >> ((i) * (n))) & \
				((1ULL << (n)) - 1)))

DEFINE_UNCORE_FORMAT_ATTR(event, event, "config:0-7");
DEFINE_UNCORE_FORMAT_ATTR(event_ext, event, "config:0-7,21");
DEFINE_UNCORE_FORMAT_ATTR(umask, umask, "config:8-15");
DEFINE_UNCORE_FORMAT_ATTR(edge, edge, "config:18");
DEFINE_UNCORE_FORMAT_ATTR(tid_en, tid_en, "config:19");
DEFINE_UNCORE_FORMAT_ATTR(inv, inv, "config:23");
DEFINE_UNCORE_FORMAT_ATTR(cmask5, cmask, "config:24-28");
DEFINE_UNCORE_FORMAT_ATTR(cmask8, cmask, "config:24-31");
DEFINE_UNCORE_FORMAT_ATTR(thresh8, thresh, "config:24-31");
DEFINE_UNCORE_FORMAT_ATTR(thresh5, thresh, "config:24-28");
DEFINE_UNCORE_FORMAT_ATTR(occ_sel, occ_sel, "config:14-15");
DEFINE_UNCORE_FORMAT_ATTR(occ_invert, occ_invert, "config:30");
DEFINE_UNCORE_FORMAT_ATTR(occ_edge, occ_edge, "config:14-51");
DEFINE_UNCORE_FORMAT_ATTR(filter_tid, filter_tid, "config1:0-4");
DEFINE_UNCORE_FORMAT_ATTR(filter_link, filter_link, "config1:5-8");
DEFINE_UNCORE_FORMAT_ATTR(filter_nid, filter_nid, "config1:10-17");
DEFINE_UNCORE_FORMAT_ATTR(filter_nid2, filter_nid, "config1:32-47");
DEFINE_UNCORE_FORMAT_ATTR(filter_state, filter_state, "config1:18-22");
DEFINE_UNCORE_FORMAT_ATTR(filter_state2, filter_state, "config1:17-22");
DEFINE_UNCORE_FORMAT_ATTR(filter_opc, filter_opc, "config1:23-31");
DEFINE_UNCORE_FORMAT_ATTR(filter_opc2, filter_opc, "config1:52-60");
DEFINE_UNCORE_FORMAT_ATTR(filter_band0, filter_band0, "config1:0-7");
DEFINE_UNCORE_FORMAT_ATTR(filter_band1, filter_band1, "config1:8-15");
DEFINE_UNCORE_FORMAT_ATTR(filter_band2, filter_band2, "config1:16-23");
DEFINE_UNCORE_FORMAT_ATTR(filter_band3, filter_band3, "config1:24-31");

static u64 uncore_msr_read_counter(struct intel_uncore_box *box, struct perf_event *event)
{
	u64 count;

	rdmsrl(event->hw.event_base, count);

	return count;
}

/*
 * generic get constraint function for shared match/mask registers.
 */
static struct event_constraint *
uncore_get_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct intel_uncore_extra_reg *er;
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct hw_perf_event_extra *reg2 = &event->hw.branch_reg;
	unsigned long flags;
	bool ok = false;

	/*
	 * reg->alloc can be set due to existing state, so for fake box we
	 * need to ignore this, otherwise we might fail to allocate proper
	 * fake state for this extra reg constraint.
	 */
	if (reg1->idx == EXTRA_REG_NONE ||
	    (!uncore_box_is_fake(box) && reg1->alloc))
		return NULL;

	er = &box->shared_regs[reg1->idx];
	raw_spin_lock_irqsave(&er->lock, flags);
	if (!atomic_read(&er->ref) ||
	    (er->config1 == reg1->config && er->config2 == reg2->config)) {
		atomic_inc(&er->ref);
		er->config1 = reg1->config;
		er->config2 = reg2->config;
		ok = true;
	}
	raw_spin_unlock_irqrestore(&er->lock, flags);

	if (ok) {
		if (!uncore_box_is_fake(box))
			reg1->alloc = 1;
		return NULL;
	}

	return &constraint_empty;
}

static void uncore_put_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct intel_uncore_extra_reg *er;
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;

	/*
	 * Only put constraint if extra reg was actually allocated. Also
	 * takes care of events which do not use an extra shared reg.
	 *
	 * Also, if this is a fake box we shouldn't touch any event state
	 * (reg->alloc) and we don't care about leaving inconsistent box
	 * state either since it will be thrown out.
	 */
	if (uncore_box_is_fake(box) || !reg1->alloc)
		return;

	er = &box->shared_regs[reg1->idx];
	atomic_dec(&er->ref);
	reg1->alloc = 0;
}

static u64 uncore_shared_reg_config(struct intel_uncore_box *box, int idx)
{
	struct intel_uncore_extra_reg *er;
	unsigned long flags;
	u64 config;

	er = &box->shared_regs[idx];

	raw_spin_lock_irqsave(&er->lock, flags);
	config = er->config;
	raw_spin_unlock_irqrestore(&er->lock, flags);

	return config;
}

/* Sandy Bridge-EP uncore support */
static struct intel_uncore_type snbep_uncore_cbox;
static struct intel_uncore_type snbep_uncore_pcu;

static void snbep_uncore_pci_disable_box(struct intel_uncore_box *box)
{
	struct pci_dev *pdev = box->pci_dev;
	int box_ctl = uncore_pci_box_ctl(box);
	u32 config;

	if (!pci_read_config_dword(pdev, box_ctl, &config)) {
		config |= SNBEP_PMON_BOX_CTL_FRZ;
		pci_write_config_dword(pdev, box_ctl, config);
	}
}

static void snbep_uncore_pci_enable_box(struct intel_uncore_box *box)
{
	struct pci_dev *pdev = box->pci_dev;
	int box_ctl = uncore_pci_box_ctl(box);
	u32 config;

	if (!pci_read_config_dword(pdev, box_ctl, &config)) {
		config &= ~SNBEP_PMON_BOX_CTL_FRZ;
		pci_write_config_dword(pdev, box_ctl, config);
	}
}

static void snbep_uncore_pci_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct pci_dev *pdev = box->pci_dev;
	struct hw_perf_event *hwc = &event->hw;

	pci_write_config_dword(pdev, hwc->config_base, hwc->config | SNBEP_PMON_CTL_EN);
}

static void snbep_uncore_pci_disable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct pci_dev *pdev = box->pci_dev;
	struct hw_perf_event *hwc = &event->hw;

	pci_write_config_dword(pdev, hwc->config_base, hwc->config);
}

static u64 snbep_uncore_pci_read_counter(struct intel_uncore_box *box, struct perf_event *event)
{
	struct pci_dev *pdev = box->pci_dev;
	struct hw_perf_event *hwc = &event->hw;
	u64 count;

	pci_read_config_dword(pdev, hwc->event_base, (u32 *)&count);
	pci_read_config_dword(pdev, hwc->event_base + 4, (u32 *)&count + 1);

	return count;
}

static void snbep_uncore_pci_init_box(struct intel_uncore_box *box)
{
	struct pci_dev *pdev = box->pci_dev;

	pci_write_config_dword(pdev, SNBEP_PCI_PMON_BOX_CTL, SNBEP_PMON_BOX_CTL_INT);
}

static void snbep_uncore_msr_disable_box(struct intel_uncore_box *box)
{
	u64 config;
	unsigned msr;

	msr = uncore_msr_box_ctl(box);
	if (msr) {
		rdmsrl(msr, config);
		config |= SNBEP_PMON_BOX_CTL_FRZ;
		wrmsrl(msr, config);
	}
}

static void snbep_uncore_msr_enable_box(struct intel_uncore_box *box)
{
	u64 config;
	unsigned msr;

	msr = uncore_msr_box_ctl(box);
	if (msr) {
		rdmsrl(msr, config);
		config &= ~SNBEP_PMON_BOX_CTL_FRZ;
		wrmsrl(msr, config);
	}
}

static void snbep_uncore_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;

	if (reg1->idx != EXTRA_REG_NONE)
		wrmsrl(reg1->reg, uncore_shared_reg_config(box, 0));

	wrmsrl(hwc->config_base, hwc->config | SNBEP_PMON_CTL_EN);
}

static void snbep_uncore_msr_disable_event(struct intel_uncore_box *box,
					struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;

	wrmsrl(hwc->config_base, hwc->config);
}

static void snbep_uncore_msr_init_box(struct intel_uncore_box *box)
{
	unsigned msr = uncore_msr_box_ctl(box);

	if (msr)
		wrmsrl(msr, SNBEP_PMON_BOX_CTL_INT);
}
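
/*
 * All SNB-EP boxes share one control scheme: writing
 * SNBEP_PMON_BOX_CTL_INT resets a box, and setting/clearing the FRZ bit
 * in the same register freezes/unfreezes all of that box's counters.
 */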

static struct attribute *snbep_uncore_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh8.attr,
	NULL,
};

static struct attribute *snbep_uncore_ubox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh5.attr,
	NULL,
};

static struct attribute *snbep_uncore_cbox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_tid_en.attr,
	&format_attr_inv.attr,
	&format_attr_thresh8.attr,
	&format_attr_filter_tid.attr,
	&format_attr_filter_nid.attr,
	&format_attr_filter_state.attr,
	&format_attr_filter_opc.attr,
	NULL,
};

static struct attribute *snbep_uncore_pcu_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_occ_sel.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh5.attr,
	&format_attr_occ_invert.attr,
	&format_attr_occ_edge.attr,
	&format_attr_filter_band0.attr,
	&format_attr_filter_band1.attr,
	&format_attr_filter_band2.attr,
	&format_attr_filter_band3.attr,
	NULL,
};

static struct attribute *snbep_uncore_qpi_formats_attr[] = {
	&format_attr_event_ext.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh8.attr,
	NULL,
};

static struct uncore_event_desc snbep_uncore_imc_events[] = {
	INTEL_UNCORE_EVENT_DESC(clockticks,      "event=0xff,umask=0x00"),
	INTEL_UNCORE_EVENT_DESC(cas_count_read,  "event=0x04,umask=0x03"),
	INTEL_UNCORE_EVENT_DESC(cas_count_write, "event=0x04,umask=0x0c"),
	{ /* end: all zeroes */ },
};

static struct uncore_event_desc snbep_uncore_qpi_events[] = {
	INTEL_UNCORE_EVENT_DESC(clockticks,       "event=0x14"),
	INTEL_UNCORE_EVENT_DESC(txl_flits_active, "event=0x00,umask=0x06"),
	INTEL_UNCORE_EVENT_DESC(drs_data,         "event=0x02,umask=0x08"),
	INTEL_UNCORE_EVENT_DESC(ncb_data,         "event=0x03,umask=0x04"),
	{ /* end: all zeroes */ },
};

static struct attribute_group snbep_uncore_format_group = {
	.name = "format",
	.attrs = snbep_uncore_formats_attr,
};

static struct attribute_group snbep_uncore_ubox_format_group = {
	.name = "format",
	.attrs = snbep_uncore_ubox_formats_attr,
};

static struct attribute_group snbep_uncore_cbox_format_group = {
	.name = "format",
	.attrs = snbep_uncore_cbox_formats_attr,
};

static struct attribute_group snbep_uncore_pcu_format_group = {
	.name = "format",
	.attrs = snbep_uncore_pcu_formats_attr,
};

static struct attribute_group snbep_uncore_qpi_format_group = {
	.name = "format",
	.attrs = snbep_uncore_qpi_formats_attr,
};

#define SNBEP_UNCORE_MSR_OPS_COMMON_INIT()			\
	.init_box	= snbep_uncore_msr_init_box,		\
	.disable_box	= snbep_uncore_msr_disable_box,		\
	.enable_box	= snbep_uncore_msr_enable_box,		\
	.disable_event	= snbep_uncore_msr_disable_event,	\
	.enable_event	= snbep_uncore_msr_enable_event,	\
	.read_counter	= uncore_msr_read_counter

static struct intel_uncore_ops snbep_uncore_msr_ops = {
	SNBEP_UNCORE_MSR_OPS_COMMON_INIT(),
};
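
/*
 * The common-init macro fills in the generic MSR callbacks, so the cbox
 * and pcu ops structures further down only add their own hw_config and
 * constraint handlers on top of it.
 */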

static struct intel_uncore_ops snbep_uncore_pci_ops = {
	.init_box	= snbep_uncore_pci_init_box,
	.disable_box	= snbep_uncore_pci_disable_box,
	.enable_box	= snbep_uncore_pci_enable_box,
	.disable_event	= snbep_uncore_pci_disable_event,
	.enable_event	= snbep_uncore_pci_enable_event,
	.read_counter	= snbep_uncore_pci_read_counter,
};

static struct event_constraint snbep_uncore_cbox_constraints[] = {
	UNCORE_EVENT_CONSTRAINT(0x01, 0x1),
	UNCORE_EVENT_CONSTRAINT(0x02, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x04, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x05, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x07, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x09, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x11, 0x1),
	UNCORE_EVENT_CONSTRAINT(0x12, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x13, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x1b, 0xc),
	UNCORE_EVENT_CONSTRAINT(0x1c, 0xc),
	UNCORE_EVENT_CONSTRAINT(0x1d, 0xc),
	UNCORE_EVENT_CONSTRAINT(0x1e, 0xc),
	EVENT_CONSTRAINT_OVERLAP(0x1f, 0xe, 0xff),
	UNCORE_EVENT_CONSTRAINT(0x21, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x23, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x31, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x32, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x33, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x34, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x35, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x36, 0x1),
	UNCORE_EVENT_CONSTRAINT(0x37, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x38, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x39, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x3b, 0x1),
	EVENT_CONSTRAINT_END
};

static struct event_constraint snbep_uncore_r2pcie_constraints[] = {
	UNCORE_EVENT_CONSTRAINT(0x10, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x11, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x12, 0x1),
	UNCORE_EVENT_CONSTRAINT(0x23, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x24, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x25, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x26, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x32, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x33, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x34, 0x3),
	EVENT_CONSTRAINT_END
};

static struct event_constraint snbep_uncore_r3qpi_constraints[] = {
	UNCORE_EVENT_CONSTRAINT(0x10, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x11, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x12, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x13, 0x1),
	UNCORE_EVENT_CONSTRAINT(0x20, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x21, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x22, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x23, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x24, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x25, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x26, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x28, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x29, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x2a, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x2b, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x2c, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x2d, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x2e, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x2f, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x30, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x31, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x32, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x33, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x34, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x36, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x37, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x38, 0x3),
	UNCORE_EVENT_CONSTRAINT(0x39, 0x3),
	EVENT_CONSTRAINT_END
};

static struct intel_uncore_type snbep_uncore_ubox = {
	.fixed_ctr_bits	= 48,
	.perf_ctr	= SNBEP_U_MSR_PMON_CTR0,
	.event_ctl	= SNBEP_U_MSR_PMON_CTL0,
	.event_mask	= SNBEP_U_MSR_PMON_RAW_EVENT_MASK,
	.fixed_ctr	= SNBEP_U_MSR_PMON_UCLK_FIXED_CTR,
	.fixed_ctl	= SNBEP_U_MSR_PMON_UCLK_FIXED_CTL,
	.ops		= &snbep_uncore_msr_ops,
	.format_group	= &snbep_uncore_ubox_format_group,
};

static struct extra_reg snbep_uncore_cbox_extra_regs[] = {
	SNBEP_CBO_EVENT_EXTRA_REG(SNBEP_CBO_PMON_CTL_TID_EN,
				  SNBEP_CBO_PMON_CTL_TID_EN, 0x1),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0334, 0xffff, 0x4),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0534, 0xffff, 0x4),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0934, 0xffff, 0x4),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4134, 0xffff, 0x6),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0135, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0335, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4135, 0xffff, 0xc),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4335, 0xffff, 0xc),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4435, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4835, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4a35, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x5035, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0136, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0336, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4136, 0xffff, 0xc),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4336, 0xffff, 0xc),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4436, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4836, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4a36, 0xffff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4037, 0x40ff, 0x2),
	EVENT_EXTRA_END
};

static void snbep_cbox_put_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct intel_uncore_extra_reg *er = &box->shared_regs[0];
	int i;

	if (uncore_box_is_fake(box))
		return;

	for (i = 0; i < 5; i++) {
		if (reg1->alloc & (0x1 << i))
			atomic_sub(1 << (i * 6), &er->ref);
	}
	reg1->alloc = 0;
}
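
/*
 * The cbox filter register has up to five independent fields (TID, NID,
 * state, opcode, ...); each field's reference count lives in a 6-bit
 * slice of er->ref, and a field can only be shared when the requested
 * config matches the bits already programmed, as enforced below.
 */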
static struct event_constraint *
__snbep_cbox_get_constraint(struct intel_uncore_box *box, struct perf_event *event,
			    u64 (*cbox_filter_mask)(int fields))
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct intel_uncore_extra_reg *er = &box->shared_regs[0];
	int i, alloc = 0;
	unsigned long flags;
	u64 mask;

	if (reg1->idx == EXTRA_REG_NONE)
		return NULL;

	raw_spin_lock_irqsave(&er->lock, flags);
	for (i = 0; i < 5; i++) {
		if (!(reg1->idx & (0x1 << i)))
			continue;
		if (!uncore_box_is_fake(box) && (reg1->alloc & (0x1 << i)))
			continue;

		mask = cbox_filter_mask(0x1 << i);
		if (!__BITS_VALUE(atomic_read(&er->ref), i, 6) ||
		    !((reg1->config ^ er->config) & mask)) {
			atomic_add(1 << (i * 6), &er->ref);
			er->config &= ~mask;
			er->config |= reg1->config & mask;
			alloc |= (0x1 << i);
		} else {
			break;
		}
	}
	raw_spin_unlock_irqrestore(&er->lock, flags);
	if (i < 5)
		goto fail;

	if (!uncore_box_is_fake(box))
		reg1->alloc |= alloc;

	return NULL;
fail:
	for (; i >= 0; i--) {
		if (alloc & (0x1 << i))
			atomic_sub(1 << (i * 6), &er->ref);
	}
	return &constraint_empty;
}

static u64 snbep_cbox_filter_mask(int fields)
{
	u64 mask = 0;

	if (fields & 0x1)
		mask |= SNBEP_CB0_MSR_PMON_BOX_FILTER_TID;
	if (fields & 0x2)
		mask |= SNBEP_CB0_MSR_PMON_BOX_FILTER_NID;
	if (fields & 0x4)
		mask |= SNBEP_CB0_MSR_PMON_BOX_FILTER_STATE;
	if (fields & 0x8)
		mask |= SNBEP_CB0_MSR_PMON_BOX_FILTER_OPC;

	return mask;
}

static struct event_constraint *
snbep_cbox_get_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	return __snbep_cbox_get_constraint(box, event, snbep_cbox_filter_mask);
}

static int snbep_cbox_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct extra_reg *er;
	int idx = 0;

	for (er = snbep_uncore_cbox_extra_regs; er->msr; er++) {
		if (er->event != (event->hw.config & er->config_mask))
			continue;
		idx |= er->idx;
	}

	if (idx) {
		reg1->reg = SNBEP_C0_MSR_PMON_BOX_FILTER +
			SNBEP_CBO_MSR_OFFSET * box->pmu->pmu_idx;
		reg1->config = event->attr.config1 & snbep_cbox_filter_mask(idx);
		reg1->idx = idx;
	}
	return 0;
}

static struct intel_uncore_ops snbep_uncore_cbox_ops = {
	SNBEP_UNCORE_MSR_OPS_COMMON_INIT(),
	.hw_config		= snbep_cbox_hw_config,
	.get_constraint		= snbep_cbox_get_constraint,
	.put_constraint		= snbep_cbox_put_constraint,
};

static struct intel_uncore_type snbep_uncore_cbox = {
	.event_ctl	= SNBEP_C0_MSR_PMON_CTL0,
	.perf_ctr	= SNBEP_C0_MSR_PMON_CTR0,
	.event_mask	= SNBEP_CBO_MSR_PMON_RAW_EVENT_MASK,
	.box_ctl	= SNBEP_C0_MSR_PMON_BOX_CTL,
	.msr_offset	= SNBEP_CBO_MSR_OFFSET,
	.num_shared_regs = 1,
	.constraints	= snbep_uncore_cbox_constraints,
	.ops		= &snbep_uncore_cbox_ops,
	.format_group	= &snbep_uncore_cbox_format_group,
};

static u64 snbep_pcu_alter_er(struct perf_event *event, int new_idx, bool modify)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	u64 config = reg1->config;

	if (new_idx > reg1->idx)
		config <<= 8 * (new_idx - reg1->idx);
	else
		config >>= 8 * (reg1->idx - new_idx);

	if (modify) {
		hwc->config += new_idx - reg1->idx;
		reg1->config = config;
		reg1->idx = new_idx;
	}
	return config;
}
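
/*
 * The PCU filter MSR holds four byte-wide occupancy band thresholds;
 * snbep_pcu_alter_er() shifts an event's filter value from its current
 * byte slot to a new one, optionally updating the event to match.
 */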
static struct event_constraint *
snbep_pcu_get_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct intel_uncore_extra_reg *er = &box->shared_regs[0];
	unsigned long flags;
	int idx = reg1->idx;
	u64 mask, config1 = reg1->config;
	bool ok = false;

	if (reg1->idx == EXTRA_REG_NONE ||
	    (!uncore_box_is_fake(box) && reg1->alloc))
		return NULL;
again:
	mask = 0xffULL << (idx * 8);
	raw_spin_lock_irqsave(&er->lock, flags);
	if (!__BITS_VALUE(atomic_read(&er->ref), idx, 8) ||
	    !((config1 ^ er->config) & mask)) {
		atomic_add(1 << (idx * 8), &er->ref);
		er->config &= ~mask;
		er->config |= config1 & mask;
		ok = true;
	}
	raw_spin_unlock_irqrestore(&er->lock, flags);

	if (!ok) {
		idx = (idx + 1) % 4;
		if (idx != reg1->idx) {
			config1 = snbep_pcu_alter_er(event, idx, false);
			goto again;
		}
		return &constraint_empty;
	}

	if (!uncore_box_is_fake(box)) {
		if (idx != reg1->idx)
			snbep_pcu_alter_er(event, idx, true);
		reg1->alloc = 1;
	}
	return NULL;
}

static void snbep_pcu_put_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct intel_uncore_extra_reg *er = &box->shared_regs[0];

	if (uncore_box_is_fake(box) || !reg1->alloc)
		return;

	atomic_sub(1 << (reg1->idx * 8), &er->ref);
	reg1->alloc = 0;
}

static int snbep_pcu_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	int ev_sel = hwc->config & SNBEP_PMON_CTL_EV_SEL_MASK;

	if (ev_sel >= 0xb && ev_sel <= 0xe) {
		reg1->reg = SNBEP_PCU_MSR_PMON_BOX_FILTER;
		reg1->idx = ev_sel - 0xb;
		reg1->config = event->attr.config1 & (0xff << reg1->idx);
	}
	return 0;
}

static struct intel_uncore_ops snbep_uncore_pcu_ops = {
	SNBEP_UNCORE_MSR_OPS_COMMON_INIT(),
	.hw_config		= snbep_pcu_hw_config,
	.get_constraint		= snbep_pcu_get_constraint,
	.put_constraint		= snbep_pcu_put_constraint,
};

static struct intel_uncore_type snbep_uncore_pcu = {
	.perf_ctr	= SNBEP_PCU_MSR_PMON_CTR0,
	.event_ctl	= SNBEP_PCU_MSR_PMON_CTL0,
	.event_mask	= SNBEP_PCU_MSR_PMON_RAW_EVENT_MASK,
	.box_ctl	= SNBEP_PCU_MSR_PMON_BOX_CTL,
	.num_shared_regs = 1,
	.ops		= &snbep_uncore_pcu_ops,
	.format_group	= &snbep_uncore_pcu_format_group,
};

static struct intel_uncore_type *snbep_msr_uncores[] = {
	&snbep_uncore_ubox,
	&snbep_uncore_cbox,
	&snbep_uncore_pcu,
	NULL,
};

#define SNBEP_UNCORE_PCI_COMMON_INIT()				\
	.perf_ctr	= SNBEP_PCI_PMON_CTR0,			\
	.event_ctl	= SNBEP_PCI_PMON_CTL0,			\
	.event_mask	= SNBEP_PMON_RAW_EVENT_MASK,		\
	.box_ctl	= SNBEP_PCI_PMON_BOX_CTL,		\
	.ops		= &snbep_uncore_pci_ops,		\
	.format_group	= &snbep_uncore_format_group

static struct intel_uncore_type snbep_uncore_ha = {
	SNBEP_UNCORE_PCI_COMMON_INIT(),
};

static struct intel_uncore_type snbep_uncore_imc = {
	.fixed_ctr_bits	= 48,
	.fixed_ctr	= SNBEP_MC_CHy_PCI_PMON_FIXED_CTR,
	.fixed_ctl	= SNBEP_MC_CHy_PCI_PMON_FIXED_CTL,
	.event_descs	= snbep_uncore_imc_events,
	SNBEP_UNCORE_PCI_COMMON_INIT(),
};

static struct intel_uncore_type snbep_uncore_qpi = {
	.perf_ctr	= SNBEP_PCI_PMON_CTR0,
	.event_ctl	= SNBEP_PCI_PMON_CTL0,
	.event_mask	= SNBEP_QPI_PCI_PMON_RAW_EVENT_MASK,
	.box_ctl	= SNBEP_PCI_PMON_BOX_CTL,
	.ops		= &snbep_uncore_pci_ops,
	.event_descs	= snbep_uncore_qpi_events,
	.format_group	= &snbep_uncore_qpi_format_group,
};

static struct intel_uncore_type snbep_uncore_r2pcie = {
	.constraints	= snbep_uncore_r2pcie_constraints,
	SNBEP_UNCORE_PCI_COMMON_INIT(),
};

static struct intel_uncore_type snbep_uncore_r3qpi = {
	.constraints	= snbep_uncore_r3qpi_constraints,
	SNBEP_UNCORE_PCI_COMMON_INIT(),
};

enum {
	SNBEP_PCI_UNCORE_HA,
	SNBEP_PCI_UNCORE_IMC,
	SNBEP_PCI_UNCORE_QPI,
	SNBEP_PCI_UNCORE_R2PCIE,
	SNBEP_PCI_UNCORE_R3QPI,
};

static struct intel_uncore_type *snbep_pci_uncores[] = {
	[SNBEP_PCI_UNCORE_HA]		= &snbep_uncore_ha,
	[SNBEP_PCI_UNCORE_IMC]		= &snbep_uncore_imc,
	[SNBEP_PCI_UNCORE_QPI]		= &snbep_uncore_qpi,
	[SNBEP_PCI_UNCORE_R2PCIE]	= &snbep_uncore_r2pcie,
	[SNBEP_PCI_UNCORE_R3QPI]	= &snbep_uncore_r3qpi,
};

static DEFINE_PCI_DEVICE_TABLE(snbep_uncore_pci_ids) = {
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_HA),
		.driver_data = SNBEP_PCI_UNCORE_HA,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_IMC0),
		.driver_data = SNBEP_PCI_UNCORE_IMC,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_IMC1),
		.driver_data = SNBEP_PCI_UNCORE_IMC,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_IMC2),
		.driver_data = SNBEP_PCI_UNCORE_IMC,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_IMC3),
		.driver_data = SNBEP_PCI_UNCORE_IMC,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_QPI0),
		.driver_data = SNBEP_PCI_UNCORE_QPI,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_QPI1),
		.driver_data = SNBEP_PCI_UNCORE_QPI,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_R2PCIE),
		.driver_data = SNBEP_PCI_UNCORE_R2PCIE,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_R3QPI0),
		.driver_data = SNBEP_PCI_UNCORE_R3QPI,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_UNC_R3QPI1),
		.driver_data = SNBEP_PCI_UNCORE_R3QPI,
	},
	{ /* end: all zeroes */ }
};
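
/*
 * The .driver_data of each id-table entry is an index into
 * snbep_pci_uncores[], which is how the probe code looks up the uncore
 * type for a matched PCI device.
 */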

static struct pci_driver snbep_uncore_pci_driver = {
	.name		= "snbep_uncore",
	.id_table	= snbep_uncore_pci_ids,
};

/*
 * build pci bus to socket mapping
 */
static int snbep_pci2phy_map_init(int devid)
{
	struct pci_dev *ubox_dev = NULL;
	int i, bus, nodeid;
	int err = 0;
	u32 config = 0;

	while (1) {
		/* find the UBOX device */
		ubox_dev = pci_get_device(PCI_VENDOR_ID_INTEL, devid, ubox_dev);
		if (!ubox_dev)
			break;
		bus = ubox_dev->bus->number;
		/* get the Node ID of the local register */
		err = pci_read_config_dword(ubox_dev, 0x40, &config);
		if (err)
			break;
		nodeid = config;
		/* get the Node ID mapping */
		err = pci_read_config_dword(ubox_dev, 0x54, &config);
		if (err)
			break;
		/*
		 * every three bits in the Node ID mapping register maps
		 * to a particular node.
		 */
		for (i = 0; i < 8; i++) {
			if (nodeid == ((config >> (3 * i)) & 0x7)) {
				pcibus_to_physid[bus] = i;
				break;
			}
		}
	}

	if (ubox_dev)
		pci_dev_put(ubox_dev);

	return err ? pcibios_err_to_errno(err) : 0;
}
/* end of Sandy Bridge-EP uncore support */

/* IvyTown uncore support */
static void ivt_uncore_msr_init_box(struct intel_uncore_box *box)
{
	unsigned msr = uncore_msr_box_ctl(box);

	if (msr)
		wrmsrl(msr, IVT_PMON_BOX_CTL_INT);
}

static void ivt_uncore_pci_init_box(struct intel_uncore_box *box)
{
	struct pci_dev *pdev = box->pci_dev;

	pci_write_config_dword(pdev, SNBEP_PCI_PMON_BOX_CTL, IVT_PMON_BOX_CTL_INT);
}
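
/*
 * IvyTown reuses the SNB-EP enable/disable/read callbacks and only
 * overrides init_box, since the box-control init value differs
 * (IVT_PMON_BOX_CTL_INT).
 */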
#define IVT_UNCORE_MSR_OPS_COMMON_INIT()			\
	.init_box	= ivt_uncore_msr_init_box,		\
	.disable_box	= snbep_uncore_msr_disable_box,		\
	.enable_box	= snbep_uncore_msr_enable_box,		\
	.disable_event	= snbep_uncore_msr_disable_event,	\
	.enable_event	= snbep_uncore_msr_enable_event,	\
	.read_counter	= uncore_msr_read_counter

static struct intel_uncore_ops ivt_uncore_msr_ops = {
	IVT_UNCORE_MSR_OPS_COMMON_INIT(),
};

static struct intel_uncore_ops ivt_uncore_pci_ops = {
	.init_box	= ivt_uncore_pci_init_box,
	.disable_box	= snbep_uncore_pci_disable_box,
	.enable_box	= snbep_uncore_pci_enable_box,
	.disable_event	= snbep_uncore_pci_disable_event,
	.enable_event	= snbep_uncore_pci_enable_event,
	.read_counter	= snbep_uncore_pci_read_counter,
};

#define IVT_UNCORE_PCI_COMMON_INIT()				\
	.perf_ctr	= SNBEP_PCI_PMON_CTR0,			\
	.event_ctl	= SNBEP_PCI_PMON_CTL0,			\
	.event_mask	= IVT_PMON_RAW_EVENT_MASK,		\
	.box_ctl	= SNBEP_PCI_PMON_BOX_CTL,		\
	.ops		= &ivt_uncore_pci_ops,			\
	.format_group	= &ivt_uncore_format_group

static struct attribute *ivt_uncore_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh8.attr,
	NULL,
};

static struct attribute *ivt_uncore_ubox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh5.attr,
	NULL,
};

static struct attribute *ivt_uncore_cbox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_tid_en.attr,
	&format_attr_thresh8.attr,
	&format_attr_filter_tid.attr,
	&format_attr_filter_link.attr,
	&format_attr_filter_state2.attr,
	&format_attr_filter_nid2.attr,
	&format_attr_filter_opc2.attr,
	NULL,
};

static struct attribute *ivt_uncore_pcu_formats_attr[] = {
	&format_attr_event_ext.attr,
	&format_attr_occ_sel.attr,
	&format_attr_edge.attr,
	&format_attr_thresh5.attr,
	&format_attr_occ_invert.attr,
	&format_attr_occ_edge.attr,
	&format_attr_filter_band0.attr,
	&format_attr_filter_band1.attr,
	&format_attr_filter_band2.attr,
	&format_attr_filter_band3.attr,
	NULL,
};

static struct attribute *ivt_uncore_qpi_formats_attr[] = {
	&format_attr_event_ext.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_thresh8.attr,
	NULL,
};

static struct attribute_group ivt_uncore_format_group = {
	.name = "format",
	.attrs = ivt_uncore_formats_attr,
};

static struct attribute_group ivt_uncore_ubox_format_group = {
	.name = "format",
	.attrs = ivt_uncore_ubox_formats_attr,
};

static struct attribute_group ivt_uncore_cbox_format_group = {
	.name = "format",
	.attrs = ivt_uncore_cbox_formats_attr,
};

static struct attribute_group ivt_uncore_pcu_format_group = {
	.name = "format",
	.attrs = ivt_uncore_pcu_formats_attr,
};

static struct attribute_group ivt_uncore_qpi_format_group = {
	.name = "format",
	.attrs = ivt_uncore_qpi_formats_attr,
};

static struct intel_uncore_type ivt_uncore_ubox = {
	.perf_ctr_bits	= 44,
	.fixed_ctr_bits	= 48,
	.perf_ctr	= SNBEP_U_MSR_PMON_CTR0,
	.event_ctl	= SNBEP_U_MSR_PMON_CTL0,
	.event_mask	= IVT_U_MSR_PMON_RAW_EVENT_MASK,
	.fixed_ctr	= SNBEP_U_MSR_PMON_UCLK_FIXED_CTR,
	.fixed_ctl	= SNBEP_U_MSR_PMON_UCLK_FIXED_CTL,
	.ops		= &ivt_uncore_msr_ops,
	.format_group	= &ivt_uncore_ubox_format_group,
};

static struct extra_reg ivt_uncore_cbox_extra_regs[] = {
	SNBEP_CBO_EVENT_EXTRA_REG(SNBEP_CBO_PMON_CTL_TID_EN,
				  SNBEP_CBO_PMON_CTL_TID_EN, 0x1),
	SNBEP_CBO_EVENT_EXTRA_REG(0x1031, 0x10ff, 0x2),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0334, 0xffff, 0x4),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0534, 0xffff, 0x4),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0934, 0xffff, 0x4),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4134, 0xffff, 0xc),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0135, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0335, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x2135, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x2335, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4135, 0xffff, 0x18),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4335, 0xffff, 0x18),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4435, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4835, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4a35, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x5035, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x8135, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x8335, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0136, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x0336, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x2136, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x2336, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4136, 0xffff, 0x18),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4336, 0xffff, 0x18),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4436, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4836, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4a36, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x5036, 0xffff, 0x8),
	SNBEP_CBO_EVENT_EXTRA_REG(0x8136, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x8336, 0xffff, 0x10),
	SNBEP_CBO_EVENT_EXTRA_REG(0x4037, 0x40ff, 0x8),
	EVENT_EXTRA_END
};

static u64 ivt_cbox_filter_mask(int fields)
{
	u64 mask = 0;

	if (fields & 0x1)
		mask |= IVT_CB0_MSR_PMON_BOX_FILTER_TID;
	if (fields & 0x2)
		mask |= IVT_CB0_MSR_PMON_BOX_FILTER_LINK;
	if (fields & 0x4)
		mask |= IVT_CB0_MSR_PMON_BOX_FILTER_STATE;
	if (fields & 0x8)
		mask |= IVT_CB0_MSR_PMON_BOX_FILTER_NID;
	if (fields & 0x10)
		mask |= IVT_CB0_MSR_PMON_BOX_FILTER_OPC;

	return mask;
}

static struct event_constraint *
ivt_cbox_get_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	return __snbep_cbox_get_constraint(box, event, ivt_cbox_filter_mask);
}

static int ivt_cbox_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct extra_reg *er;
	int idx = 0;

	for (er = ivt_uncore_cbox_extra_regs; er->msr; er++) {
		if (er->event != (event->hw.config & er->config_mask))
			continue;
		idx |= er->idx;
	}

	if (idx) {
		reg1->reg = SNBEP_C0_MSR_PMON_BOX_FILTER +
			SNBEP_CBO_MSR_OFFSET * box->pmu->pmu_idx;
		reg1->config = event->attr.config1 & ivt_cbox_filter_mask(idx);
		reg1->idx = idx;
	}
	return 0;
}

static void ivt_cbox_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;

	if (reg1->idx != EXTRA_REG_NONE) {
		u64 filter = uncore_shared_reg_config(box, 0);
		wrmsrl(reg1->reg, filter & 0xffffffff);
		wrmsrl(reg1->reg + 6, filter >> 32);
	}

	wrmsrl(hwc->config_base, hwc->config | SNBEP_PMON_CTL_EN);
}
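
/*
 * The IvyTown cbox filter is 64 bits wide and split across two MSRs:
 * the low 32 bits go to reg1->reg and the high bits to reg1->reg + 6,
 * as written above.
 */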
static struct intel_uncore_ops ivt_uncore_cbox_ops = {
	.init_box		= ivt_uncore_msr_init_box,
	.disable_box		= snbep_uncore_msr_disable_box,
	.enable_box		= snbep_uncore_msr_enable_box,
	.disable_event		= snbep_uncore_msr_disable_event,
	.enable_event		= ivt_cbox_enable_event,
	.read_counter		= uncore_msr_read_counter,
	.hw_config		= ivt_cbox_hw_config,
	.get_constraint		= ivt_cbox_get_constraint,
	.put_constraint		= snbep_cbox_put_constraint,
};

static struct intel_uncore_type ivt_uncore_cbox = {
	.perf_ctr_bits	= 44,
	.event_ctl	= SNBEP_C0_MSR_PMON_CTL0,
	.perf_ctr	= SNBEP_C0_MSR_PMON_CTR0,
	.event_mask	= IVT_CBO_MSR_PMON_RAW_EVENT_MASK,
	.box_ctl	= SNBEP_C0_MSR_PMON_BOX_CTL,
	.msr_offset	= SNBEP_CBO_MSR_OFFSET,
	.num_shared_regs = 1,
	.constraints	= snbep_uncore_cbox_constraints,
	.ops		= &ivt_uncore_cbox_ops,
	.format_group	= &ivt_uncore_cbox_format_group,
};

static struct intel_uncore_ops ivt_uncore_pcu_ops = {
	IVT_UNCORE_MSR_OPS_COMMON_INIT(),
	.hw_config		= snbep_pcu_hw_config,
	.get_constraint		= snbep_pcu_get_constraint,
	.put_constraint		= snbep_pcu_put_constraint,
};

static struct intel_uncore_type ivt_uncore_pcu = {
	.perf_ctr_bits	= 48,
	.perf_ctr	= SNBEP_PCU_MSR_PMON_CTR0,
	.event_ctl	= SNBEP_PCU_MSR_PMON_CTL0,
	.event_mask	= IVT_PCU_MSR_PMON_RAW_EVENT_MASK,
	.box_ctl	= SNBEP_PCU_MSR_PMON_BOX_CTL,
	.num_shared_regs = 1,
	.ops		= &ivt_uncore_pcu_ops,
	.format_group	= &ivt_uncore_pcu_format_group,
};

static struct intel_uncore_type *ivt_msr_uncores[] = {
	&ivt_uncore_ubox,
	&ivt_uncore_cbox,
	&ivt_uncore_pcu,
	NULL,
};

static struct intel_uncore_type ivt_uncore_ha = {
	.perf_ctr_bits	= 48,
	IVT_UNCORE_PCI_COMMON_INIT(),
};

static struct intel_uncore_type ivt_uncore_imc = {
	.perf_ctr_bits	= 48,
	.fixed_ctr_bits	= 48,
	.fixed_ctr	= SNBEP_MC_CHy_PCI_PMON_FIXED_CTR,
	.fixed_ctl	= SNBEP_MC_CHy_PCI_PMON_FIXED_CTL,
	IVT_UNCORE_PCI_COMMON_INIT(),
};

static struct intel_uncore_type ivt_uncore_qpi = {
	.perf_ctr_bits	= 48,
	.perf_ctr	= SNBEP_PCI_PMON_CTR0,
	.event_ctl	= SNBEP_PCI_PMON_CTL0,
	.event_mask	= IVT_QPI_PCI_PMON_RAW_EVENT_MASK,
	.box_ctl	= SNBEP_PCI_PMON_BOX_CTL,
	.ops		= &ivt_uncore_pci_ops,
	.format_group	= &ivt_uncore_qpi_format_group,
};

static struct intel_uncore_type ivt_uncore_r2pcie = {
	.perf_ctr_bits	= 44,
	.constraints	= snbep_uncore_r2pcie_constraints,
	IVT_UNCORE_PCI_COMMON_INIT(),
};

static struct intel_uncore_type ivt_uncore_r3qpi = {
	.perf_ctr_bits	= 44,
	.constraints	= snbep_uncore_r3qpi_constraints,
	IVT_UNCORE_PCI_COMMON_INIT(),
};

enum {
	IVT_PCI_UNCORE_HA,
	IVT_PCI_UNCORE_IMC,
	IVT_PCI_UNCORE_QPI,
	IVT_PCI_UNCORE_R2PCIE,
	IVT_PCI_UNCORE_R3QPI,
};

static struct intel_uncore_type *ivt_pci_uncores[] = {
	[IVT_PCI_UNCORE_HA]	= &ivt_uncore_ha,
	[IVT_PCI_UNCORE_IMC]	= &ivt_uncore_imc,
	[IVT_PCI_UNCORE_QPI]	= &ivt_uncore_qpi,
	[IVT_PCI_UNCORE_R2PCIE]	= &ivt_uncore_r2pcie,
	[IVT_PCI_UNCORE_R3QPI]	= &ivt_uncore_r3qpi,
};

static DEFINE_PCI_DEVICE_TABLE(ivt_uncore_pci_ids) = {
	{ /* Home Agent 0 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe30),
		.driver_data = IVT_PCI_UNCORE_HA,
	},
	{ /* Home Agent 1 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe38),
		.driver_data = IVT_PCI_UNCORE_HA,
	},
	{ /* MC0 Channel 0 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xeb4),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC0 Channel 1 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xeb5),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC0 Channel 3 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xeb0),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC0 Channel 4 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xeb1),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC1 Channel 0 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xef4),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC1 Channel 1 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xef5),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC1 Channel 3 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xef0),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{ /* MC1 Channel 4 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xef1),
		.driver_data = IVT_PCI_UNCORE_IMC,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe32),
		.driver_data = IVT_PCI_UNCORE_QPI,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe33),
		.driver_data = IVT_PCI_UNCORE_QPI,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe3a),
		.driver_data = IVT_PCI_UNCORE_QPI,
	},
	{
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe34),
		.driver_data = IVT_PCI_UNCORE_R2PCIE,
	},
	{ /* R3QPI0 Link 0 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe36),
		.driver_data = IVT_PCI_UNCORE_R3QPI,
	},
	{ /* R3QPI0 Link 1 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe37),
		.driver_data = IVT_PCI_UNCORE_R3QPI,
	},
	{ /* R3QPI1 Link 2 */
		PCI_DEVICE(PCI_VENDOR_ID_INTEL, 0xe3e),
		.driver_data = IVT_PCI_UNCORE_R3QPI,
	},
	{ /* end: all zeroes */ }
};

static struct pci_driver ivt_uncore_pci_driver = {
	.name		= "ivt_uncore",
	.id_table	= ivt_uncore_pci_ids,
};
/* end of IvyTown uncore support */

/* Sandy Bridge uncore support */
static void snb_uncore_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;

	if (hwc->idx < UNCORE_PMC_IDX_FIXED)
		wrmsrl(hwc->config_base, hwc->config | SNB_UNC_CTL_EN);
	else
		wrmsrl(hwc->config_base, SNB_UNC_CTL_EN);
}

static void snb_uncore_msr_disable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	wrmsrl(event->hw.config_base, 0);
}

static void snb_uncore_msr_init_box(struct intel_uncore_box *box)
{
	if (box->pmu->pmu_idx == 0) {
		wrmsrl(SNB_UNC_PERF_GLOBAL_CTL,
			SNB_UNC_GLOBAL_CTL_EN | SNB_UNC_GLOBAL_CTL_CORE_ALL);
	}
}
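
/* Only the first cbox PMU instance programs the global control MSR. */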

static struct uncore_event_desc snb_uncore_events[] = {
	INTEL_UNCORE_EVENT_DESC(clockticks, "event=0xff,umask=0x00"),
	{ /* end: all zeroes */ },
};

static struct attribute *snb_uncore_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_cmask5.attr,
	NULL,
};

static struct attribute_group snb_uncore_format_group = {
	.name = "format",
	.attrs = snb_uncore_formats_attr,
};

static struct intel_uncore_ops snb_uncore_msr_ops = {
	.init_box	= snb_uncore_msr_init_box,
	.disable_event	= snb_uncore_msr_disable_event,
	.enable_event	= snb_uncore_msr_enable_event,
	.read_counter	= uncore_msr_read_counter,
};

static struct event_constraint snb_uncore_cbox_constraints[] = {
	UNCORE_EVENT_CONSTRAINT(0x80, 0x1),
	UNCORE_EVENT_CONSTRAINT(0x83, 0x1),
	EVENT_CONSTRAINT_END
};

static struct intel_uncore_type snb_uncore_cbox = {
	.perf_ctr_bits	= 44,
	.fixed_ctr_bits	= 48,
	.perf_ctr	= SNB_UNC_CBO_0_PER_CTR0,
	.event_ctl	= SNB_UNC_CBO_0_PERFEVTSEL0,
	.fixed_ctr	= SNB_UNC_FIXED_CTR,
	.fixed_ctl	= SNB_UNC_FIXED_CTR_CTRL,
	.event_mask	= SNB_UNC_RAW_EVENT_MASK,
	.msr_offset	= SNB_UNC_CBO_MSR_OFFSET,
	.constraints	= snb_uncore_cbox_constraints,
	.ops		= &snb_uncore_msr_ops,
	.format_group	= &snb_uncore_format_group,
	.event_descs	= snb_uncore_events,
};

static struct intel_uncore_type *snb_msr_uncores[] = {
	&snb_uncore_cbox,
	NULL,
};
/* end of Sandy Bridge uncore support */

/* Nehalem uncore support */
static void nhm_uncore_msr_disable_box(struct intel_uncore_box *box)
{
	wrmsrl(NHM_UNC_PERF_GLOBAL_CTL, 0);
}

static void nhm_uncore_msr_enable_box(struct intel_uncore_box *box)
{
	wrmsrl(NHM_UNC_PERF_GLOBAL_CTL, NHM_UNC_GLOBAL_CTL_EN_PC_ALL | NHM_UNC_GLOBAL_CTL_EN_FC);
}

static void nhm_uncore_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;

	if (hwc->idx < UNCORE_PMC_IDX_FIXED)
		wrmsrl(hwc->config_base, hwc->config | SNB_UNC_CTL_EN);
	else
		wrmsrl(hwc->config_base, NHM_UNC_FIXED_CTR_CTL_EN);
}
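
/*
 * Note the fixed counter is enabled with its own control encoding,
 * NHM_UNC_FIXED_CTR_CTL_EN, rather than the generic SNB_UNC_CTL_EN.
 */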

static struct attribute *nhm_uncore_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_cmask8.attr,
	NULL,
};

static struct attribute_group nhm_uncore_format_group = {
	.name = "format",
	.attrs = nhm_uncore_formats_attr,
};

static struct uncore_event_desc nhm_uncore_events[] = {
	INTEL_UNCORE_EVENT_DESC(clockticks,                "event=0xff,umask=0x00"),
	INTEL_UNCORE_EVENT_DESC(qmc_writes_full_any,       "event=0x2f,umask=0x0f"),
	INTEL_UNCORE_EVENT_DESC(qmc_normal_reads_any,      "event=0x2c,umask=0x0f"),
	INTEL_UNCORE_EVENT_DESC(qhl_request_ioh_reads,     "event=0x20,umask=0x01"),
	INTEL_UNCORE_EVENT_DESC(qhl_request_ioh_writes,    "event=0x20,umask=0x02"),
	INTEL_UNCORE_EVENT_DESC(qhl_request_remote_reads,  "event=0x20,umask=0x04"),
	INTEL_UNCORE_EVENT_DESC(qhl_request_remote_writes, "event=0x20,umask=0x08"),
	INTEL_UNCORE_EVENT_DESC(qhl_request_local_reads,   "event=0x20,umask=0x10"),
	INTEL_UNCORE_EVENT_DESC(qhl_request_local_writes,  "event=0x20,umask=0x20"),
	{ /* end: all zeroes */ },
};

static struct intel_uncore_ops nhm_uncore_msr_ops = {
	.disable_box	= nhm_uncore_msr_disable_box,
	.enable_box	= nhm_uncore_msr_enable_box,
	.disable_event	= snb_uncore_msr_disable_event,
	.enable_event	= nhm_uncore_msr_enable_event,
	.read_counter	= uncore_msr_read_counter,
};

static struct intel_uncore_type nhm_uncore = {
	.perf_ctr_bits	= 48,
	.fixed_ctr_bits	= 48,
	.event_ctl	= NHM_UNC_PERFEVTSEL0,
	.perf_ctr	= NHM_UNC_UNCORE_PMC0,
	.fixed_ctr	= NHM_UNC_FIXED_CTR,
	.fixed_ctl	= NHM_UNC_FIXED_CTR_CTRL,
	.event_mask	= NHM_UNC_RAW_EVENT_MASK,
	.event_descs	= nhm_uncore_events,
	.ops		= &nhm_uncore_msr_ops,
	.format_group	= &nhm_uncore_format_group,
};

static struct intel_uncore_type *nhm_msr_uncores[] = {
	&nhm_uncore,
	NULL,
};
/* end of Nehalem uncore support */

/* Nehalem-EX uncore support */
DEFINE_UNCORE_FORMAT_ATTR(event5, event, "config:1-5");
DEFINE_UNCORE_FORMAT_ATTR(counter, counter, "config:6-7");
DEFINE_UNCORE_FORMAT_ATTR(match, match, "config1:0-63");
DEFINE_UNCORE_FORMAT_ATTR(mask, mask, "config2:0-63");

static void nhmex_uncore_msr_init_box(struct intel_uncore_box *box)
{
	wrmsrl(NHMEX_U_MSR_PMON_GLOBAL_CTL, NHMEX_U_PMON_GLOBAL_EN_ALL);
}

static void nhmex_uncore_msr_disable_box(struct intel_uncore_box *box)
{
	unsigned msr = uncore_msr_box_ctl(box);
	u64 config;

	if (msr) {
		rdmsrl(msr, config);
		config &= ~((1ULL << uncore_num_counters(box)) - 1);
		/* WBox has a fixed counter */
		if (uncore_msr_fixed_ctl(box))
			config &= ~NHMEX_W_PMON_GLOBAL_FIXED_EN;
		wrmsrl(msr, config);
	}
}

static void nhmex_uncore_msr_enable_box(struct intel_uncore_box *box)
{
	unsigned msr = uncore_msr_box_ctl(box);
	u64 config;

	if (msr) {
		rdmsrl(msr, config);
		config |= (1ULL << uncore_num_counters(box)) - 1;
		/* WBox has a fixed counter */
		if (uncore_msr_fixed_ctl(box))
			config |= NHMEX_W_PMON_GLOBAL_FIXED_EN;
		wrmsrl(msr, config);
	}
}

static void nhmex_uncore_msr_disable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	wrmsrl(event->hw.config_base, 0);
}

static void nhmex_uncore_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;

	if (hwc->idx >= UNCORE_PMC_IDX_FIXED)
		wrmsrl(hwc->config_base, NHMEX_PMON_CTL_EN_BIT0);
	else if (box->pmu->type->event_mask & NHMEX_PMON_CTL_EN_BIT0)
		wrmsrl(hwc->config_base, hwc->config | NHMEX_PMON_CTL_EN_BIT22);
	else
		wrmsrl(hwc->config_base, hwc->config | NHMEX_PMON_CTL_EN_BIT0);
}
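
/*
 * On NHM-EX/WSM-EX the position of the enable bit differs per box: if
 * bit 0 is already part of the box's event mask, bit 22 acts as the
 * enable bit, otherwise bit 0 does; the cascade above picks the right
 * one.
 */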

#define NHMEX_UNCORE_OPS_COMMON_INIT()				\
	.init_box	= nhmex_uncore_msr_init_box,		\
	.disable_box	= nhmex_uncore_msr_disable_box,		\
	.enable_box	= nhmex_uncore_msr_enable_box,		\
	.disable_event	= nhmex_uncore_msr_disable_event,	\
	.read_counter	= uncore_msr_read_counter

static struct intel_uncore_ops nhmex_uncore_ops = {
	NHMEX_UNCORE_OPS_COMMON_INIT(),
	.enable_event	= nhmex_uncore_msr_enable_event,
};

static struct attribute *nhmex_uncore_ubox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_edge.attr,
	NULL,
};

static struct attribute_group nhmex_uncore_ubox_format_group = {
	.name = "format",
	.attrs = nhmex_uncore_ubox_formats_attr,
};
= {
1578 .perf_ctr_bits
= 48,
1579 .event_ctl
= NHMEX_U_MSR_PMON_EV_SEL
,
1580 .perf_ctr
= NHMEX_U_MSR_PMON_CTR
,
1581 .event_mask
= NHMEX_U_PMON_RAW_EVENT_MASK
,
1582 .box_ctl
= NHMEX_U_MSR_PMON_GLOBAL_CTL
,
1583 .ops
= &nhmex_uncore_ops
,
1584 .format_group
= &nhmex_uncore_ubox_format_group

static struct attribute *nhmex_uncore_cbox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh8.attr,
	NULL,
};

static struct attribute_group nhmex_uncore_cbox_format_group = {
	.name = "format",
	.attrs = nhmex_uncore_cbox_formats_attr,
};

/* msr offset for each instance of cbox */
static unsigned nhmex_cbox_msr_offsets[] = {
	0x0, 0x80, 0x40, 0xc0, 0x20, 0xa0, 0x60, 0xe0, 0x240, 0x2c0,
};

static struct intel_uncore_type nhmex_uncore_cbox = {
	.perf_ctr_bits	= 48,
	.event_ctl	= NHMEX_C0_MSR_PMON_EV_SEL0,
	.perf_ctr	= NHMEX_C0_MSR_PMON_CTR0,
	.event_mask	= NHMEX_PMON_RAW_EVENT_MASK,
	.box_ctl	= NHMEX_C0_MSR_PMON_GLOBAL_CTL,
	.msr_offsets	= nhmex_cbox_msr_offsets,
	.ops		= &nhmex_uncore_ops,
	.format_group	= &nhmex_uncore_cbox_format_group,
};

static struct uncore_event_desc nhmex_uncore_wbox_events[] = {
	INTEL_UNCORE_EVENT_DESC(clockticks, "event=0xff,umask=0"),
	{ /* end: all zeroes */ },
};

static struct intel_uncore_type nhmex_uncore_wbox = {
	.perf_ctr_bits	= 48,
	.event_ctl	= NHMEX_W_MSR_PMON_CNT0,
	.perf_ctr	= NHMEX_W_MSR_PMON_EVT_SEL0,
	.fixed_ctr	= NHMEX_W_MSR_PMON_FIXED_CTR,
	.fixed_ctl	= NHMEX_W_MSR_PMON_FIXED_CTL,
	.event_mask	= NHMEX_PMON_RAW_EVENT_MASK,
	.box_ctl	= NHMEX_W_MSR_GLOBAL_CTL,
	.event_descs	= nhmex_uncore_wbox_events,
	.ops		= &nhmex_uncore_ops,
	.format_group	= &nhmex_uncore_cbox_format_group,
};

static int nhmex_bbox_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;
	int ctr, ev_sel;

	ctr = (hwc->config & NHMEX_B_PMON_CTR_MASK) >>
		NHMEX_B_PMON_CTR_SHIFT;
	ev_sel = (hwc->config & NHMEX_B_PMON_CTL_EV_SEL_MASK) >>
		  NHMEX_B_PMON_CTL_EV_SEL_SHIFT;

	/* events that do not use the match/mask registers */
	if ((ctr == 0 && ev_sel > 0x3) || (ctr == 1 && ev_sel > 0x6) ||
	    (ctr == 2 && ev_sel != 0x4) || ctr == 3)
		return 0;

	if (box->pmu->pmu_idx == 0)
		reg1->reg = NHMEX_B0_MSR_MATCH;
	else
		reg1->reg = NHMEX_B1_MSR_MATCH;
	reg1->idx = 0;
	reg1->config = event->attr.config1;
	reg2->config = event->attr.config2;
	return 0;
}

static void nhmex_bbox_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;

	if (reg1->idx != EXTRA_REG_NONE) {
		wrmsrl(reg1->reg, reg1->config);
		wrmsrl(reg1->reg + 1, reg2->config);
	}

	wrmsrl(hwc->config_base, NHMEX_PMON_CTL_EN_BIT0 |
		(hwc->config & NHMEX_B_PMON_CTL_EV_SEL_MASK));
}

/*
 * The Bbox has 4 counters, but each counter monitors different events.
 * Use bits 6-7 in the event config to select counter.
 */
static struct event_constraint nhmex_uncore_bbox_constraints[] = {
	EVENT_CONSTRAINT(0, 1, 0xc0),
	EVENT_CONSTRAINT(0x40, 2, 0xc0),
	EVENT_CONSTRAINT(0x80, 4, 0xc0),
	EVENT_CONSTRAINT(0xc0, 8, 0xc0),
	EVENT_CONSTRAINT_END,
};

static struct attribute *nhmex_uncore_bbox_formats_attr[] = {
	&format_attr_event5.attr,
	&format_attr_counter.attr,
	&format_attr_match.attr,
	&format_attr_mask.attr,
	NULL,
};

static struct attribute_group nhmex_uncore_bbox_format_group = {
	.name = "format",
	.attrs = nhmex_uncore_bbox_formats_attr,
};

static struct intel_uncore_ops nhmex_uncore_bbox_ops = {
	NHMEX_UNCORE_OPS_COMMON_INIT(),
	.enable_event		= nhmex_bbox_msr_enable_event,
	.hw_config		= nhmex_bbox_hw_config,
	.get_constraint		= uncore_get_constraint,
	.put_constraint		= uncore_put_constraint,
};

static struct intel_uncore_type nhmex_uncore_bbox = {
	.perf_ctr_bits	= 48,
	.event_ctl	= NHMEX_B0_MSR_PMON_CTL0,
	.perf_ctr	= NHMEX_B0_MSR_PMON_CTR0,
	.event_mask	= NHMEX_B_PMON_RAW_EVENT_MASK,
	.box_ctl	= NHMEX_B0_MSR_PMON_GLOBAL_CTL,
	.msr_offset	= NHMEX_B_MSR_OFFSET,
	.num_shared_regs = 1,
	.constraints	= nhmex_uncore_bbox_constraints,
	.ops		= &nhmex_uncore_bbox_ops,
	.format_group	= &nhmex_uncore_bbox_format_group,
};

static int nhmex_sbox_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;

	/* only TO_R_PROG_EV event uses the match/mask register */
	if ((hwc->config & NHMEX_PMON_CTL_EV_SEL_MASK) !=
	    NHMEX_S_EVENT_TO_R_PROG_EV)
		return 0;

	if (box->pmu->pmu_idx == 0)
		reg1->reg = NHMEX_S0_MSR_MM_CFG;
	else
		reg1->reg = NHMEX_S1_MSR_MM_CFG;
	reg1->idx = 0;
	reg1->config = event->attr.config1;
	reg2->config = event->attr.config2;
	return 0;
}

static void nhmex_sbox_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;

	if (reg1->idx != EXTRA_REG_NONE) {
		wrmsrl(reg1->reg, 0);
		wrmsrl(reg1->reg + 1, reg1->config);
		wrmsrl(reg1->reg + 2, reg2->config);
		wrmsrl(reg1->reg, NHMEX_S_PMON_MM_CFG_EN);
	}

	wrmsrl(hwc->config_base, hwc->config | NHMEX_PMON_CTL_EN_BIT22);
}

static struct attribute *nhmex_uncore_sbox_formats_attr[] = {
	&format_attr_event.attr,
	&format_attr_umask.attr,
	&format_attr_edge.attr,
	&format_attr_inv.attr,
	&format_attr_thresh8.attr,
	&format_attr_match.attr,
	&format_attr_mask.attr,
	NULL,
};

static struct attribute_group nhmex_uncore_sbox_format_group = {
	.name = "format",
	.attrs = nhmex_uncore_sbox_formats_attr,
};

static struct intel_uncore_ops nhmex_uncore_sbox_ops = {
	NHMEX_UNCORE_OPS_COMMON_INIT(),
	.enable_event		= nhmex_sbox_msr_enable_event,
	.hw_config		= nhmex_sbox_hw_config,
	.get_constraint		= uncore_get_constraint,
	.put_constraint		= uncore_put_constraint,
};

static struct intel_uncore_type nhmex_uncore_sbox = {
	.perf_ctr_bits	= 48,
	.event_ctl	= NHMEX_S0_MSR_PMON_CTL0,
	.perf_ctr	= NHMEX_S0_MSR_PMON_CTR0,
	.event_mask	= NHMEX_PMON_RAW_EVENT_MASK,
	.box_ctl	= NHMEX_S0_MSR_PMON_GLOBAL_CTL,
	.msr_offset	= NHMEX_S_MSR_OFFSET,
	.num_shared_regs = 1,
	.ops		= &nhmex_uncore_sbox_ops,
	.format_group	= &nhmex_uncore_sbox_format_group,
};

enum {
	EXTRA_REG_NHMEX_M_FILTER,
	EXTRA_REG_NHMEX_M_DSP,
	EXTRA_REG_NHMEX_M_ISS,
	EXTRA_REG_NHMEX_M_MAP,
	EXTRA_REG_NHMEX_M_MSC_THR,
	EXTRA_REG_NHMEX_M_PGT,
	EXTRA_REG_NHMEX_M_PLD,
	EXTRA_REG_NHMEX_M_ZDP_CTL_FVC,
};

static struct extra_reg nhmex_uncore_mbox_extra_regs[] = {
	MBOX_INC_SEL_EXTAR_REG(0x0, DSP),
	MBOX_INC_SEL_EXTAR_REG(0x4, MSC_THR),
	MBOX_INC_SEL_EXTAR_REG(0x5, MSC_THR),
	MBOX_INC_SEL_EXTAR_REG(0x9, ISS),
	/* event 0xa uses two extra registers */
	MBOX_INC_SEL_EXTAR_REG(0xa, ISS),
	MBOX_INC_SEL_EXTAR_REG(0xa, PLD),
	MBOX_INC_SEL_EXTAR_REG(0xb, PLD),
	/* events 0xd ~ 0x10 use the same extra register */
	MBOX_INC_SEL_EXTAR_REG(0xd, ZDP_CTL_FVC),
	MBOX_INC_SEL_EXTAR_REG(0xe, ZDP_CTL_FVC),
	MBOX_INC_SEL_EXTAR_REG(0xf, ZDP_CTL_FVC),
	MBOX_INC_SEL_EXTAR_REG(0x10, ZDP_CTL_FVC),
	MBOX_INC_SEL_EXTAR_REG(0x16, PGT),
	MBOX_SET_FLAG_SEL_EXTRA_REG(0x0, DSP),
	MBOX_SET_FLAG_SEL_EXTRA_REG(0x1, ISS),
	MBOX_SET_FLAG_SEL_EXTRA_REG(0x5, PGT),
	MBOX_SET_FLAG_SEL_EXTRA_REG(0x6, MAP),
	EVENT_EXTRA_END
};

/* Nehalem-EX or Westmere-EX ? */
static bool uncore_nhmex;

static bool nhmex_mbox_get_shared_reg(struct intel_uncore_box *box, int idx, u64 config)
{
	struct intel_uncore_extra_reg *er;
	unsigned long flags;
	bool ret = false;
	u64 mask;

	if (idx < EXTRA_REG_NHMEX_M_ZDP_CTL_FVC) {
		er = &box->shared_regs[idx];
		raw_spin_lock_irqsave(&er->lock, flags);
		if (!atomic_read(&er->ref) || er->config == config) {
			atomic_inc(&er->ref);
			er->config = config;
			ret = true;
		}
		raw_spin_unlock_irqrestore(&er->lock, flags);

		return ret;
	}
	/*
	 * The ZDP_CTL_FVC MSR has 4 fields which are used to control
	 * events 0xd ~ 0x10. Besides these 4 fields, there are additional
	 * fields which are shared.
	 */
	idx -= EXTRA_REG_NHMEX_M_ZDP_CTL_FVC;
	if (WARN_ON_ONCE(idx >= 4))
		return false;

	/* mask of the shared fields */
	if (uncore_nhmex)
		mask = NHMEX_M_PMON_ZDP_CTL_FVC_MASK;
	else
		mask = WSMEX_M_PMON_ZDP_CTL_FVC_MASK;
	er = &box->shared_regs[EXTRA_REG_NHMEX_M_ZDP_CTL_FVC];

	raw_spin_lock_irqsave(&er->lock, flags);
	/* add mask of the non-shared field if it's in use */
	if (__BITS_VALUE(atomic_read(&er->ref), idx, 8)) {
		if (uncore_nhmex)
			mask |= NHMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(idx);
		else
			mask |= WSMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(idx);
	}

	if (!atomic_read(&er->ref) || !((er->config ^ config) & mask)) {
		atomic_add(1 << (idx * 8), &er->ref);
		if (uncore_nhmex)
			mask = NHMEX_M_PMON_ZDP_CTL_FVC_MASK |
				NHMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(idx);
		else
			mask = WSMEX_M_PMON_ZDP_CTL_FVC_MASK |
				WSMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(idx);
		er->config &= ~mask;
		er->config |= (config & mask);
		ret = true;
	}
	raw_spin_unlock_irqrestore(&er->lock, flags);

	return ret;
}

static void nhmex_mbox_put_shared_reg(struct intel_uncore_box *box, int idx)
{
	struct intel_uncore_extra_reg *er;

	if (idx < EXTRA_REG_NHMEX_M_ZDP_CTL_FVC) {
		er = &box->shared_regs[idx];
		atomic_dec(&er->ref);
		return;
	}

	idx -= EXTRA_REG_NHMEX_M_ZDP_CTL_FVC;
	er = &box->shared_regs[EXTRA_REG_NHMEX_M_ZDP_CTL_FVC];
	atomic_sub(1 << (idx * 8), &er->ref);
}
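
/*
 * Mbox events 0xd ~ 0x10 can be moved between the four fields of the
 * ZDP_CTL_FVC register; nhmex_mbox_alter_er() recomputes an event's
 * config and selector for a new field index.
 */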
static u64 nhmex_mbox_alter_er(struct perf_event *event, int new_idx, bool modify)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	u64 idx, orig_idx = __BITS_VALUE(reg1->idx, 0, 8);
	u64 config = reg1->config;

	/* get the non-shared control bits and shift them */
	idx = orig_idx - EXTRA_REG_NHMEX_M_ZDP_CTL_FVC;
	if (uncore_nhmex)
		config &= NHMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(idx);
	else
		config &= WSMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(idx);
	if (new_idx > orig_idx) {
		idx = new_idx - orig_idx;
		config <<= 3 * idx;
	} else {
		idx = orig_idx - new_idx;
		config >>= 3 * idx;
	}

	/* add the shared control bits back */
	if (uncore_nhmex)
		config |= NHMEX_M_PMON_ZDP_CTL_FVC_MASK & reg1->config;
	else
		config |= WSMEX_M_PMON_ZDP_CTL_FVC_MASK & reg1->config;
	config |= NHMEX_M_PMON_ZDP_CTL_FVC_MASK & reg1->config;
	if (modify) {
		/* adjust the main event selector */
		if (new_idx > orig_idx)
			hwc->config += idx << NHMEX_M_PMON_CTL_INC_SEL_SHIFT;
		else
			hwc->config -= idx << NHMEX_M_PMON_CTL_INC_SEL_SHIFT;
		reg1->config = config;
		reg1->idx = ~0xff | new_idx;
	}
	return config;
}

static struct event_constraint *
nhmex_mbox_get_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct hw_perf_event_extra *reg2 = &event->hw.branch_reg;
	int i, idx[2], alloc = 0;
	u64 config1 = reg1->config;

	idx[0] = __BITS_VALUE(reg1->idx, 0, 8);
	idx[1] = __BITS_VALUE(reg1->idx, 1, 8);
again:
	for (i = 0; i < 2; i++) {
		if (!uncore_box_is_fake(box) && (reg1->alloc & (0x1 << i)))
			idx[i] = 0xff;

		if (idx[i] == 0xff)
			continue;

		if (!nhmex_mbox_get_shared_reg(box, idx[i],
				__BITS_VALUE(config1, i, 32)))
			goto fail;
		alloc |= (0x1 << i);
	}

	/* for the match/mask registers */
	if (reg2->idx != EXTRA_REG_NONE &&
	    (uncore_box_is_fake(box) || !reg2->alloc) &&
	    !nhmex_mbox_get_shared_reg(box, reg2->idx, reg2->config))
		goto fail;

	/*
	 * If it's a fake box -- as per validate_{group,event}() we
	 * shouldn't touch event state and we can avoid doing so
	 * since both will only call get_event_constraints() once
	 * on each event, this avoids the need for reg->alloc.
	 */
	if (!uncore_box_is_fake(box)) {
		if (idx[0] != 0xff && idx[0] != __BITS_VALUE(reg1->idx, 0, 8))
			nhmex_mbox_alter_er(event, idx[0], true);
		reg1->alloc |= alloc;
		if (reg2->idx != EXTRA_REG_NONE)
			reg2->alloc = 1;
	}
	return NULL;
fail:
	if (idx[0] != 0xff && !(alloc & 0x1) &&
	    idx[0] >= EXTRA_REG_NHMEX_M_ZDP_CTL_FVC) {
		/*
		 * events 0xd ~ 0x10 are functional identical, but are
		 * controlled by different fields in the ZDP_CTL_FVC
		 * register. If we failed to take one field, try the
		 * rest of the fields.
		 */
		BUG_ON(__BITS_VALUE(reg1->idx, 1, 8) != 0xff);
		idx[0] -= EXTRA_REG_NHMEX_M_ZDP_CTL_FVC;
		idx[0] = (idx[0] + 1) % 4;
		idx[0] += EXTRA_REG_NHMEX_M_ZDP_CTL_FVC;
		if (idx[0] != __BITS_VALUE(reg1->idx, 0, 8)) {
			config1 = nhmex_mbox_alter_er(event, idx[0], false);
			goto again;
		}
	}

	if (alloc & 0x1)
		nhmex_mbox_put_shared_reg(box, idx[0]);
	if (alloc & 0x2)
		nhmex_mbox_put_shared_reg(box, idx[1]);
	return &constraint_empty;
}
2031 static void nhmex_mbox_put_constraint(struct intel_uncore_box
*box
, struct perf_event
*event
)
2033 struct hw_perf_event_extra
*reg1
= &event
->hw
.extra_reg
;
2034 struct hw_perf_event_extra
*reg2
= &event
->hw
.branch_reg
;
2036 if (uncore_box_is_fake(box
))
2039 if (reg1
->alloc
& 0x1)
2040 nhmex_mbox_put_shared_reg(box
, __BITS_VALUE(reg1
->idx
, 0, 8));
2041 if (reg1
->alloc
& 0x2)
2042 nhmex_mbox_put_shared_reg(box
, __BITS_VALUE(reg1
->idx
, 1, 8));
2046 nhmex_mbox_put_shared_reg(box
, reg2
->idx
);
2051 static int nhmex_mbox_extra_reg_idx(struct extra_reg
*er
)
2053 if (er
->idx
< EXTRA_REG_NHMEX_M_ZDP_CTL_FVC
)
2055 return er
->idx
+ (er
->event
>> NHMEX_M_PMON_CTL_INC_SEL_SHIFT
) - 0xd;
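/*
 * Example of the mapping above (pure arithmetic): for an FVC extra
 * register entry, er->idx is EXTRA_REG_NHMEX_M_ZDP_CTL_FVC and the
 * event's inc_sel lies in 0xd ~ 0x10, so inc_sel 0xd maps to the FVC
 * base index, 0xe to base + 1, and so on -- one shared-register slot
 * per ZDP_CTL_FVC field.
 */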
static int nhmex_mbox_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct intel_uncore_type *type = box->pmu->type;
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct hw_perf_event_extra *reg2 = &event->hw.branch_reg;
	struct extra_reg *er;
	unsigned msr;
	int reg_idx = 0;
	/*
	 * The mbox events may require 2 extra MSRs at the most. But only
	 * the lower 32 bits in these MSRs are significant, so we can use
	 * config1 to pass two MSRs' config.
	 */
	for (er = nhmex_uncore_mbox_extra_regs; er->msr; er++) {
		if (er->event != (event->hw.config & er->config_mask))
			continue;
		if (event->attr.config1 & ~er->valid_mask)
			return -EINVAL;

		msr = er->msr + type->msr_offset * box->pmu->pmu_idx;
		if (WARN_ON_ONCE(msr >= 0xffff || er->idx >= 0xff))
			return -EINVAL;

		/* always use the 32~63 bits to pass the PLD config */
		if (er->idx == EXTRA_REG_NHMEX_M_PLD)
			reg_idx = 1;
		else if (WARN_ON_ONCE(reg_idx > 0))
			return -EINVAL;

		reg1->idx &= ~(0xff << (reg_idx * 8));
		reg1->reg &= ~(0xffff << (reg_idx * 16));
		reg1->idx |= nhmex_mbox_extra_reg_idx(er) << (reg_idx * 8);
		reg1->reg |= msr << (reg_idx * 16);
		reg1->config = event->attr.config1;
		reg_idx++;
	}
	/*
	 * The mbox only provides ability to perform address matching
	 * for the PLD events.
	 */
	if (reg_idx == 2) {
		reg2->idx = EXTRA_REG_NHMEX_M_FILTER;
		if (event->attr.config2 & NHMEX_M_PMON_MM_CFG_EN)
			reg2->config = event->attr.config2;
		else
			reg2->config = ~0ULL;
		if (box->pmu->pmu_idx == 0)
			reg2->reg = NHMEX_M0_MSR_PMU_MM_CFG;
		else
			reg2->reg = NHMEX_M1_MSR_PMU_MM_CFG;
	}
	return 0;
}
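/*
 * Layout sketch of the packed fields written above (illustrative): byte
 * 0 and byte 1 of reg1->idx hold the shared-register indices of up to
 * two extra MSRs, and the two 16-bit halves of reg1->reg hold their MSR
 * addresses.  E.g. reg1->idx == 0x0b02 decodes via __BITS_VALUE() to
 * index 0x02 for the first extra register and 0x0b for the second;
 * 0xff marks an unused byte.
 */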
static u64 nhmex_mbox_shared_reg_config(struct intel_uncore_box *box, int idx)
{
	struct intel_uncore_extra_reg *er;
	unsigned long flags;
	u64 config;

	if (idx < EXTRA_REG_NHMEX_M_ZDP_CTL_FVC)
		return box->shared_regs[idx].config;

	er = &box->shared_regs[EXTRA_REG_NHMEX_M_ZDP_CTL_FVC];
	raw_spin_lock_irqsave(&er->lock, flags);
	config = er->config;
	raw_spin_unlock_irqrestore(&er->lock, flags);

	return config;
}

static void nhmex_mbox_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;
	int idx;

	idx = __BITS_VALUE(reg1->idx, 0, 8);
	if (idx != 0xff)
		wrmsrl(__BITS_VALUE(reg1->reg, 0, 16),
			nhmex_mbox_shared_reg_config(box, idx));
	idx = __BITS_VALUE(reg1->idx, 1, 8);
	if (idx != 0xff)
		wrmsrl(__BITS_VALUE(reg1->reg, 1, 16),
			nhmex_mbox_shared_reg_config(box, idx));

	if (reg2->idx != EXTRA_REG_NONE) {
		wrmsrl(reg2->reg, 0);
		if (reg2->config != ~0ULL) {
			wrmsrl(reg2->reg + 1,
				reg2->config & NHMEX_M_PMON_ADDR_MATCH_MASK);
			wrmsrl(reg2->reg + 2, NHMEX_M_PMON_ADDR_MASK_MASK &
				(reg2->config >> NHMEX_M_PMON_ADDR_MASK_SHIFT));
			wrmsrl(reg2->reg, NHMEX_M_PMON_MM_CFG_EN);
		}
	}

	wrmsrl(hwc->config_base, hwc->config | NHMEX_PMON_CTL_EN_BIT0);
}
DEFINE_UNCORE_FORMAT_ATTR(count_mode, count_mode, "config:2-3");
DEFINE_UNCORE_FORMAT_ATTR(storage_mode, storage_mode, "config:4-5");
DEFINE_UNCORE_FORMAT_ATTR(wrap_mode, wrap_mode, "config:6");
DEFINE_UNCORE_FORMAT_ATTR(flag_mode, flag_mode, "config:7");
DEFINE_UNCORE_FORMAT_ATTR(inc_sel, inc_sel, "config:9-13");
DEFINE_UNCORE_FORMAT_ATTR(set_flag_sel, set_flag_sel, "config:19-21");
DEFINE_UNCORE_FORMAT_ATTR(filter_cfg_en, filter_cfg_en, "config2:63");
DEFINE_UNCORE_FORMAT_ATTR(filter_match, filter_match, "config2:0-33");
DEFINE_UNCORE_FORMAT_ATTR(filter_mask, filter_mask, "config2:34-61");
DEFINE_UNCORE_FORMAT_ATTR(dsp, dsp, "config1:0-31");
DEFINE_UNCORE_FORMAT_ATTR(thr, thr, "config1:0-31");
DEFINE_UNCORE_FORMAT_ATTR(fvc, fvc, "config1:0-31");
DEFINE_UNCORE_FORMAT_ATTR(pgt, pgt, "config1:0-31");
DEFINE_UNCORE_FORMAT_ATTR(map, map, "config1:0-31");
DEFINE_UNCORE_FORMAT_ATTR(iss, iss, "config1:0-31");
DEFINE_UNCORE_FORMAT_ATTR(pld, pld, "config1:32-63");
static struct attribute *nhmex_uncore_mbox_formats_attr[] = {
	&format_attr_count_mode.attr,
	&format_attr_storage_mode.attr,
	&format_attr_wrap_mode.attr,
	&format_attr_flag_mode.attr,
	&format_attr_inc_sel.attr,
	&format_attr_set_flag_sel.attr,
	&format_attr_filter_cfg_en.attr,
	&format_attr_filter_match.attr,
	&format_attr_filter_mask.attr,
	&format_attr_dsp.attr,
	&format_attr_thr.attr,
	&format_attr_fvc.attr,
	&format_attr_pgt.attr,
	&format_attr_map.attr,
	&format_attr_iss.attr,
	&format_attr_pld.attr,
	NULL,
};

static struct attribute_group nhmex_uncore_mbox_format_group = {
	.name		= "format",
	.attrs		= nhmex_uncore_mbox_formats_attr,
};

static struct uncore_event_desc nhmex_uncore_mbox_events[] = {
	INTEL_UNCORE_EVENT_DESC(bbox_cmds_read, "inc_sel=0xd,fvc=0x2800"),
	INTEL_UNCORE_EVENT_DESC(bbox_cmds_write, "inc_sel=0xd,fvc=0x2820"),
	{ /* end: all zeroes */ },
};

static struct uncore_event_desc wsmex_uncore_mbox_events[] = {
	INTEL_UNCORE_EVENT_DESC(bbox_cmds_read, "inc_sel=0xd,fvc=0x5000"),
	INTEL_UNCORE_EVENT_DESC(bbox_cmds_write, "inc_sel=0xd,fvc=0x5040"),
	{ /* end: all zeroes */ },
};

static struct intel_uncore_ops nhmex_uncore_mbox_ops = {
	NHMEX_UNCORE_OPS_COMMON_INIT(),
	.enable_event	= nhmex_mbox_msr_enable_event,
	.hw_config	= nhmex_mbox_hw_config,
	.get_constraint	= nhmex_mbox_get_constraint,
	.put_constraint	= nhmex_mbox_put_constraint,
};

static struct intel_uncore_type nhmex_uncore_mbox = {
	.name			= "mbox",
	.num_counters		= 6,
	.num_boxes		= 2,
	.perf_ctr_bits		= 48,
	.event_ctl		= NHMEX_M0_MSR_PMU_CTL0,
	.perf_ctr		= NHMEX_M0_MSR_PMU_CNT0,
	.event_mask		= NHMEX_M_PMON_RAW_EVENT_MASK,
	.box_ctl		= NHMEX_M0_MSR_GLOBAL_CTL,
	.msr_offset		= NHMEX_M_MSR_OFFSET,
	.pair_ctr_ctl		= 1,
	.num_shared_regs	= 8,
	.event_descs		= nhmex_uncore_mbox_events,
	.ops			= &nhmex_uncore_mbox_ops,
	.format_group		= &nhmex_uncore_mbox_format_group,
};
static void nhmex_rbox_alter_er(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;

	/* adjust the main event selector and extra register index */
	if (reg1->idx % 2) {
		reg1->idx--;
		hwc->config -= 1 << NHMEX_R_PMON_CTL_EV_SEL_SHIFT;
	} else {
		reg1->idx++;
		hwc->config += 1 << NHMEX_R_PMON_CTL_EV_SEL_SHIFT;
	}

	/* adjust extra register config */
	switch (reg1->idx % 6) {
	case 2:
		/* shift the 8~15 bits to the 0~7 bits */
		reg1->config >>= 8;
		break;
	case 3:
		/* shift the 0~7 bits to the 8~15 bits */
		reg1->config <<= 8;
		break;
	}
}

/*
 * Each rbox has 4 event set which monitor PQI port 0~3 or 4~7.
 * An event set consists of 6 events, the 3rd and 4th events in
 * an event set use the same extra register. So an event set uses
 * 5 extra registers.
 */
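/*
 * Example of the layout just described (indices illustrative): within
 * one event set, events 0 and 1 each own an extra register, events 2
 * and 3 share one (the low and high byte respectively), and events 4
 * and 5 each own one -- 5 shared-register slots per set, hence the
 * "er_idx += (reg1->idx / 6) * 5" stride below.
 */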
static struct event_constraint *
nhmex_rbox_get_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;
	struct intel_uncore_extra_reg *er;
	unsigned long flags;
	int idx, er_idx;
	u64 config1;
	bool ok = false;

	if (!uncore_box_is_fake(box) && reg1->alloc)
		return NULL;

	idx = reg1->idx % 6;
	config1 = reg1->config;
again:
	er_idx = idx;
	/* the 3rd and 4th events use the same extra register */
	if (er_idx > 2)
		er_idx--;
	er_idx += (reg1->idx / 6) * 5;

	er = &box->shared_regs[er_idx];
	raw_spin_lock_irqsave(&er->lock, flags);
	if (idx < 2) {
		if (!atomic_read(&er->ref) || er->config == reg1->config) {
			atomic_inc(&er->ref);
			er->config = reg1->config;
			ok = true;
		}
	} else if (idx == 2 || idx == 3) {
		/*
		 * these two events use different fields in a extra register,
		 * the 0~7 bits and the 8~15 bits respectively.
		 */
		u64 mask = 0xff << ((idx - 2) * 8);
		if (!__BITS_VALUE(atomic_read(&er->ref), idx - 2, 8) ||
		    !((er->config ^ config1) & mask)) {
			atomic_add(1 << ((idx - 2) * 8), &er->ref);
			er->config &= ~mask;
			er->config |= config1 & mask;
			ok = true;
		}
	} else {
		if (!atomic_read(&er->ref) ||
		    (er->config == (hwc->config >> 32) &&
		     er->config1 == reg1->config &&
		     er->config2 == reg2->config)) {
			atomic_inc(&er->ref);
			er->config = (hwc->config >> 32);
			er->config1 = reg1->config;
			er->config2 = reg2->config;
			ok = true;
		}
	}
	raw_spin_unlock_irqrestore(&er->lock, flags);

	if (!ok) {
		/*
		 * The Rbox events are always in pairs. The paired
		 * events are functional identical, but use different
		 * extra registers. If we failed to take an extra
		 * register, try the alternative.
		 */
		idx ^= 1;
		if (idx != reg1->idx % 6) {
			if (idx == 2)
				config1 >>= 8;
			else if (idx == 3)
				config1 <<= 8;
			goto again;
		}
	} else {
		if (!uncore_box_is_fake(box)) {
			if (idx != reg1->idx % 6)
				nhmex_rbox_alter_er(box, event);
			reg1->alloc = 1;
		}
		return NULL;
	}
	return &constraint_empty;
}

static void nhmex_rbox_put_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct intel_uncore_extra_reg *er;
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	int idx, er_idx;

	if (uncore_box_is_fake(box) || !reg1->alloc)
		return;

	idx = reg1->idx % 6;
	er_idx = idx;
	if (er_idx > 2)
		er_idx--;
	er_idx += (reg1->idx / 6) * 5;

	er = &box->shared_regs[er_idx];
	if (idx == 2 || idx == 3)
		atomic_sub(1 << ((idx - 2) * 8), &er->ref);
	else
		atomic_dec(&er->ref);

	reg1->alloc = 0;
}
static int nhmex_rbox_hw_config(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &event->hw.extra_reg;
	struct hw_perf_event_extra *reg2 = &event->hw.branch_reg;
	int idx;

	idx = (event->hw.config & NHMEX_R_PMON_CTL_EV_SEL_MASK) >>
		NHMEX_R_PMON_CTL_EV_SEL_SHIFT;
	if (idx >= 0x18)
		return -EINVAL;

	reg1->idx = idx;
	reg1->config = event->attr.config1;

	switch (idx % 6) {
	case 4:
	case 5:
		hwc->config |= event->attr.config & (~0ULL << 32);
		reg2->config = event->attr.config2;
		break;
	}
	return 0;
}
static void nhmex_rbox_msr_enable_event(struct intel_uncore_box *box, struct perf_event *event)
{
	struct hw_perf_event *hwc = &event->hw;
	struct hw_perf_event_extra *reg1 = &hwc->extra_reg;
	struct hw_perf_event_extra *reg2 = &hwc->branch_reg;
	int idx, port;

	idx = reg1->idx;
	port = idx / 6 + box->pmu->pmu_idx * 4;

	switch (idx % 6) {
	case 0:
		wrmsrl(NHMEX_R_MSR_PORTN_IPERF_CFG0(port), reg1->config);
		break;
	case 1:
		wrmsrl(NHMEX_R_MSR_PORTN_IPERF_CFG1(port), reg1->config);
		break;
	case 2:
	case 3:
		wrmsrl(NHMEX_R_MSR_PORTN_QLX_CFG(port),
			uncore_shared_reg_config(box, 2 + (idx / 6) * 5));
		break;
	case 4:
		wrmsrl(NHMEX_R_MSR_PORTN_XBR_SET1_MM_CFG(port),
			hwc->config >> 32);
		wrmsrl(NHMEX_R_MSR_PORTN_XBR_SET1_MATCH(port), reg1->config);
		wrmsrl(NHMEX_R_MSR_PORTN_XBR_SET1_MASK(port), reg2->config);
		break;
	case 5:
		wrmsrl(NHMEX_R_MSR_PORTN_XBR_SET2_MM_CFG(port),
			hwc->config >> 32);
		wrmsrl(NHMEX_R_MSR_PORTN_XBR_SET2_MATCH(port), reg1->config);
		wrmsrl(NHMEX_R_MSR_PORTN_XBR_SET2_MASK(port), reg2->config);
		break;
	}

	wrmsrl(hwc->config_base, NHMEX_PMON_CTL_EN_BIT0 |
		(hwc->config & NHMEX_R_PMON_CTL_EV_SEL_MASK));
}
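/*
 * Worked example of the port arithmetic above (values illustrative):
 * with 24 events per rbox (4 sets of 6), an event with reg1->idx == 8
 * on rbox 1 lands on port = 8 / 6 + 1 * 4 = 5, and 8 % 6 == 2 selects
 * the QLX_CFG register shared with its paired event 3.
 */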
DEFINE_UNCORE_FORMAT_ATTR(xbr_mm_cfg, xbr_mm_cfg, "config:32-63");
DEFINE_UNCORE_FORMAT_ATTR(xbr_match, xbr_match, "config1:0-63");
DEFINE_UNCORE_FORMAT_ATTR(xbr_mask, xbr_mask, "config2:0-63");
DEFINE_UNCORE_FORMAT_ATTR(qlx_cfg, qlx_cfg, "config1:0-15");
DEFINE_UNCORE_FORMAT_ATTR(iperf_cfg, iperf_cfg, "config1:0-31");
static struct attribute *nhmex_uncore_rbox_formats_attr[] = {
	&format_attr_event5.attr,
	&format_attr_xbr_mm_cfg.attr,
	&format_attr_xbr_match.attr,
	&format_attr_xbr_mask.attr,
	&format_attr_qlx_cfg.attr,
	&format_attr_iperf_cfg.attr,
	NULL,
};

static struct attribute_group nhmex_uncore_rbox_format_group = {
	.name		= "format",
	.attrs		= nhmex_uncore_rbox_formats_attr,
};

static struct uncore_event_desc nhmex_uncore_rbox_events[] = {
	INTEL_UNCORE_EVENT_DESC(qpi0_flit_send, "event=0x0,iperf_cfg=0x80000000"),
	INTEL_UNCORE_EVENT_DESC(qpi1_filt_send, "event=0x6,iperf_cfg=0x80000000"),
	INTEL_UNCORE_EVENT_DESC(qpi0_idle_filt, "event=0x0,iperf_cfg=0x40000000"),
	INTEL_UNCORE_EVENT_DESC(qpi1_idle_filt, "event=0x6,iperf_cfg=0x40000000"),
	INTEL_UNCORE_EVENT_DESC(qpi0_date_response, "event=0x0,iperf_cfg=0xc4"),
	INTEL_UNCORE_EVENT_DESC(qpi1_date_response, "event=0x6,iperf_cfg=0xc4"),
	{ /* end: all zeroes */ },
};

static struct intel_uncore_ops nhmex_uncore_rbox_ops = {
	NHMEX_UNCORE_OPS_COMMON_INIT(),
	.enable_event	= nhmex_rbox_msr_enable_event,
	.hw_config	= nhmex_rbox_hw_config,
	.get_constraint	= nhmex_rbox_get_constraint,
	.put_constraint	= nhmex_rbox_put_constraint,
};

static struct intel_uncore_type nhmex_uncore_rbox = {
	.name			= "rbox",
	.num_counters		= 8,
	.num_boxes		= 2,
	.perf_ctr_bits		= 48,
	.event_ctl		= NHMEX_R_MSR_PMON_CTL0,
	.perf_ctr		= NHMEX_R_MSR_PMON_CNT0,
	.event_mask		= NHMEX_R_PMON_RAW_EVENT_MASK,
	.box_ctl		= NHMEX_R_MSR_GLOBAL_CTL,
	.msr_offset		= NHMEX_R_MSR_OFFSET,
	.pair_ctr_ctl		= 1,
	.num_shared_regs	= 20,
	.event_descs		= nhmex_uncore_rbox_events,
	.ops			= &nhmex_uncore_rbox_ops,
	.format_group		= &nhmex_uncore_rbox_format_group,
};
static struct intel_uncore_type *nhmex_msr_uncores[] = {
	&nhmex_uncore_ubox,
	&nhmex_uncore_cbox,
	&nhmex_uncore_bbox,
	&nhmex_uncore_sbox,
	&nhmex_uncore_mbox,
	&nhmex_uncore_rbox,
	&nhmex_uncore_wbox,
	NULL,
};
/* end of Nehalem-EX uncore support */
static void uncore_assign_hw_event(struct intel_uncore_box *box, struct perf_event *event, int idx)
{
	struct hw_perf_event *hwc = &event->hw;

	hwc->idx = idx;
	hwc->last_tag = ++box->tags[idx];

	if (hwc->idx == UNCORE_PMC_IDX_FIXED) {
		hwc->event_base = uncore_fixed_ctr(box);
		hwc->config_base = uncore_fixed_ctl(box);
		return;
	}

	hwc->config_base = uncore_event_ctl(box, hwc->idx);
	hwc->event_base = uncore_perf_ctr(box, hwc->idx);
}

static void uncore_perf_event_update(struct intel_uncore_box *box, struct perf_event *event)
{
	u64 prev_count, new_count, delta;
	int shift;

	if (event->hw.idx >= UNCORE_PMC_IDX_FIXED)
		shift = 64 - uncore_fixed_ctr_bits(box);
	else
		shift = 64 - uncore_perf_ctr_bits(box);

	/* the hrtimer might modify the previous event value */
again:
	prev_count = local64_read(&event->hw.prev_count);
	new_count = uncore_read_counter(box, event);
	if (local64_xchg(&event->hw.prev_count, new_count) != prev_count)
		goto again;

	delta = (new_count << shift) - (prev_count << shift);
	delta >>= shift;

	local64_add(delta, &event->count);
}
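/*
 * Arithmetic example for the shift trick above: with 48-bit counters,
 * shift == 16.  If the hardware wrapped from prev_count == 2^48 - 2 to
 * new_count == 1, then (1 << 16) - ((2^48 - 2) << 16) computed modulo
 * 2^64 is 0x30000, and 0x30000 >> 16 == 3 -- the true number of events,
 * with the wraparound absorbed by the unsigned overflow.
 */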
/*
 * The overflow interrupt is unavailable for SandyBridge-EP, is broken
 * for SandyBridge. So we use hrtimer to periodically poll the counter
 * to avoid overflow.
 */
static enum hrtimer_restart uncore_pmu_hrtimer(struct hrtimer *hrtimer)
{
	struct intel_uncore_box *box;
	unsigned long flags;
	int bit;

	box = container_of(hrtimer, struct intel_uncore_box, hrtimer);
	if (!box->n_active || box->cpu != smp_processor_id())
		return HRTIMER_NORESTART;
	/*
	 * disable local interrupt to prevent uncore_pmu_event_start/stop
	 * to interrupt the update process
	 */
	local_irq_save(flags);

	for_each_set_bit(bit, box->active_mask, UNCORE_PMC_IDX_MAX)
		uncore_perf_event_update(box, box->events[bit]);

	local_irq_restore(flags);

	hrtimer_forward_now(hrtimer, ns_to_ktime(UNCORE_PMU_HRTIMER_INTERVAL));
	return HRTIMER_RESTART;
}
static void uncore_pmu_start_hrtimer(struct intel_uncore_box *box)
{
	__hrtimer_start_range_ns(&box->hrtimer,
			ns_to_ktime(UNCORE_PMU_HRTIMER_INTERVAL), 0,
			HRTIMER_MODE_REL_PINNED, 0);
}

static void uncore_pmu_cancel_hrtimer(struct intel_uncore_box *box)
{
	hrtimer_cancel(&box->hrtimer);
}

static void uncore_pmu_init_hrtimer(struct intel_uncore_box *box)
{
	hrtimer_init(&box->hrtimer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
	box->hrtimer.function = uncore_pmu_hrtimer;
}
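/*
 * Sizing note (back-of-envelope, assuming the 60-second
 * UNCORE_PMU_HRTIMER_INTERVAL from the header): a 48-bit counter holds
 * about 2.8e14 events, so even at 10^9 events/sec it would take ~78
 * hours to wrap -- one poll per minute keeps uncore_perf_event_update()
 * far ahead of any overflow.
 */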
struct intel_uncore_box *uncore_alloc_box(struct intel_uncore_type *type, int cpu)
{
	struct intel_uncore_box *box;
	int i, size;

	size = sizeof(*box) + type->num_shared_regs * sizeof(struct intel_uncore_extra_reg);

	box = kmalloc_node(size, GFP_KERNEL | __GFP_ZERO, cpu_to_node(cpu));
	if (!box)
		return NULL;

	for (i = 0; i < type->num_shared_regs; i++)
		raw_spin_lock_init(&box->shared_regs[i].lock);

	uncore_pmu_init_hrtimer(box);
	atomic_set(&box->refcnt, 1);
	box->cpu = -1;
	box->phys_id = -1;

	return box;
}

static struct intel_uncore_box *
uncore_pmu_to_box(struct intel_uncore_pmu *pmu, int cpu)
{
	struct intel_uncore_box *box;

	box = *per_cpu_ptr(pmu->box, cpu);
	if (box)
		return box;

	raw_spin_lock(&uncore_box_lock);
	list_for_each_entry(box, &pmu->box_list, list) {
		if (box->phys_id == topology_physical_package_id(cpu)) {
			atomic_inc(&box->refcnt);
			*per_cpu_ptr(pmu->box, cpu) = box;
			break;
		}
	}
	raw_spin_unlock(&uncore_box_lock);

	return *per_cpu_ptr(pmu->box, cpu);
}

static struct intel_uncore_pmu *uncore_event_to_pmu(struct perf_event *event)
{
	return container_of(event->pmu, struct intel_uncore_pmu, pmu);
}

static struct intel_uncore_box *uncore_event_to_box(struct perf_event *event)
{
	/*
	 * perf core schedules event on the basis of cpu, uncore events are
	 * collected by one of the cpus inside a physical package.
	 */
	return uncore_pmu_to_box(uncore_event_to_pmu(event), smp_processor_id());
}

static int
uncore_collect_events(struct intel_uncore_box *box, struct perf_event *leader, bool dogrp)
{
	struct perf_event *event;
	int n, max_count;

	max_count = box->pmu->type->num_counters;
	if (box->pmu->type->fixed_ctl)
		max_count++;

	if (box->n_events >= max_count)
		return -EINVAL;

	n = box->n_events;
	box->event_list[n] = leader;
	n++;
	if (!dogrp)
		return n;

	list_for_each_entry(event, &leader->sibling_list, group_entry) {
		if (event->state <= PERF_EVENT_STATE_OFF)
			continue;

		if (n >= max_count)
			return -EINVAL;

		box->event_list[n] = event;
		n++;
	}
	return n;
}

static struct event_constraint *
uncore_get_event_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	struct intel_uncore_type *type = box->pmu->type;
	struct event_constraint *c;

	if (type->ops->get_constraint) {
		c = type->ops->get_constraint(box, event);
		if (c)
			return c;
	}

	if (event->hw.config == ~0ULL)
		return &constraint_fixed;

	if (type->constraints) {
		for_each_event_constraint(c, type->constraints) {
			if ((event->hw.config & c->cmask) == c->code)
				return c;
		}
	}

	return &type->unconstrainted;
}

static void uncore_put_event_constraint(struct intel_uncore_box *box, struct perf_event *event)
{
	if (box->pmu->type->ops->put_constraint)
		box->pmu->type->ops->put_constraint(box, event);
}

static int uncore_assign_events(struct intel_uncore_box *box, int assign[], int n)
{
	unsigned long used_mask[BITS_TO_LONGS(UNCORE_PMC_IDX_MAX)];
	struct event_constraint *c;
	int i, wmin, wmax, ret = 0;
	struct hw_perf_event *hwc;

	bitmap_zero(used_mask, UNCORE_PMC_IDX_MAX);

	for (i = 0, wmin = UNCORE_PMC_IDX_MAX, wmax = 0; i < n; i++) {
		hwc = &box->event_list[i]->hw;
		c = uncore_get_event_constraint(box, box->event_list[i]);
		hwc->constraint = c;
		wmin = min(wmin, c->weight);
		wmax = max(wmax, c->weight);
	}

	/* fastpath, try to reuse previous register */
	for (i = 0; i < n; i++) {
		hwc = &box->event_list[i]->hw;
		c = hwc->constraint;

		/* never assigned */
		if (hwc->idx == -1)
			break;

		/* constraint still honored */
		if (!test_bit(hwc->idx, c->idxmsk))
			break;

		/* not already used */
		if (test_bit(hwc->idx, used_mask))
			break;

		__set_bit(hwc->idx, used_mask);
		if (assign)
			assign[i] = hwc->idx;
	}
	/* slow path */
	if (i != n)
		ret = perf_assign_events(box->event_list, n,
					 wmin, wmax, assign);

	if (!assign || ret) {
		for (i = 0; i < n; i++)
			uncore_put_event_constraint(box, box->event_list[i]);
	}
	return ret ? -EINVAL : 0;
}
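/*
 * Scheduling example (weights illustrative): a constraint's weight is
 * the number of counters the event may use, so a fixed-only event has
 * weight 1 while an unconstrained event on a 6-counter box has weight
 * 6.  perf_assign_events() places events from wmin upward, so the most
 * constrained events grab their counters first and the flexible ones
 * fill whatever remains.
 */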
static void uncore_pmu_event_start(struct perf_event *event, int flags)
{
	struct intel_uncore_box *box = uncore_event_to_box(event);
	int idx = event->hw.idx;

	if (WARN_ON_ONCE(!(event->hw.state & PERF_HES_STOPPED)))
		return;

	if (WARN_ON_ONCE(idx == -1 || idx >= UNCORE_PMC_IDX_MAX))
		return;

	event->hw.state = 0;
	box->events[idx] = event;
	box->n_active++;
	__set_bit(idx, box->active_mask);

	local64_set(&event->hw.prev_count, uncore_read_counter(box, event));
	uncore_enable_event(box, event);

	if (box->n_active == 1) {
		uncore_enable_box(box);
		uncore_pmu_start_hrtimer(box);
	}
}

static void uncore_pmu_event_stop(struct perf_event *event, int flags)
{
	struct intel_uncore_box *box = uncore_event_to_box(event);
	struct hw_perf_event *hwc = &event->hw;

	if (__test_and_clear_bit(hwc->idx, box->active_mask)) {
		uncore_disable_event(box, event);
		box->n_active--;
		box->events[hwc->idx] = NULL;
		WARN_ON_ONCE(hwc->state & PERF_HES_STOPPED);
		hwc->state |= PERF_HES_STOPPED;

		if (box->n_active == 0) {
			uncore_disable_box(box);
			uncore_pmu_cancel_hrtimer(box);
		}
	}

	if ((flags & PERF_EF_UPDATE) && !(hwc->state & PERF_HES_UPTODATE)) {
		/*
		 * Drain the remaining delta count out of a event
		 * that we are disabling:
		 */
		uncore_perf_event_update(box, event);
		hwc->state |= PERF_HES_UPTODATE;
	}
}

static int uncore_pmu_event_add(struct perf_event *event, int flags)
{
	struct intel_uncore_box *box = uncore_event_to_box(event);
	struct hw_perf_event *hwc = &event->hw;
	int assign[UNCORE_PMC_IDX_MAX];
	int i, n, ret;

	if (!box)
		return -ENODEV;

	ret = n = uncore_collect_events(box, event, false);
	if (ret < 0)
		return ret;

	hwc->state = PERF_HES_UPTODATE | PERF_HES_STOPPED;
	if (!(flags & PERF_EF_START))
		hwc->state |= PERF_HES_ARCH;

	ret = uncore_assign_events(box, assign, n);
	if (ret)
		return ret;

	/* save events moving to new counters */
	for (i = 0; i < box->n_events; i++) {
		event = box->event_list[i];
		hwc = &event->hw;

		if (hwc->idx == assign[i] &&
			hwc->last_tag == box->tags[assign[i]])
			continue;
		/*
		 * Ensure we don't accidentally enable a stopped
		 * counter simply because we rescheduled.
		 */
		if (hwc->state & PERF_HES_STOPPED)
			hwc->state |= PERF_HES_ARCH;

		uncore_pmu_event_stop(event, PERF_EF_UPDATE);
	}

	/* reprogram moved events into new counters */
	for (i = 0; i < n; i++) {
		event = box->event_list[i];
		hwc = &event->hw;

		if (hwc->idx != assign[i] ||
			hwc->last_tag != box->tags[assign[i]])
			uncore_assign_hw_event(box, event, assign[i]);
		else if (i < box->n_events)
			continue;

		if (hwc->state & PERF_HES_ARCH)
			continue;

		uncore_pmu_event_start(event, 0);
	}
	box->n_events = n;

	return 0;
}

static void uncore_pmu_event_del(struct perf_event *event, int flags)
{
	struct intel_uncore_box *box = uncore_event_to_box(event);
	int i;

	uncore_pmu_event_stop(event, PERF_EF_UPDATE);

	for (i = 0; i < box->n_events; i++) {
		if (event == box->event_list[i]) {
			uncore_put_event_constraint(box, event);

			while (++i < box->n_events)
				box->event_list[i - 1] = box->event_list[i];

			--box->n_events;
			break;
		}
	}

	event->hw.idx = -1;
	event->hw.last_tag = ~0ULL;
}

static void uncore_pmu_event_read(struct perf_event *event)
{
	struct intel_uncore_box *box = uncore_event_to_box(event);
	uncore_perf_event_update(box, event);
}

/*
 * validation ensures the group can be loaded onto the
 * PMU if it was the only group available.
 */
static int uncore_validate_group(struct intel_uncore_pmu *pmu,
				struct perf_event *event)
{
	struct perf_event *leader = event->group_leader;
	struct intel_uncore_box *fake_box;
	int ret = -EINVAL, n;

	fake_box = uncore_alloc_box(pmu->type, smp_processor_id());
	if (!fake_box)
		return -ENOMEM;

	fake_box->pmu = pmu;
	/*
	 * the event is not yet connected with its
	 * siblings therefore we must first collect
	 * existing siblings, then add the new event
	 * before we can simulate the scheduling
	 */
	n = uncore_collect_events(fake_box, leader, true);
	if (n < 0)
		goto out;

	fake_box->n_events = n;
	n = uncore_collect_events(fake_box, event, false);
	if (n < 0)
		goto out;

	fake_box->n_events = n;

	ret = uncore_assign_events(fake_box, NULL, n);
out:
	kfree(fake_box);
	return ret;
}
static int uncore_pmu_event_init(struct perf_event *event)
{
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_box *box;
	struct hw_perf_event *hwc = &event->hw;
	int ret;

	if (event->attr.type != event->pmu->type)
		return -ENOENT;

	pmu = uncore_event_to_pmu(event);
	/* no device found for this pmu */
	if (pmu->func_id < 0)
		return -ENOENT;

	/*
	 * Uncore PMU does measure at all privilege level all the time.
	 * So it doesn't make sense to specify any exclude bits.
	 */
	if (event->attr.exclude_user || event->attr.exclude_kernel ||
			event->attr.exclude_hv || event->attr.exclude_idle)
		return -EINVAL;

	/* Sampling not supported yet */
	if (hwc->sample_period)
		return -EINVAL;

	/*
	 * Place all uncore events for a particular physical package
	 * onto a single cpu.
	 */
	if (event->cpu < 0)
		return -EINVAL;
	box = uncore_pmu_to_box(pmu, event->cpu);
	if (!box || box->cpu < 0)
		return -EINVAL;
	event->cpu = box->cpu;

	event->hw.idx = -1;
	event->hw.last_tag = ~0ULL;
	event->hw.extra_reg.idx = EXTRA_REG_NONE;
	event->hw.branch_reg.idx = EXTRA_REG_NONE;

	if (event->attr.config == UNCORE_FIXED_EVENT) {
		/* no fixed counter */
		if (!pmu->type->fixed_ctl)
			return -EINVAL;
		/*
		 * if there is only one fixed counter, only the first pmu
		 * can access the fixed counter
		 */
		if (pmu->type->single_fixed && pmu->pmu_idx > 0)
			return -EINVAL;
		hwc->config = ~0ULL;
	} else {
		hwc->config = event->attr.config & pmu->type->event_mask;
		if (pmu->type->ops->hw_config) {
			ret = pmu->type->ops->hw_config(box, event);
			if (ret)
				return ret;
		}
	}

	if (event->group_leader != event)
		ret = uncore_validate_group(pmu, event);
	else
		ret = 0;

	return ret;
}

static ssize_t uncore_get_attr_cpumask(struct device *dev,
				struct device_attribute *attr, char *buf)
{
	int n = cpulist_scnprintf(buf, PAGE_SIZE - 2, &uncore_cpu_mask);

	buf[n++] = '\n';
	buf[n] = '\0';
	return n;
}

static DEVICE_ATTR(cpumask, S_IRUGO, uncore_get_attr_cpumask, NULL);

static struct attribute *uncore_pmu_attrs[] = {
	&dev_attr_cpumask.attr,
	NULL,
};

static struct attribute_group uncore_pmu_attr_group = {
	.attrs = uncore_pmu_attrs,
};
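/*
 * Usage example (cpu numbers illustrative): the attribute above appears
 * as /sys/bus/event_source/devices/<pmu>/cpumask and lists one cpu per
 * physical package, e.g. "0,8" on a two-socket machine.  Tools read it
 * to learn which cpu to open uncore events on; the kernel rewrites
 * event->cpu to that owner cpu in uncore_pmu_event_init().
 */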
static int __init uncore_pmu_register(struct intel_uncore_pmu *pmu)
{
	int ret;

	pmu->pmu = (struct pmu) {
		.attr_groups	= pmu->type->attr_groups,
		.task_ctx_nr	= perf_invalid_context,
		.event_init	= uncore_pmu_event_init,
		.add		= uncore_pmu_event_add,
		.del		= uncore_pmu_event_del,
		.start		= uncore_pmu_event_start,
		.stop		= uncore_pmu_event_stop,
		.read		= uncore_pmu_event_read,
	};

	if (pmu->type->num_boxes == 1) {
		if (strlen(pmu->type->name) > 0)
			sprintf(pmu->name, "uncore_%s", pmu->type->name);
		else
			sprintf(pmu->name, "uncore");
	} else {
		sprintf(pmu->name, "uncore_%s_%d", pmu->type->name,
			pmu->pmu_idx);
	}

	ret = perf_pmu_register(&pmu->pmu, pmu->name, -1);
	return ret;
}
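/*
 * Naming example (event values illustrative): a single-box type named
 * "imc" would register as "uncore_imc", while the two mbox PMUs above
 * register as "uncore_mbox_0" and "uncore_mbox_1".  They can then be
 * used from userspace, e.g.:
 *
 *   perf stat -a -e 'uncore_mbox_0/inc_sel=0xd,fvc=0x2800/' -- sleep 1
 */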
static void __init uncore_type_exit(struct intel_uncore_type *type)
{
	int i;

	for (i = 0; i < type->num_boxes; i++)
		free_percpu(type->pmus[i].box);
	kfree(type->pmus);
	type->pmus = NULL;
	kfree(type->events_group);
	type->events_group = NULL;
}

static void __init uncore_types_exit(struct intel_uncore_type **types)
{
	int i;
	for (i = 0; types[i]; i++)
		uncore_type_exit(types[i]);
}

static int __init uncore_type_init(struct intel_uncore_type *type)
{
	struct intel_uncore_pmu *pmus;
	struct attribute_group *attr_group;
	struct attribute **attrs;
	int i, j;

	pmus = kzalloc(sizeof(*pmus) * type->num_boxes, GFP_KERNEL);
	if (!pmus)
		return -ENOMEM;

	type->unconstrainted = (struct event_constraint)
		__EVENT_CONSTRAINT(0, (1ULL << type->num_counters) - 1,
				0, type->num_counters, 0, 0);

	for (i = 0; i < type->num_boxes; i++) {
		pmus[i].func_id = -1;
		pmus[i].pmu_idx = i;
		pmus[i].type = type;
		INIT_LIST_HEAD(&pmus[i].box_list);
		pmus[i].box = alloc_percpu(struct intel_uncore_box *);
		if (!pmus[i].box)
			goto fail;
	}

	type->pmus = pmus;

	if (type->event_descs) {
		i = 0;
		while (type->event_descs[i].attr.attr.name)
			i++;

		attr_group = kzalloc(sizeof(struct attribute *) * (i + 1) +
					sizeof(*attr_group), GFP_KERNEL);
		if (!attr_group)
			goto fail;

		attrs = (struct attribute **)(attr_group + 1);
		attr_group->name = "events";
		attr_group->attrs = attrs;

		for (j = 0; j < i; j++)
			attrs[j] = &type->event_descs[j].attr.attr;

		type->events_group = attr_group;
	}

	type->pmu_group = &uncore_pmu_attr_group;
	return 0;
fail:
	uncore_type_exit(type);
	return -ENOMEM;
}

static int __init uncore_types_init(struct intel_uncore_type **types)
{
	int i, ret;

	for (i = 0; types[i]; i++) {
		ret = uncore_type_init(types[i]);
		if (ret)
			goto fail;
	}
	return 0;
fail:
	while (--i >= 0)
		uncore_type_exit(types[i]);
	return ret;
}

static struct pci_driver *uncore_pci_driver;
static bool pcidrv_registered;

/*
 * add a pci uncore device
 */
static int uncore_pci_add(struct intel_uncore_type *type, struct pci_dev *pdev)
{
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_box *box;
	int i, phys_id;

	phys_id = pcibus_to_physid[pdev->bus->number];
	if (phys_id < 0)
		return -ENODEV;

	box = uncore_alloc_box(type, 0);
	if (!box)
		return -ENOMEM;

	/*
	 * for performance monitoring unit with multiple boxes,
	 * each box has a different function id.
	 */
	for (i = 0; i < type->num_boxes; i++) {
		pmu = &type->pmus[i];
		if (pmu->func_id == pdev->devfn)
			break;
		if (pmu->func_id < 0) {
			pmu->func_id = pdev->devfn;
			break;
		}
		pmu = NULL;
	}

	if (!pmu) {
		kfree(box);
		return -EINVAL;
	}

	box->phys_id = phys_id;
	box->pci_dev = pdev;
	box->pmu = pmu;
	uncore_box_init(box);
	pci_set_drvdata(pdev, box);

	raw_spin_lock(&uncore_box_lock);
	list_add_tail(&box->list, &pmu->box_list);
	raw_spin_unlock(&uncore_box_lock);

	return 0;
}

static void uncore_pci_remove(struct pci_dev *pdev)
{
	struct intel_uncore_box *box = pci_get_drvdata(pdev);
	struct intel_uncore_pmu *pmu = box->pmu;
	int cpu, phys_id = pcibus_to_physid[pdev->bus->number];

	if (WARN_ON_ONCE(phys_id != box->phys_id))
		return;

	pci_set_drvdata(pdev, NULL);

	raw_spin_lock(&uncore_box_lock);
	list_del(&box->list);
	raw_spin_unlock(&uncore_box_lock);

	for_each_possible_cpu(cpu) {
		if (*per_cpu_ptr(pmu->box, cpu) == box) {
			*per_cpu_ptr(pmu->box, cpu) = NULL;
			atomic_dec(&box->refcnt);
		}
	}

	WARN_ON_ONCE(atomic_read(&box->refcnt) != 1);
	kfree(box);
}

static int uncore_pci_probe(struct pci_dev *pdev,
			    const struct pci_device_id *id)
{
	return uncore_pci_add(pci_uncores[id->driver_data], pdev);
}

static int __init uncore_pci_init(void)
{
	int ret;

	switch (boot_cpu_data.x86_model) {
	case 45: /* Sandy Bridge-EP */
		ret = snbep_pci2phy_map_init(0x3ce0);
		if (ret)
			return ret;
		pci_uncores = snbep_pci_uncores;
		uncore_pci_driver = &snbep_uncore_pci_driver;
		break;
	case 62: /* IvyTown */
		ret = snbep_pci2phy_map_init(0x0e1e);
		if (ret)
			return ret;
		pci_uncores = ivt_pci_uncores;
		uncore_pci_driver = &ivt_uncore_pci_driver;
		break;
	default:
		return 0;
	}

	ret = uncore_types_init(pci_uncores);
	if (ret)
		return ret;

	uncore_pci_driver->probe = uncore_pci_probe;
	uncore_pci_driver->remove = uncore_pci_remove;

	ret = pci_register_driver(uncore_pci_driver);
	if (ret == 0)
		pcidrv_registered = true;
	else
		uncore_types_exit(pci_uncores);

	return ret;
}
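/*
 * Mapping example (bus numbers illustrative): snbep_pci2phy_map_init()
 * probes the per-socket PCI device it is given and fills
 * pcibus_to_physid[], so that e.g. pcibus_to_physid[0x3f] == 0 and
 * pcibus_to_physid[0x7f] == 1 on a two-socket system.  uncore_pci_add()
 * then uses the probed device's bus number to attach each PCI uncore
 * box to its package.
 */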
static void __init uncore_pci_exit(void)
{
	if (pcidrv_registered) {
		pcidrv_registered = false;
		pci_unregister_driver(uncore_pci_driver);
		uncore_types_exit(pci_uncores);
	}
}

/* CPU hot plug/unplug are serialized by cpu_add_remove_lock mutex */
static LIST_HEAD(boxes_to_free);

static void __cpuinit uncore_kfree_boxes(void)
{
	struct intel_uncore_box *box;

	while (!list_empty(&boxes_to_free)) {
		box = list_entry(boxes_to_free.next,
				 struct intel_uncore_box, list);
		list_del(&box->list);
		kfree(box);
	}
}

static void __cpuinit uncore_cpu_dying(int cpu)
{
	struct intel_uncore_type *type;
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_box *box;
	int i, j;

	for (i = 0; msr_uncores[i]; i++) {
		type = msr_uncores[i];
		for (j = 0; j < type->num_boxes; j++) {
			pmu = &type->pmus[j];
			box = *per_cpu_ptr(pmu->box, cpu);
			*per_cpu_ptr(pmu->box, cpu) = NULL;
			if (box && atomic_dec_and_test(&box->refcnt))
				list_add(&box->list, &boxes_to_free);
		}
	}
}

static int __cpuinit uncore_cpu_starting(int cpu)
{
	struct intel_uncore_type *type;
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_box *box, *exist;
	int i, j, k, phys_id;

	phys_id = topology_physical_package_id(cpu);

	for (i = 0; msr_uncores[i]; i++) {
		type = msr_uncores[i];
		for (j = 0; j < type->num_boxes; j++) {
			pmu = &type->pmus[j];
			box = *per_cpu_ptr(pmu->box, cpu);
			/* called by uncore_cpu_init? */
			if (box && box->phys_id >= 0) {
				uncore_box_init(box);
				continue;
			}

			for_each_online_cpu(k) {
				exist = *per_cpu_ptr(pmu->box, k);
				if (exist && exist->phys_id == phys_id) {
					atomic_inc(&exist->refcnt);
					*per_cpu_ptr(pmu->box, cpu) = exist;
					if (box) {
						list_add(&box->list,
							 &boxes_to_free);
						box = NULL;
					}
					break;
				}
			}

			if (box) {
				box->phys_id = phys_id;
				uncore_box_init(box);
			}
		}
	}
	return 0;
}

static int __cpuinit uncore_cpu_prepare(int cpu, int phys_id)
{
	struct intel_uncore_type *type;
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_box *box;
	int i, j;

	for (i = 0; msr_uncores[i]; i++) {
		type = msr_uncores[i];
		for (j = 0; j < type->num_boxes; j++) {
			pmu = &type->pmus[j];
			if (pmu->func_id < 0)
				pmu->func_id = j;

			box = uncore_alloc_box(type, cpu);
			if (!box)
				return -ENOMEM;

			box->pmu = pmu;
			box->phys_id = phys_id;
			*per_cpu_ptr(pmu->box, cpu) = box;
		}
	}
	return 0;
}

static void __cpuinit
uncore_change_context(struct intel_uncore_type **uncores, int old_cpu, int new_cpu)
{
	struct intel_uncore_type *type;
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_box *box;
	int i, j;

	for (i = 0; uncores[i]; i++) {
		type = uncores[i];
		for (j = 0; j < type->num_boxes; j++) {
			pmu = &type->pmus[j];
			if (old_cpu < 0)
				box = uncore_pmu_to_box(pmu, new_cpu);
			else
				box = uncore_pmu_to_box(pmu, old_cpu);
			if (!box)
				continue;

			if (old_cpu < 0) {
				WARN_ON_ONCE(box->cpu != -1);
				box->cpu = new_cpu;
				continue;
			}

			WARN_ON_ONCE(box->cpu != old_cpu);
			if (new_cpu >= 0) {
				uncore_pmu_cancel_hrtimer(box);
				perf_pmu_migrate_context(&pmu->pmu,
						old_cpu, new_cpu);
				box->cpu = new_cpu;
			} else {
				box->cpu = -1;
			}
		}
	}
}

static void __cpuinit uncore_event_exit_cpu(int cpu)
{
	int i, phys_id, target;

	/* if exiting cpu is used for collecting uncore events */
	if (!cpumask_test_and_clear_cpu(cpu, &uncore_cpu_mask))
		return;

	/* find a new cpu to collect uncore events */
	phys_id = topology_physical_package_id(cpu);
	target = -1;
	for_each_online_cpu(i) {
		if (i == cpu)
			continue;
		if (phys_id == topology_physical_package_id(i)) {
			target = i;
			break;
		}
	}

	/* migrate uncore events to the new cpu */
	if (target >= 0)
		cpumask_set_cpu(target, &uncore_cpu_mask);

	uncore_change_context(msr_uncores, cpu, target);
	uncore_change_context(pci_uncores, cpu, target);
}

static void __cpuinit uncore_event_init_cpu(int cpu)
{
	int i, phys_id;

	phys_id = topology_physical_package_id(cpu);
	for_each_cpu(i, &uncore_cpu_mask) {
		if (phys_id == topology_physical_package_id(i))
			return;
	}

	cpumask_set_cpu(cpu, &uncore_cpu_mask);

	uncore_change_context(msr_uncores, -1, cpu);
	uncore_change_context(pci_uncores, -1, cpu);
}

static int __cpuinit
uncore_cpu_notifier(struct notifier_block *self, unsigned long action, void *hcpu)
{
	unsigned int cpu = (long)hcpu;

	/* allocate/free data structure for uncore box */
	switch (action & ~CPU_TASKS_FROZEN) {
	case CPU_UP_PREPARE:
		uncore_cpu_prepare(cpu, -1);
		break;
	case CPU_STARTING:
		uncore_cpu_starting(cpu);
		break;
	case CPU_UP_CANCELED:
	case CPU_DYING:
		uncore_cpu_dying(cpu);
		break;
	case CPU_ONLINE:
	case CPU_DEAD:
		uncore_kfree_boxes();
		break;
	default:
		break;
	}

	/* select the cpu that collects uncore events */
	switch (action & ~CPU_TASKS_FROZEN) {
	case CPU_DOWN_FAILED:
	case CPU_STARTING:
		uncore_event_init_cpu(cpu);
		break;
	case CPU_DOWN_PREPARE:
		uncore_event_exit_cpu(cpu);
		break;
	default:
		break;
	}

	return NOTIFY_OK;
}

static struct notifier_block uncore_cpu_nb __cpuinitdata = {
	.notifier_call	= uncore_cpu_notifier,
	/*
	 * to migrate uncore events, our notifier should be executed
	 * before perf core's notifier.
	 */
	.priority	= CPU_PRI_PERF + 1,
};
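/*
 * Hotplug walk-through (cpu numbers illustrative): if cpu 8 owns the
 * events for package 1 and is taken down, CPU_DOWN_PREPARE runs
 * uncore_event_exit_cpu(8), which picks another online cpu in package 1
 * -- say cpu 9 -- and perf_pmu_migrate_context() moves the events
 * there.  Running at CPU_PRI_PERF + 1 guarantees this happens before
 * perf core's own notifier tears the context down.
 */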
static void __init uncore_cpu_setup(void *dummy)
{
	uncore_cpu_starting(smp_processor_id());
}

static int __init uncore_cpu_init(void)
{
	int ret, cpu, max_cores;

	max_cores = boot_cpu_data.x86_max_cores;
	switch (boot_cpu_data.x86_model) {
	case 26: /* Nehalem */
	case 30:
	case 37: /* Westmere */
	case 44:
		msr_uncores = nhm_msr_uncores;
		break;
	case 42: /* Sandy Bridge */
	case 58: /* Ivy Bridge */
		if (snb_uncore_cbox.num_boxes > max_cores)
			snb_uncore_cbox.num_boxes = max_cores;
		msr_uncores = snb_msr_uncores;
		break;
	case 45: /* Sandy Bridge-EP */
		if (snbep_uncore_cbox.num_boxes > max_cores)
			snbep_uncore_cbox.num_boxes = max_cores;
		msr_uncores = snbep_msr_uncores;
		break;
	case 46: /* Nehalem-EX */
		uncore_nhmex = true;
	case 47: /* Westmere-EX aka. Xeon E7 */
		if (!uncore_nhmex)
			nhmex_uncore_mbox.event_descs = wsmex_uncore_mbox_events;
		if (nhmex_uncore_cbox.num_boxes > max_cores)
			nhmex_uncore_cbox.num_boxes = max_cores;
		msr_uncores = nhmex_msr_uncores;
		break;
	case 62: /* IvyTown */
		if (ivt_uncore_cbox.num_boxes > max_cores)
			ivt_uncore_cbox.num_boxes = max_cores;
		msr_uncores = ivt_msr_uncores;
		break;
	default:
		return 0;
	}

	ret = uncore_types_init(msr_uncores);
	if (ret)
		return ret;

	get_online_cpus();

	for_each_online_cpu(cpu) {
		int i, phys_id = topology_physical_package_id(cpu);

		for_each_cpu(i, &uncore_cpu_mask) {
			if (phys_id == topology_physical_package_id(i)) {
				phys_id = -1;
				break;
			}
		}
		if (phys_id < 0)
			continue;

		uncore_cpu_prepare(cpu, phys_id);
		uncore_event_init_cpu(cpu);
	}
	on_each_cpu(uncore_cpu_setup, NULL, 1);

	register_cpu_notifier(&uncore_cpu_nb);

	put_online_cpus();

	return 0;
}

static int __init uncore_pmus_register(void)
{
	struct intel_uncore_pmu *pmu;
	struct intel_uncore_type *type;
	int i, j;

	for (i = 0; msr_uncores[i]; i++) {
		type = msr_uncores[i];
		for (j = 0; j < type->num_boxes; j++) {
			pmu = &type->pmus[j];
			uncore_pmu_register(pmu);
		}
	}

	for (i = 0; pci_uncores[i]; i++) {
		type = pci_uncores[i];
		for (j = 0; j < type->num_boxes; j++) {
			pmu = &type->pmus[j];
			uncore_pmu_register(pmu);
		}
	}

	return 0;
}

static int __init intel_uncore_init(void)
{
	int ret;

	if (boot_cpu_data.x86_vendor != X86_VENDOR_INTEL)
		return -ENODEV;

	if (cpu_has_hypervisor)
		return -ENODEV;

	ret = uncore_pci_init();
	if (ret)
		goto fail;
	ret = uncore_cpu_init();
	if (ret) {
		uncore_pci_exit();
		goto fail;
	}

	uncore_pmus_register();
	return 0;
fail:
	return ret;
}
device_initcall(intel_uncore_init);