kernel - Fix some rare pmap races in i386 and x86_64.
[dragonfly.git] / sys / platform / pc32 / i386 / perfmon.c
blob55034982c728dffeda7078c65b851fee32a475a4
1 /*
2 * Copyright 1996 Massachusetts Institute of Technology
4 * Permission to use, copy, modify, and distribute this software and
5 * its documentation for any purpose and without fee is hereby
6 * granted, provided that both the above copyright notice and this
7 * permission notice appear in all copies, that both the above
8 * copyright notice and this permission notice appear in all
9 * supporting documentation, and that the name of M.I.T. not be used
10 * in advertising or publicity pertaining to distribution of the
11 * software without specific, written prior permission. M.I.T. makes
12 * no representations about the suitability of this software for any
13 * purpose. It is provided "as is" without express or implied
14 * warranty.
16 * THIS SOFTWARE IS PROVIDED BY M.I.T. ``AS IS''. M.I.T. DISCLAIMS
17 * ALL EXPRESS OR IMPLIED WARRANTIES WITH REGARD TO THIS SOFTWARE,
18 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
19 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT
20 * SHALL M.I.T. BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
23 * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
24 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
25 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
26 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
29 * $FreeBSD: src/sys/i386/i386/perfmon.c,v 1.21 1999/09/25 18:24:04 phk Exp $
30 * $DragonFly: src/sys/platform/pc32/i386/perfmon.c,v 1.11 2008/05/10 17:24:07 dillon Exp $
33 #include <sys/param.h>
34 #include <sys/systm.h>
35 #include <sys/kernel.h>
36 #include <sys/conf.h>
37 #include <sys/device.h>
38 #include <sys/fcntl.h>
39 #include <sys/lock.h>
41 #ifndef SMP
42 #include <machine/cputypes.h>
43 #endif
44 #include <machine/clock.h>
45 #include <machine/perfmon.h>
47 static int perfmon_inuse;
48 static int perfmon_cpuok;
49 #ifndef SMP
50 static int msr_ctl[NPMC];
51 #endif
52 static int msr_pmc[NPMC];
53 static unsigned int ctl_shadow[NPMC];
54 static quad_t pmc_shadow[NPMC]; /* used when ctr is stopped on P5 */
55 static int (*writectl)(int);
56 #ifndef SMP
57 static int writectl5(int);
58 static int writectl6(int);
59 #endif
61 static d_close_t perfmon_close;
62 static d_open_t perfmon_open;
63 static d_ioctl_t perfmon_ioctl;
65 #define CDEV_MAJOR 2 /* We're really a minor of mem.c */
66 static struct dev_ops perfmon_ops = {
67 { "perfmon", CDEV_MAJOR, 0 },
68 .d_open = perfmon_open,
69 .d_close = perfmon_close,
70 .d_ioctl = perfmon_ioctl,
74 * Initialize the device ops for user access to the perfmon. This must
75 * be done late in the boot sequence.
77 * NOTE: The perfmon is really a minor of the mem major. Perfmon
78 * gets 32-47.
80 static void
81 perfmon_driver_init(void *unused __unused)
83 make_dev(&perfmon_ops, 32, UID_ROOT, GID_KMEM, 0640, "perfmon");
86 SYSINIT(perfmondrv, SI_SUB_DRIVERS, SI_ORDER_ANY, perfmon_driver_init, NULL)
89 * This is called in early boot, after cpu_class has been set up.
91 void
92 perfmon_init(void)
94 #ifndef SMP
95 switch(cpu_class) {
96 case CPUCLASS_586:
97 perfmon_cpuok = 1;
98 msr_ctl[0] = 0x11;
99 msr_ctl[1] = 0x11;
100 msr_pmc[0] = 0x12;
101 msr_pmc[1] = 0x13;
102 writectl = writectl5;
103 break;
104 case CPUCLASS_686:
105 perfmon_cpuok = 1;
106 msr_ctl[0] = 0x186;
107 msr_ctl[1] = 0x187;
108 msr_pmc[0] = 0xc1;
109 msr_pmc[1] = 0xc2;
110 writectl = writectl6;
111 break;
113 default:
114 perfmon_cpuok = 0;
115 break;
117 #endif /* SMP */
121 perfmon_avail(void)
123 return perfmon_cpuok;
127 perfmon_setup(int pmc, unsigned int control)
129 if (pmc < 0 || pmc >= NPMC)
130 return EINVAL;
132 perfmon_inuse |= (1 << pmc);
133 control &= ~(PMCF_SYS_FLAGS << 16);
134 mpintr_lock(); /* doesn't have to be mpintr_lock YYY */
135 ctl_shadow[pmc] = control;
136 writectl(pmc);
137 wrmsr(msr_pmc[pmc], pmc_shadow[pmc] = 0);
138 mpintr_unlock();
139 return 0;
143 perfmon_get(int pmc, unsigned int *control)
145 if (pmc < 0 || pmc >= NPMC)
146 return EINVAL;
148 if (perfmon_inuse & (1 << pmc)) {
149 *control = ctl_shadow[pmc];
150 return 0;
152 return EBUSY; /* XXX reversed sense */
156 perfmon_fini(int pmc)
158 if (pmc < 0 || pmc >= NPMC)
159 return EINVAL;
161 if (perfmon_inuse & (1 << pmc)) {
162 perfmon_stop(pmc);
163 ctl_shadow[pmc] = 0;
164 perfmon_inuse &= ~(1 << pmc);
165 return 0;
167 return EBUSY; /* XXX reversed sense */
171 perfmon_start(int pmc)
173 if (pmc < 0 || pmc >= NPMC)
174 return EINVAL;
176 if (perfmon_inuse & (1 << pmc)) {
177 mpintr_lock(); /* doesn't have to be mpintr YYY */
178 ctl_shadow[pmc] |= (PMCF_EN << 16);
179 wrmsr(msr_pmc[pmc], pmc_shadow[pmc]);
180 writectl(pmc);
181 mpintr_unlock();
182 return 0;
184 return EBUSY;
188 perfmon_stop(int pmc)
190 if (pmc < 0 || pmc >= NPMC)
191 return EINVAL;
193 if (perfmon_inuse & (1 << pmc)) {
194 mpintr_lock();
195 pmc_shadow[pmc] = rdmsr(msr_pmc[pmc]) & 0xffffffffffULL;
196 ctl_shadow[pmc] &= ~(PMCF_EN << 16);
197 writectl(pmc);
198 mpintr_unlock();
199 return 0;
201 return EBUSY;
205 perfmon_read(int pmc, quad_t *val)
207 if (pmc < 0 || pmc >= NPMC)
208 return EINVAL;
210 if (perfmon_inuse & (1 << pmc)) {
211 if (ctl_shadow[pmc] & (PMCF_EN << 16))
212 *val = rdmsr(msr_pmc[pmc]) & 0xffffffffffULL;
213 else
214 *val = pmc_shadow[pmc];
215 return 0;
218 return EBUSY;
222 perfmon_reset(int pmc)
224 if (pmc < 0 || pmc >= NPMC)
225 return EINVAL;
227 if (perfmon_inuse & (1 << pmc)) {
228 wrmsr(msr_pmc[pmc], pmc_shadow[pmc] = 0);
229 return 0;
231 return EBUSY;
234 #ifndef SMP
236 * Unfortunately, the performance-monitoring registers are laid out
237 * differently in the P5 and P6. We keep everything in P6 format
238 * internally (except for the event code), and convert to P5
239 * format as needed on those CPUs. The writectl function pointer
240 * is set up to point to one of these functions by perfmon_init().
243 writectl6(int pmc)
245 if (pmc > 0 && !(ctl_shadow[pmc] & (PMCF_EN << 16))) {
246 wrmsr(msr_ctl[pmc], 0);
247 } else {
248 wrmsr(msr_ctl[pmc], ctl_shadow[pmc]);
250 return 0;
253 #define P5FLAG_P 0x200
254 #define P5FLAG_E 0x100
255 #define P5FLAG_USR 0x80
256 #define P5FLAG_OS 0x40
259 writectl5(int pmc)
261 quad_t newval = 0;
263 if (ctl_shadow[1] & (PMCF_EN << 16)) {
264 if (ctl_shadow[1] & (PMCF_USR << 16))
265 newval |= P5FLAG_USR << 16;
266 if (ctl_shadow[1] & (PMCF_OS << 16))
267 newval |= P5FLAG_OS << 16;
268 if (!(ctl_shadow[1] & (PMCF_E << 16)))
269 newval |= P5FLAG_E << 16;
270 newval |= (ctl_shadow[1] & 0x3f) << 16;
272 if (ctl_shadow[0] & (PMCF_EN << 16)) {
273 if (ctl_shadow[0] & (PMCF_USR << 16))
274 newval |= P5FLAG_USR;
275 if (ctl_shadow[0] & (PMCF_OS << 16))
276 newval |= P5FLAG_OS;
277 if (!(ctl_shadow[0] & (PMCF_E << 16)))
278 newval |= P5FLAG_E;
279 newval |= ctl_shadow[0] & 0x3f;
282 wrmsr(msr_ctl[0], newval);
283 return 0; /* XXX should check for unimplemented bits */
285 #endif /* !SMP */
288 * Now the user-mode interface, called from a subdevice of mem.c.
290 static int writer;
291 static int writerpmc;
293 static int
294 perfmon_open(struct dev_open_args *ap)
296 if (!perfmon_cpuok)
297 return ENXIO;
299 if (ap->a_oflags & FWRITE) {
300 if (writer) {
301 return EBUSY;
302 } else {
303 writer = 1;
304 writerpmc = 0;
307 return 0;
310 static int
311 perfmon_close(struct dev_close_args *ap)
313 if (ap->a_fflag & FWRITE) {
314 int i;
316 for (i = 0; i < NPMC; i++) {
317 if (writerpmc & (1 << i))
318 perfmon_fini(i);
320 writer = 0;
322 return 0;
325 static int
326 perfmon_ioctl(struct dev_ioctl_args *ap)
328 caddr_t param = ap->a_data;
329 struct pmc *pmc;
330 struct pmc_data *pmcd;
331 struct pmc_tstamp *pmct;
332 int *ip;
333 int rv;
335 switch(ap->a_cmd) {
336 case PMIOSETUP:
337 if (!(ap->a_fflag & FWRITE))
338 return EPERM;
339 pmc = (struct pmc *)param;
341 rv = perfmon_setup(pmc->pmc_num, pmc->pmc_val);
342 if (!rv) {
343 writerpmc |= (1 << pmc->pmc_num);
345 break;
347 case PMIOGET:
348 pmc = (struct pmc *)param;
349 rv = perfmon_get(pmc->pmc_num, &pmc->pmc_val);
350 break;
352 case PMIOSTART:
353 if (!(ap->a_fflag & FWRITE))
354 return EPERM;
356 ip = (int *)param;
357 rv = perfmon_start(*ip);
358 break;
360 case PMIOSTOP:
361 if (!(ap->a_fflag & FWRITE))
362 return EPERM;
364 ip = (int *)param;
365 rv = perfmon_stop(*ip);
366 break;
368 case PMIORESET:
369 if (!(ap->a_fflag & FWRITE))
370 return EPERM;
372 ip = (int *)param;
373 rv = perfmon_reset(*ip);
374 break;
376 case PMIOREAD:
377 pmcd = (struct pmc_data *)param;
378 rv = perfmon_read(pmcd->pmcd_num, &pmcd->pmcd_value);
379 break;
381 case PMIOTSTAMP:
382 if (tsc_frequency == 0) {
383 rv = ENOTTY;
384 break;
386 pmct = (struct pmc_tstamp *)param;
387 /* XXX interface loses precision. */
388 pmct->pmct_rate = (int)(tsc_frequency / 1000000);
389 pmct->pmct_value = rdtsc();
390 rv = 0;
391 break;
392 default:
393 rv = ENOTTY;
396 return rv;