4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
23 * Use is subject to license terms.
26 * Copyright (c) 2009, Intel Corporation.
27 * All Rights Reserved.
33 #include <sys/promif.h>
34 #include <sys/cpuvar.h>
35 #include <sys/taskq.h>
44 * CPU power management data
47 * Data related to a particular speed.
49 * All per speed data nodes for a CPU are linked together using down_spd.
50 * The link list is ordered with first node containing data for
51 * normal (maximum) speed. up_spd points to the next speed up. Currently
52 * all up_spd's point to the normal speed but this can be changed in future.
53 * quant_cnt is the number of ticks when monitoring system will be called
54 * next. There are different quant_cnt for different speeds.
56 * Note that 'speed' has different meaning depending upon the platform.
57 * On SPARC, the speed is really a divisor of the maximum speed (e.g., a speed
58 * of 2 means that it's 1/2 the maximum speed). On x86, speed is a processor
61 typedef struct cpudrv_pm_spd
{
62 uint_t speed
; /* platform dependent notion */
63 uint_t quant_cnt
; /* quantum count in ticks */
64 struct cpudrv_pm_spd
*down_spd
; /* ptr to next speed down */
65 struct cpudrv_pm_spd
*up_spd
; /* ptr to next speed up */
66 uint_t idle_hwm
; /* down if idle thread >= hwm */
67 uint_t idle_lwm
; /* up if idle thread < lwm */
68 uint_t idle_bhwm_cnt
; /* # of iters idle is < hwm */
69 uint_t idle_blwm_cnt
; /* # of iters idle is < lwm */
70 uint_t user_hwm
; /* up if user thread > hwm */
71 int user_lwm
; /* down if user thread <= lwm */
72 int pm_level
; /* power level for framework */
76 * Power management data
78 typedef struct cpudrv_pm
{
79 cpudrv_pm_spd_t
*head_spd
; /* ptr to head of speed */
80 cpudrv_pm_spd_t
*cur_spd
; /* ptr to current speed */
81 uint_t num_spd
; /* number of speeds */
82 hrtime_t lastquan_mstate
[NCMSTATES
]; /* last quantum's mstate */
83 clock_t lastquan_ticks
; /* last quantum's clock tick */
84 int pm_busycnt
; /* pm_busy_component() count */
85 ddi_taskq_t
*tq
; /* taskq handler for CPU monitor */
86 timeout_id_t timeout_id
; /* cpudrv_monitor()'s timeout_id */
87 int timeout_count
; /* count dispatched timeouts */
88 kmutex_t timeout_lock
; /* protect timeout_count */
89 kcondvar_t timeout_cv
; /* wait on timeout_count change */
91 kthread_t
*pm_governor_thread
; /* governor thread */
92 cpudrv_pm_spd_t
*top_spd
; /* ptr to effective head speed */
94 boolean_t pm_started
; /* PM really started */
98 * Idle & user threads water marks in percentage
101 #define CPUDRV_IDLE_HWM 85 /* idle high water mark */
102 #define CPUDRV_IDLE_LWM 70 /* idle low water mark */
103 #define CPUDRV_IDLE_BLWM_CNT_MAX 1 /* # of iters idle can be < lwm */
104 #define CPUDRV_IDLE_BHWM_CNT_MAX 1 /* # of iters idle can be < hwm */
106 #define CPUDRV_IDLE_HWM 98 /* idle high water mark */
107 #define CPUDRV_IDLE_LWM 8 /* idle low water mark */
108 #define CPUDRV_IDLE_BLWM_CNT_MAX 2 /* # of iters idle can be < lwm */
109 #define CPUDRV_IDLE_BHWM_CNT_MAX 2 /* # of iters idle can be < hwm */
111 #define CPUDRV_USER_HWM 20 /* user high water mark */
112 #define CPUDRV_IDLE_BUF_ZONE 4 /* buffer zone when going down */
116 * Maximums for creating 'pm-components' property
118 #define CPUDRV_COMP_MAX_DIG 4 /* max digits in power level */
120 #define CPUDRV_COMP_MAX_VAL 9999 /* max value in above digits */
123 * Component number for calls to PM framework
125 #define CPUDRV_COMP_NUM 0 /* first component is 0 */
128 * Quantum counts for normal and other clock speeds in terms of ticks.
130 * In determining the quantum count, we need to balance two opposing factors:
132 * 1) Minimal delay when user start using the CPU that is in low
133 * power mode -- requires that we monitor more frequently,
135 * 2) Extra code executed because of frequent monitoring -- requires
136 * that we monitor less frequently.
138 * We reach a tradeoff between these two requirements by monitoring
139 * more frequently when we are in low speed mode (CPUDRV_QUANT_CNT_OTHR)
140 * so we can bring the CPU up without user noticing it. Moreover, at low
141 * speed we are not using CPU much so extra code execution should be fine.
142 * Since we are in no hurry to bring CPU down and at normal speed and we
143 * might really be using the CPU fully, we monitor less frequently
144 * (CPUDRV_QUANT_CNT_NORMAL).
147 #define CPUDRV_QUANT_CNT_NORMAL (hz * 1) /* 1 sec */
149 #define CPUDRV_QUANT_CNT_NORMAL (hz * 5) /* 5 sec */
151 #define CPUDRV_QUANT_CNT_OTHR (hz * 1) /* 1 sec */
156 #define CPUDRV_TASKQ_THREADS 1 /* # threads to run CPU monitor */
157 #define CPUDRV_TASKQ_MIN 2 /* min # of taskq entries */
158 #define CPUDRV_TASKQ_MAX 2 /* max # of taskq entries */
162 * Device driver state structure
164 typedef struct cpudrv_devstate
{
165 dev_info_t
*dip
; /* devinfo handle */
166 cpu_t
*cp
; /* CPU data for this node */
167 processorid_t cpu_id
; /* CPU number for this node */
168 cpudrv_pm_t cpudrv_pm
; /* power management data */
169 kmutex_t lock
; /* protects state struct */
172 extern void *cpudrv_state
;
173 extern boolean_t cpudrv_enabled
;
176 * Debugging definitions
179 #define D_INIT 0x00000001
180 #define D_FINI 0x00000002
181 #define D_ATTACH 0x00000004
182 #define D_DETACH 0x00000008
183 #define D_POWER 0x00000010
184 #define D_PM_INIT 0x00000020
185 #define D_PM_FREE 0x00000040
186 #define D_PM_COMP_CREATE 0x00000080
187 #define D_PM_MONITOR 0x00000100
188 #define D_PM_MONITOR_VERBOSE 0x00000200
189 #define D_PM_MONITOR_DELAY 0x00000400
191 extern uint_t cpudrv_debug
;
193 #define _PRINTF prom_printf
194 #define DPRINTF(flag, args) if (cpudrv_debug & flag) _PRINTF args;
196 #define DPRINTF(flag, args)
199 extern int cpudrv_change_speed(cpudrv_devstate_t
*, cpudrv_pm_spd_t
*);
200 extern boolean_t
cpudrv_get_cpu_id(dev_info_t
*, processorid_t
*);
201 extern boolean_t
cpudrv_is_governor_thread(cpudrv_pm_t
*);
202 extern boolean_t
cpudrv_mach_init(cpudrv_devstate_t
*);
203 extern boolean_t
cpudrv_mach_fini(cpudrv_devstate_t
*);
204 extern boolean_t
cpudrv_power_ready(cpu_t
*);
205 extern boolean_t
cpudrv_is_enabled(cpudrv_devstate_t
*);
206 extern void cpudrv_set_supp_freqs(cpudrv_devstate_t
*);
207 extern int cpudrv_get_cpu(cpudrv_devstate_t
*);
215 #endif /* _SYS_CPUDRV_H */