]> bbs.cooldavid.org Git - net-next-2.6.git/blame - drivers/acpi/processor_idle.c
ACPI: acpi_idle: touch TS_POLLING only in the non-MWAIT case
[net-next-2.6.git] / drivers / acpi / processor_idle.c
CommitLineData
1da177e4
LT
1/*
2 * processor_idle - idle state submodule to the ACPI processor driver
3 *
4 * Copyright (C) 2001, 2002 Andy Grover <andrew.grover@intel.com>
5 * Copyright (C) 2001, 2002 Paul Diefenbaugh <paul.s.diefenbaugh@intel.com>
c5ab81ca 6 * Copyright (C) 2004, 2005 Dominik Brodowski <linux@brodo.de>
1da177e4
LT
7 * Copyright (C) 2004 Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com>
8 * - Added processor hotplug support
02df8b93
VP
9 * Copyright (C) 2005 Venkatesh Pallipadi <venkatesh.pallipadi@intel.com>
10 * - Added support for C3 on SMP
1da177e4
LT
11 *
12 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
13 *
14 * This program is free software; you can redistribute it and/or modify
15 * it under the terms of the GNU General Public License as published by
16 * the Free Software Foundation; either version 2 of the License, or (at
17 * your option) any later version.
18 *
19 * This program is distributed in the hope that it will be useful, but
20 * WITHOUT ANY WARRANTY; without even the implied warranty of
21 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
22 * General Public License for more details.
23 *
24 * You should have received a copy of the GNU General Public License along
25 * with this program; if not, write to the Free Software Foundation, Inc.,
26 * 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA.
27 *
28 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
29 */
30
31#include <linux/kernel.h>
32#include <linux/module.h>
33#include <linux/init.h>
34#include <linux/cpufreq.h>
5a0e3ad6 35#include <linux/slab.h>
1da177e4
LT
36#include <linux/proc_fs.h>
37#include <linux/seq_file.h>
38#include <linux/acpi.h>
39#include <linux/dmi.h>
40#include <linux/moduleparam.h>
4e57b681 41#include <linux/sched.h> /* need_resched() */
f011e2e2 42#include <linux/pm_qos_params.h>
e9e2cdb4 43#include <linux/clockchips.h>
4f86d3a8 44#include <linux/cpuidle.h>
ba84be23 45#include <linux/irqflags.h>
1da177e4 46
3434933b
TG
47/*
48 * Include the apic definitions for x86 to have the APIC timer related defines
49 * available also for UP (on SMP it gets magically included via linux/smp.h).
50 * asm/acpi.h is not an option, as it would require more include magic. Also
51 * creating an empty asm-ia64/apic.h would just trade pest vs. cholera.
52 */
53#ifdef CONFIG_X86
54#include <asm/apic.h>
55#endif
56
1da177e4
LT
57#include <asm/io.h>
58#include <asm/uaccess.h>
59
60#include <acpi/acpi_bus.h>
61#include <acpi/processor.h>
c1e3b377 62#include <asm/processor.h>
1da177e4 63
a192a958
LB
64#define PREFIX "ACPI: "
65
1da177e4 66#define ACPI_PROCESSOR_CLASS "processor"
1da177e4 67#define _COMPONENT ACPI_PROCESSOR_COMPONENT
f52fd66d 68ACPI_MODULE_NAME("processor_idle");
1da177e4 69#define ACPI_PROCESSOR_FILE_POWER "power"
2aa44d05 70#define PM_TIMER_TICK_NS (1000000000ULL/PM_TIMER_FREQUENCY)
4f86d3a8
LB
71#define C2_OVERHEAD 1 /* 1us */
72#define C3_OVERHEAD 1 /* 1us */
4f86d3a8 73#define PM_TIMER_TICKS_TO_US(p) (((p) * 1000)/(PM_TIMER_FREQUENCY/1000))
1da177e4 74
4f86d3a8
LB
75static unsigned int max_cstate __read_mostly = ACPI_PROCESSOR_MAX_POWER;
76module_param(max_cstate, uint, 0000);
b6835052 77static unsigned int nocst __read_mostly;
1da177e4
LT
78module_param(nocst, uint, 0000);
79
25de5718 80static unsigned int latency_factor __read_mostly = 2;
4963f620 81module_param(latency_factor, uint, 0644);
1da177e4 82
ff69f2bb 83static s64 us_to_pm_timer_ticks(s64 t)
84{
85 return div64_u64(t * PM_TIMER_FREQUENCY, 1000000);
86}
1da177e4
LT
87/*
88 * IBM ThinkPad R40e crashes mysteriously when going into C2 or C3.
89 * For now disable this. Probably a bug somewhere else.
90 *
91 * To skip this limit, boot/load with a large max_cstate limit.
92 */
1855256c 93static int set_max_cstate(const struct dmi_system_id *id)
1da177e4
LT
94{
95 if (max_cstate > ACPI_PROCESSOR_MAX_POWER)
96 return 0;
97
3d35600a 98 printk(KERN_NOTICE PREFIX "%s detected - limiting to C%ld max_cstate."
4be44fcd
LB
99 " Override with \"processor.max_cstate=%d\"\n", id->ident,
100 (long)id->driver_data, ACPI_PROCESSOR_MAX_POWER + 1);
1da177e4 101
3d35600a 102 max_cstate = (long)id->driver_data;
1da177e4
LT
103
104 return 0;
105}
106
7ded5689
AR
107/* Actually this shouldn't be __cpuinitdata, would be better to fix the
108 callers to only run once -AK */
109static struct dmi_system_id __cpuinitdata processor_power_dmi_table[] = {
876c184b
TR
110 { set_max_cstate, "Clevo 5600D", {
111 DMI_MATCH(DMI_BIOS_VENDOR,"Phoenix Technologies LTD"),
112 DMI_MATCH(DMI_BIOS_VERSION,"SHE845M0.86C.0013.D.0302131307")},
4be44fcd 113 (void *)2},
370d5cd8
AV
114 { set_max_cstate, "Pavilion zv5000", {
115 DMI_MATCH(DMI_SYS_VENDOR, "Hewlett-Packard"),
116 DMI_MATCH(DMI_PRODUCT_NAME,"Pavilion zv5000 (DS502A#ABA)")},
117 (void *)1},
118 { set_max_cstate, "Asus L8400B", {
119 DMI_MATCH(DMI_SYS_VENDOR, "ASUSTeK Computer Inc."),
120 DMI_MATCH(DMI_PRODUCT_NAME,"L8400B series Notebook PC")},
121 (void *)1},
1da177e4
LT
122 {},
123};
124
4f86d3a8 125
2e906655 126/*
127 * Callers should disable interrupts before the call and enable
128 * interrupts after return.
129 */
ddc081a1
VP
130static void acpi_safe_halt(void)
131{
132 current_thread_info()->status &= ~TS_POLLING;
133 /*
134 * TS_POLLING-cleared state must be visible before we
135 * test NEED_RESCHED:
136 */
137 smp_mb();
71e93d15 138 if (!need_resched()) {
ddc081a1 139 safe_halt();
71e93d15
VP
140 local_irq_disable();
141 }
ddc081a1
VP
142 current_thread_info()->status |= TS_POLLING;
143}
144
169a0abb
TG
145#ifdef ARCH_APICTIMER_STOPS_ON_C3
146
147/*
148 * Some BIOS implementations switch to C3 in the published C2 state.
296d93cd
LT
149 * This seems to be a common problem on AMD boxen, but other vendors
150 * are affected too. We pick the most conservative approach: we assume
151 * that the local APIC stops in both C2 and C3.
169a0abb 152 */
7e275cc4 153static void lapic_timer_check_state(int state, struct acpi_processor *pr,
169a0abb
TG
154 struct acpi_processor_cx *cx)
155{
156 struct acpi_processor_power *pwr = &pr->power;
e585bef8 157 u8 type = local_apic_timer_c2_ok ? ACPI_STATE_C3 : ACPI_STATE_C2;
169a0abb 158
db954b58
VP
159 if (cpu_has(&cpu_data(pr->id), X86_FEATURE_ARAT))
160 return;
161
87ad57ba
SL
162 if (boot_cpu_has(X86_FEATURE_AMDC1E))
163 type = ACPI_STATE_C1;
164
169a0abb
TG
165 /*
166 * Check, if one of the previous states already marked the lapic
167 * unstable
168 */
169 if (pwr->timer_broadcast_on_state < state)
170 return;
171
e585bef8 172 if (cx->type >= type)
296d93cd 173 pr->power.timer_broadcast_on_state = state;
169a0abb
TG
174}
175
918aae42 176static void __lapic_timer_propagate_broadcast(void *arg)
169a0abb 177{
f833bab8 178 struct acpi_processor *pr = (struct acpi_processor *) arg;
e9e2cdb4
TG
179 unsigned long reason;
180
181 reason = pr->power.timer_broadcast_on_state < INT_MAX ?
182 CLOCK_EVT_NOTIFY_BROADCAST_ON : CLOCK_EVT_NOTIFY_BROADCAST_OFF;
183
184 clockevents_notify(reason, &pr->id);
e9e2cdb4
TG
185}
186
918aae42
HS
187static void lapic_timer_propagate_broadcast(struct acpi_processor *pr)
188{
189 smp_call_function_single(pr->id, __lapic_timer_propagate_broadcast,
190 (void *)pr, 1);
191}
192
e9e2cdb4 193/* Power(C) State timer broadcast control */
7e275cc4 194static void lapic_timer_state_broadcast(struct acpi_processor *pr,
e9e2cdb4
TG
195 struct acpi_processor_cx *cx,
196 int broadcast)
197{
e9e2cdb4
TG
198 int state = cx - pr->power.states;
199
200 if (state >= pr->power.timer_broadcast_on_state) {
201 unsigned long reason;
202
203 reason = broadcast ? CLOCK_EVT_NOTIFY_BROADCAST_ENTER :
204 CLOCK_EVT_NOTIFY_BROADCAST_EXIT;
205 clockevents_notify(reason, &pr->id);
206 }
169a0abb
TG
207}
208
209#else
210
7e275cc4 211static void lapic_timer_check_state(int state, struct acpi_processor *pr,
169a0abb 212 struct acpi_processor_cx *cstate) { }
7e275cc4
LB
213static void lapic_timer_propagate_broadcast(struct acpi_processor *pr) { }
214static void lapic_timer_state_broadcast(struct acpi_processor *pr,
e9e2cdb4
TG
215 struct acpi_processor_cx *cx,
216 int broadcast)
217{
218}
169a0abb
TG
219
220#endif
221
b04e7bdb
TG
222/*
223 * Suspend / resume control
224 */
225static int acpi_idle_suspend;
815ab0fd
LB
226static u32 saved_bm_rld;
227
228static void acpi_idle_bm_rld_save(void)
229{
230 acpi_read_bit_register(ACPI_BITREG_BUS_MASTER_RLD, &saved_bm_rld);
231}
232static void acpi_idle_bm_rld_restore(void)
233{
234 u32 resumed_bm_rld;
235
236 acpi_read_bit_register(ACPI_BITREG_BUS_MASTER_RLD, &resumed_bm_rld);
237
238 if (resumed_bm_rld != saved_bm_rld)
239 acpi_write_bit_register(ACPI_BITREG_BUS_MASTER_RLD, saved_bm_rld);
240}
b04e7bdb
TG
241
242int acpi_processor_suspend(struct acpi_device * device, pm_message_t state)
243{
815ab0fd
LB
244 if (acpi_idle_suspend == 1)
245 return 0;
246
247 acpi_idle_bm_rld_save();
b04e7bdb
TG
248 acpi_idle_suspend = 1;
249 return 0;
250}
251
252int acpi_processor_resume(struct acpi_device * device)
253{
815ab0fd
LB
254 if (acpi_idle_suspend == 0)
255 return 0;
256
257 acpi_idle_bm_rld_restore();
b04e7bdb
TG
258 acpi_idle_suspend = 0;
259 return 0;
260}
261
61331168 262#if defined (CONFIG_GENERIC_TIME) && defined (CONFIG_X86)
520daf72 263static void tsc_check_state(int state)
ddb25f9a
AK
264{
265 switch (boot_cpu_data.x86_vendor) {
266 case X86_VENDOR_AMD:
40fb1715 267 case X86_VENDOR_INTEL:
ddb25f9a
AK
268 /*
269 * AMD Fam10h TSC will tick in all
270 * C/P/S0/S1 states when this bit is set.
271 */
40fb1715 272 if (boot_cpu_has(X86_FEATURE_NONSTOP_TSC))
520daf72 273 return;
40fb1715 274
ddb25f9a 275 /*FALL THROUGH*/
ddb25f9a 276 default:
520daf72
LB
277 /* TSC could halt in idle, so notify users */
278 if (state > ACPI_STATE_C1)
279 mark_tsc_unstable("TSC halts in idle");
ddb25f9a
AK
280 }
281}
520daf72
LB
282#else
283static void tsc_check_state(int state) { return; }
ddb25f9a
AK
284#endif
285
4be44fcd 286static int acpi_processor_get_power_info_fadt(struct acpi_processor *pr)
1da177e4 287{
1da177e4
LT
288
289 if (!pr)
d550d98d 290 return -EINVAL;
1da177e4
LT
291
292 if (!pr->pblk)
d550d98d 293 return -ENODEV;
1da177e4 294
1da177e4 295 /* if info is obtained from pblk/fadt, type equals state */
1da177e4
LT
296 pr->power.states[ACPI_STATE_C2].type = ACPI_STATE_C2;
297 pr->power.states[ACPI_STATE_C3].type = ACPI_STATE_C3;
298
4c033552
VP
299#ifndef CONFIG_HOTPLUG_CPU
300 /*
301 * Check for P_LVL2_UP flag before entering C2 and above on
4f86d3a8 302 * an SMP system.
4c033552 303 */
ad71860a 304 if ((num_online_cpus() > 1) &&
cee324b1 305 !(acpi_gbl_FADT.flags & ACPI_FADT_C2_MP_SUPPORTED))
d550d98d 306 return -ENODEV;
4c033552
VP
307#endif
308
1da177e4
LT
309 /* determine C2 and C3 address from pblk */
310 pr->power.states[ACPI_STATE_C2].address = pr->pblk + 4;
311 pr->power.states[ACPI_STATE_C3].address = pr->pblk + 5;
312
313 /* determine latencies from FADT */
cee324b1
AS
314 pr->power.states[ACPI_STATE_C2].latency = acpi_gbl_FADT.C2latency;
315 pr->power.states[ACPI_STATE_C3].latency = acpi_gbl_FADT.C3latency;
1da177e4 316
5d76b6f6
LB
317 /*
318 * FADT specified C2 latency must be less than or equal to
319 * 100 microseconds.
320 */
321 if (acpi_gbl_FADT.C2latency > ACPI_PROCESSOR_MAX_C2_LATENCY) {
322 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
323 "C2 latency too large [%d]\n", acpi_gbl_FADT.C2latency));
324 /* invalidate C2 */
325 pr->power.states[ACPI_STATE_C2].address = 0;
326 }
327
a6d72c18
LB
328 /*
329 * FADT supplied C3 latency must be less than or equal to
330 * 1000 microseconds.
331 */
332 if (acpi_gbl_FADT.C3latency > ACPI_PROCESSOR_MAX_C3_LATENCY) {
333 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
334 "C3 latency too large [%d]\n", acpi_gbl_FADT.C3latency));
335 /* invalidate C3 */
336 pr->power.states[ACPI_STATE_C3].address = 0;
337 }
338
1da177e4
LT
339 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
340 "lvl2[0x%08x] lvl3[0x%08x]\n",
341 pr->power.states[ACPI_STATE_C2].address,
342 pr->power.states[ACPI_STATE_C3].address));
343
d550d98d 344 return 0;
1da177e4
LT
345}
346
991528d7 347static int acpi_processor_get_power_info_default(struct acpi_processor *pr)
acf05f4b 348{
991528d7
VP
349 if (!pr->power.states[ACPI_STATE_C1].valid) {
350 /* set the first C-State to C1 */
351 /* all processors need to support C1 */
352 pr->power.states[ACPI_STATE_C1].type = ACPI_STATE_C1;
353 pr->power.states[ACPI_STATE_C1].valid = 1;
0fda6b40 354 pr->power.states[ACPI_STATE_C1].entry_method = ACPI_CSTATE_HALT;
991528d7
VP
355 }
356 /* the C0 state only exists as a filler in our array */
acf05f4b 357 pr->power.states[ACPI_STATE_C0].valid = 1;
d550d98d 358 return 0;
acf05f4b
VP
359}
360
4be44fcd 361static int acpi_processor_get_power_info_cst(struct acpi_processor *pr)
1da177e4 362{
4be44fcd 363 acpi_status status = 0;
439913ff 364 u64 count;
cf824788 365 int current_count;
4be44fcd
LB
366 int i;
367 struct acpi_buffer buffer = { ACPI_ALLOCATE_BUFFER, NULL };
368 union acpi_object *cst;
1da177e4 369
1da177e4 370
1da177e4 371 if (nocst)
d550d98d 372 return -ENODEV;
1da177e4 373
991528d7 374 current_count = 0;
1da177e4
LT
375
376 status = acpi_evaluate_object(pr->handle, "_CST", NULL, &buffer);
377 if (ACPI_FAILURE(status)) {
378 ACPI_DEBUG_PRINT((ACPI_DB_INFO, "No _CST, giving up\n"));
d550d98d 379 return -ENODEV;
4be44fcd 380 }
1da177e4 381
50dd0969 382 cst = buffer.pointer;
1da177e4
LT
383
384 /* There must be at least 2 elements */
385 if (!cst || (cst->type != ACPI_TYPE_PACKAGE) || cst->package.count < 2) {
6468463a 386 printk(KERN_ERR PREFIX "not enough elements in _CST\n");
1da177e4
LT
387 status = -EFAULT;
388 goto end;
389 }
390
391 count = cst->package.elements[0].integer.value;
392
393 /* Validate number of power states. */
394 if (count < 1 || count != cst->package.count - 1) {
6468463a 395 printk(KERN_ERR PREFIX "count given by _CST is not valid\n");
1da177e4
LT
396 status = -EFAULT;
397 goto end;
398 }
399
1da177e4
LT
400 /* Tell driver that at least _CST is supported. */
401 pr->flags.has_cst = 1;
402
403 for (i = 1; i <= count; i++) {
404 union acpi_object *element;
405 union acpi_object *obj;
406 struct acpi_power_register *reg;
407 struct acpi_processor_cx cx;
408
409 memset(&cx, 0, sizeof(cx));
410
50dd0969 411 element = &(cst->package.elements[i]);
1da177e4
LT
412 if (element->type != ACPI_TYPE_PACKAGE)
413 continue;
414
415 if (element->package.count != 4)
416 continue;
417
50dd0969 418 obj = &(element->package.elements[0]);
1da177e4
LT
419
420 if (obj->type != ACPI_TYPE_BUFFER)
421 continue;
422
4be44fcd 423 reg = (struct acpi_power_register *)obj->buffer.pointer;
1da177e4
LT
424
425 if (reg->space_id != ACPI_ADR_SPACE_SYSTEM_IO &&
4be44fcd 426 (reg->space_id != ACPI_ADR_SPACE_FIXED_HARDWARE))
1da177e4
LT
427 continue;
428
1da177e4 429 /* There should be an easy way to extract an integer... */
50dd0969 430 obj = &(element->package.elements[1]);
1da177e4
LT
431 if (obj->type != ACPI_TYPE_INTEGER)
432 continue;
433
434 cx.type = obj->integer.value;
991528d7
VP
435 /*
436 * Some buggy BIOSes won't list C1 in _CST -
437 * Let acpi_processor_get_power_info_default() handle them later
438 */
439 if (i == 1 && cx.type != ACPI_STATE_C1)
440 current_count++;
441
442 cx.address = reg->address;
443 cx.index = current_count + 1;
444
bc71bec9 445 cx.entry_method = ACPI_CSTATE_SYSTEMIO;
991528d7
VP
446 if (reg->space_id == ACPI_ADR_SPACE_FIXED_HARDWARE) {
447 if (acpi_processor_ffh_cstate_probe
448 (pr->id, &cx, reg) == 0) {
bc71bec9 449 cx.entry_method = ACPI_CSTATE_FFH;
450 } else if (cx.type == ACPI_STATE_C1) {
991528d7
VP
451 /*
452 * C1 is a special case where FIXED_HARDWARE
453 * can be handled in non-MWAIT way as well.
454 * In that case, save this _CST entry info.
991528d7
VP
455 * Otherwise, ignore this info and continue.
456 */
bc71bec9 457 cx.entry_method = ACPI_CSTATE_HALT;
4fcb2fcd 458 snprintf(cx.desc, ACPI_CX_DESC_LEN, "ACPI HLT");
bc71bec9 459 } else {
991528d7
VP
460 continue;
461 }
da5e09a1
ZY
462 if (cx.type == ACPI_STATE_C1 &&
463 (idle_halt || idle_nomwait)) {
c1e3b377
ZY
464 /*
465 * In most cases the C1 space_id obtained from
466 * _CST object is FIXED_HARDWARE access mode.
467 * But when the option of idle=halt is added,
468 * the entry_method type should be changed from
469 * CSTATE_FFH to CSTATE_HALT.
da5e09a1
ZY
470 * When the option of idle=nomwait is added,
471 * the C1 entry_method type should be
472 * CSTATE_HALT.
c1e3b377
ZY
473 */
474 cx.entry_method = ACPI_CSTATE_HALT;
475 snprintf(cx.desc, ACPI_CX_DESC_LEN, "ACPI HLT");
476 }
4fcb2fcd
VP
477 } else {
478 snprintf(cx.desc, ACPI_CX_DESC_LEN, "ACPI IOPORT 0x%x",
479 cx.address);
991528d7 480 }
1da177e4 481
0fda6b40
VP
482 if (cx.type == ACPI_STATE_C1) {
483 cx.valid = 1;
484 }
4fcb2fcd 485
50dd0969 486 obj = &(element->package.elements[2]);
1da177e4
LT
487 if (obj->type != ACPI_TYPE_INTEGER)
488 continue;
489
490 cx.latency = obj->integer.value;
491
50dd0969 492 obj = &(element->package.elements[3]);
1da177e4
LT
493 if (obj->type != ACPI_TYPE_INTEGER)
494 continue;
495
496 cx.power = obj->integer.value;
497
cf824788
JM
498 current_count++;
499 memcpy(&(pr->power.states[current_count]), &cx, sizeof(cx));
500
501 /*
502 * We support total ACPI_PROCESSOR_MAX_POWER - 1
503 * (From 1 through ACPI_PROCESSOR_MAX_POWER - 1)
504 */
505 if (current_count >= (ACPI_PROCESSOR_MAX_POWER - 1)) {
506 printk(KERN_WARNING
507 "Limiting number of power states to max (%d)\n",
508 ACPI_PROCESSOR_MAX_POWER);
509 printk(KERN_WARNING
510 "Please increase ACPI_PROCESSOR_MAX_POWER if needed.\n");
511 break;
512 }
1da177e4
LT
513 }
514
4be44fcd 515 ACPI_DEBUG_PRINT((ACPI_DB_INFO, "Found %d power states\n",
cf824788 516 current_count));
1da177e4
LT
517
518 /* Validate number of power states discovered */
cf824788 519 if (current_count < 2)
6d93c648 520 status = -EFAULT;
1da177e4 521
4be44fcd 522 end:
02438d87 523 kfree(buffer.pointer);
1da177e4 524
d550d98d 525 return status;
1da177e4
LT
526}
527
4be44fcd
LB
528static void acpi_processor_power_verify_c3(struct acpi_processor *pr,
529 struct acpi_processor_cx *cx)
1da177e4 530{
ee1ca48f
PV
531 static int bm_check_flag = -1;
532 static int bm_control_flag = -1;
02df8b93 533
1da177e4
LT
534
535 if (!cx->address)
d550d98d 536 return;
1da177e4 537
1da177e4
LT
538 /*
539 * PIIX4 Erratum #18: We don't support C3 when Type-F (fast)
540 * DMA transfers are used by any ISA device to avoid livelock.
541 * Note that we could disable Type-F DMA (as recommended by
542 * the erratum), but this is known to disrupt certain ISA
543 * devices thus we take the conservative approach.
544 */
545 else if (errata.piix4.fdma) {
546 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
4be44fcd 547 "C3 not supported on PIIX4 with Type-F DMA\n"));
d550d98d 548 return;
1da177e4
LT
549 }
550
02df8b93 551 /* All the logic here assumes flags.bm_check is same across all CPUs */
ee1ca48f 552 if (bm_check_flag == -1) {
02df8b93
VP
553 /* Determine whether bm_check is needed based on CPU */
554 acpi_processor_power_init_bm_check(&(pr->flags), pr->id);
555 bm_check_flag = pr->flags.bm_check;
ee1ca48f 556 bm_control_flag = pr->flags.bm_control;
02df8b93
VP
557 } else {
558 pr->flags.bm_check = bm_check_flag;
ee1ca48f 559 pr->flags.bm_control = bm_control_flag;
02df8b93
VP
560 }
561
562 if (pr->flags.bm_check) {
02df8b93 563 if (!pr->flags.bm_control) {
ed3110ef
VP
564 if (pr->flags.has_cst != 1) {
565 /* bus mastering control is necessary */
566 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
567 "C3 support requires BM control\n"));
568 return;
569 } else {
570 /* Here we enter C3 without bus mastering */
571 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
572 "C3 support without BM control\n"));
573 }
02df8b93
VP
574 }
575 } else {
02df8b93
VP
576 /*
577 * WBINVD should be set in fadt, for C3 state to be
578 * supported on when bm_check is not required.
579 */
cee324b1 580 if (!(acpi_gbl_FADT.flags & ACPI_FADT_WBINVD)) {
02df8b93 581 ACPI_DEBUG_PRINT((ACPI_DB_INFO,
4be44fcd
LB
582 "Cache invalidation should work properly"
583 " for C3 to be enabled on SMP systems\n"));
d550d98d 584 return;
02df8b93 585 }
02df8b93
VP
586 }
587
1da177e4
LT
588 /*
589 * Otherwise we've met all of our C3 requirements.
590 * Normalize the C3 latency to expidite policy. Enable
591 * checking of bus mastering status (bm_check) so we can
592 * use this in our C3 policy
593 */
594 cx->valid = 1;
4f86d3a8 595
4f86d3a8 596 cx->latency_ticks = cx->latency;
31878dd8
LB
597 /*
598 * On older chipsets, BM_RLD needs to be set
599 * in order for Bus Master activity to wake the
600 * system from C3. Newer chipsets handle DMA
601 * during C3 automatically and BM_RLD is a NOP.
602 * In either case, the proper way to
603 * handle BM_RLD is to set it and leave it set.
604 */
50ffba1b 605 acpi_write_bit_register(ACPI_BITREG_BUS_MASTER_RLD, 1);
1da177e4 606
d550d98d 607 return;
1da177e4
LT
608}
609
1da177e4
LT
610static int acpi_processor_power_verify(struct acpi_processor *pr)
611{
612 unsigned int i;
613 unsigned int working = 0;
6eb0a0fd 614
169a0abb 615 pr->power.timer_broadcast_on_state = INT_MAX;
6eb0a0fd 616
a0bf284b 617 for (i = 1; i < ACPI_PROCESSOR_MAX_POWER && i <= max_cstate; i++) {
1da177e4
LT
618 struct acpi_processor_cx *cx = &pr->power.states[i];
619
620 switch (cx->type) {
621 case ACPI_STATE_C1:
622 cx->valid = 1;
623 break;
624
625 case ACPI_STATE_C2:
d22edd29
LB
626 if (!cx->address)
627 break;
628 cx->valid = 1;
629 cx->latency_ticks = cx->latency; /* Normalize latency */
1da177e4
LT
630 break;
631
632 case ACPI_STATE_C3:
633 acpi_processor_power_verify_c3(pr, cx);
634 break;
635 }
7e275cc4
LB
636 if (!cx->valid)
637 continue;
1da177e4 638
7e275cc4
LB
639 lapic_timer_check_state(i, pr, cx);
640 tsc_check_state(cx->type);
641 working++;
1da177e4 642 }
bd663347 643
918aae42 644 lapic_timer_propagate_broadcast(pr);
1da177e4
LT
645
646 return (working);
647}
648
4be44fcd 649static int acpi_processor_get_power_info(struct acpi_processor *pr)
1da177e4
LT
650{
651 unsigned int i;
652 int result;
653
1da177e4
LT
654
655 /* NOTE: the idle thread may not be running while calling
656 * this function */
657
991528d7
VP
658 /* Zero initialize all the C-states info. */
659 memset(pr->power.states, 0, sizeof(pr->power.states));
660
1da177e4 661 result = acpi_processor_get_power_info_cst(pr);
6d93c648 662 if (result == -ENODEV)
c5a114f1 663 result = acpi_processor_get_power_info_fadt(pr);
6d93c648 664
991528d7
VP
665 if (result)
666 return result;
667
668 acpi_processor_get_power_info_default(pr);
669
cf824788 670 pr->power.count = acpi_processor_power_verify(pr);
1da177e4 671
1da177e4
LT
672 /*
673 * if one state of type C2 or C3 is available, mark this
674 * CPU as being "idle manageable"
675 */
676 for (i = 1; i < ACPI_PROCESSOR_MAX_POWER; i++) {
acf05f4b 677 if (pr->power.states[i].valid) {
1da177e4 678 pr->power.count = i;
2203d6ed
LT
679 if (pr->power.states[i].type >= ACPI_STATE_C2)
680 pr->flags.power = 1;
acf05f4b 681 }
1da177e4
LT
682 }
683
d550d98d 684 return 0;
1da177e4
LT
685}
686
74cad4ee 687#ifdef CONFIG_ACPI_PROCFS
1da177e4
LT
688static int acpi_processor_power_seq_show(struct seq_file *seq, void *offset)
689{
50dd0969 690 struct acpi_processor *pr = seq->private;
4be44fcd 691 unsigned int i;
1da177e4 692
1da177e4
LT
693
694 if (!pr)
695 goto end;
696
697 seq_printf(seq, "active state: C%zd\n"
4be44fcd 698 "max_cstate: C%d\n"
5c87579e 699 "maximum allowed latency: %d usec\n",
4be44fcd 700 pr->power.state ? pr->power.state - pr->power.states : 0,
92614610 701 max_cstate, pm_qos_requirement(PM_QOS_CPU_DMA_LATENCY));
1da177e4
LT
702
703 seq_puts(seq, "states:\n");
704
705 for (i = 1; i <= pr->power.count; i++) {
706 seq_printf(seq, " %cC%d: ",
4be44fcd
LB
707 (&pr->power.states[i] ==
708 pr->power.state ? '*' : ' '), i);
1da177e4
LT
709
710 if (!pr->power.states[i].valid) {
711 seq_puts(seq, "<not supported>\n");
712 continue;
713 }
714
715 switch (pr->power.states[i].type) {
716 case ACPI_STATE_C1:
717 seq_printf(seq, "type[C1] ");
718 break;
719 case ACPI_STATE_C2:
720 seq_printf(seq, "type[C2] ");
721 break;
722 case ACPI_STATE_C3:
723 seq_printf(seq, "type[C3] ");
724 break;
725 default:
726 seq_printf(seq, "type[--] ");
727 break;
728 }
729
730 if (pr->power.states[i].promotion.state)
731 seq_printf(seq, "promotion[C%zd] ",
4be44fcd
LB
732 (pr->power.states[i].promotion.state -
733 pr->power.states));
1da177e4
LT
734 else
735 seq_puts(seq, "promotion[--] ");
736
737 if (pr->power.states[i].demotion.state)
738 seq_printf(seq, "demotion[C%zd] ",
4be44fcd
LB
739 (pr->power.states[i].demotion.state -
740 pr->power.states));
1da177e4
LT
741 else
742 seq_puts(seq, "demotion[--] ");
743
a3c6598f 744 seq_printf(seq, "latency[%03d] usage[%08d] duration[%020llu]\n",
4be44fcd 745 pr->power.states[i].latency,
a3c6598f 746 pr->power.states[i].usage,
b0b7eaaf 747 (unsigned long long)pr->power.states[i].time);
1da177e4
LT
748 }
749
4be44fcd 750 end:
d550d98d 751 return 0;
1da177e4
LT
752}
753
754static int acpi_processor_power_open_fs(struct inode *inode, struct file *file)
755{
756 return single_open(file, acpi_processor_power_seq_show,
4be44fcd 757 PDE(inode)->data);
1da177e4
LT
758}
759
d7508032 760static const struct file_operations acpi_processor_power_fops = {
cf7acfab 761 .owner = THIS_MODULE,
4be44fcd
LB
762 .open = acpi_processor_power_open_fs,
763 .read = seq_read,
764 .llseek = seq_lseek,
765 .release = single_release,
1da177e4 766};
74cad4ee 767#endif
4f86d3a8
LB
768
769/**
770 * acpi_idle_bm_check - checks if bus master activity was detected
771 */
772static int acpi_idle_bm_check(void)
773{
774 u32 bm_status = 0;
775
50ffba1b 776 acpi_read_bit_register(ACPI_BITREG_BUS_MASTER_STATUS, &bm_status);
4f86d3a8 777 if (bm_status)
50ffba1b 778 acpi_write_bit_register(ACPI_BITREG_BUS_MASTER_STATUS, 1);
4f86d3a8
LB
779 /*
780 * PIIX4 Erratum #18: Note that BM_STS doesn't always reflect
781 * the true state of bus mastering activity; forcing us to
782 * manually check the BMIDEA bit of each IDE channel.
783 */
784 else if (errata.piix4.bmisx) {
785 if ((inb_p(errata.piix4.bmisx + 0x02) & 0x01)
786 || (inb_p(errata.piix4.bmisx + 0x0A) & 0x01))
787 bm_status = 1;
788 }
789 return bm_status;
790}
791
4f86d3a8
LB
792/**
793 * acpi_idle_do_entry - a helper function that does C2 and C3 type entry
794 * @cx: cstate data
bc71bec9 795 *
796 * Caller disables interrupt before call and enables interrupt after return.
4f86d3a8
LB
797 */
798static inline void acpi_idle_do_entry(struct acpi_processor_cx *cx)
799{
dcf30997
SR
800 /* Don't trace irqs off for idle */
801 stop_critical_timings();
bc71bec9 802 if (cx->entry_method == ACPI_CSTATE_FFH) {
4f86d3a8
LB
803 /* Call into architectural FFH based C-state */
804 acpi_processor_ffh_cstate_enter(cx);
bc71bec9 805 } else if (cx->entry_method == ACPI_CSTATE_HALT) {
806 acpi_safe_halt();
4f86d3a8
LB
807 } else {
808 int unused;
809 /* IO port based C-state */
810 inb(cx->address);
811 /* Dummy wait op - must do something useless after P_LVL2 read
812 because chipsets cannot guarantee that STPCLK# signal
813 gets asserted in time to freeze execution properly. */
814 unused = inl(acpi_gbl_FADT.xpm_timer_block.address);
815 }
dcf30997 816 start_critical_timings();
4f86d3a8
LB
817}
818
819/**
820 * acpi_idle_enter_c1 - enters an ACPI C1 state-type
821 * @dev: the target CPU
822 * @state: the state data
823 *
824 * This is equivalent to the HALT instruction.
825 */
826static int acpi_idle_enter_c1(struct cpuidle_device *dev,
827 struct cpuidle_state *state)
828{
ff69f2bb 829 ktime_t kt1, kt2;
830 s64 idle_time;
4f86d3a8
LB
831 struct acpi_processor *pr;
832 struct acpi_processor_cx *cx = cpuidle_get_statedata(state);
9b12e18c 833
706546d0 834 pr = __get_cpu_var(processors);
4f86d3a8
LB
835
836 if (unlikely(!pr))
837 return 0;
838
2e906655 839 local_irq_disable();
b077fbad
VP
840
841 /* Do not access any ACPI IO ports in suspend path */
842 if (acpi_idle_suspend) {
b077fbad 843 local_irq_enable();
7d60e8ab 844 cpu_relax();
b077fbad
VP
845 return 0;
846 }
847
7e275cc4 848 lapic_timer_state_broadcast(pr, cx, 1);
ff69f2bb 849 kt1 = ktime_get_real();
bc71bec9 850 acpi_idle_do_entry(cx);
ff69f2bb 851 kt2 = ktime_get_real();
852 idle_time = ktime_to_us(ktime_sub(kt2, kt1));
4f86d3a8 853
2e906655 854 local_irq_enable();
4f86d3a8 855 cx->usage++;
7e275cc4 856 lapic_timer_state_broadcast(pr, cx, 0);
4f86d3a8 857
ff69f2bb 858 return idle_time;
4f86d3a8
LB
859}
860
861/**
862 * acpi_idle_enter_simple - enters an ACPI state without BM handling
863 * @dev: the target CPU
864 * @state: the state data
865 */
866static int acpi_idle_enter_simple(struct cpuidle_device *dev,
867 struct cpuidle_state *state)
868{
869 struct acpi_processor *pr;
870 struct acpi_processor_cx *cx = cpuidle_get_statedata(state);
ff69f2bb 871 ktime_t kt1, kt2;
872 s64 idle_time;
873 s64 sleep_ticks = 0;
50629118 874
706546d0 875 pr = __get_cpu_var(processors);
4f86d3a8
LB
876
877 if (unlikely(!pr))
878 return 0;
879
e196441b
LB
880 if (acpi_idle_suspend)
881 return(acpi_idle_enter_c1(dev, state));
882
4f86d3a8 883 local_irq_disable();
02cf4f98 884
d306ebc2
PV
885 if (cx->entry_method != ACPI_CSTATE_FFH) {
886 current_thread_info()->status &= ~TS_POLLING;
887 /*
888 * TS_POLLING-cleared state must be visible before we test
889 * NEED_RESCHED:
890 */
891 smp_mb();
4f86d3a8 892
02cf4f98
LB
893 if (unlikely(need_resched())) {
894 current_thread_info()->status |= TS_POLLING;
895 local_irq_enable();
896 return 0;
897 }
4f86d3a8
LB
898 }
899
e17bcb43
TG
900 /*
901 * Must be done before busmaster disable as we might need to
902 * access HPET !
903 */
7e275cc4 904 lapic_timer_state_broadcast(pr, cx, 1);
e17bcb43 905
4f86d3a8
LB
906 if (cx->type == ACPI_STATE_C3)
907 ACPI_FLUSH_CPU_CACHE();
908
ff69f2bb 909 kt1 = ktime_get_real();
50629118
VP
910 /* Tell the scheduler that we are going deep-idle: */
911 sched_clock_idle_sleep_event();
4f86d3a8 912 acpi_idle_do_entry(cx);
ff69f2bb 913 kt2 = ktime_get_real();
914 idle_time = ktime_to_us(ktime_sub(kt2, kt1));
4f86d3a8 915
ff69f2bb 916 sleep_ticks = us_to_pm_timer_ticks(idle_time);
50629118
VP
917
918 /* Tell the scheduler how much we idled: */
919 sched_clock_idle_wakeup_event(sleep_ticks*PM_TIMER_TICK_NS);
4f86d3a8
LB
920
921 local_irq_enable();
02cf4f98
LB
922 if (cx->entry_method != ACPI_CSTATE_FFH)
923 current_thread_info()->status |= TS_POLLING;
4f86d3a8
LB
924
925 cx->usage++;
926
7e275cc4 927 lapic_timer_state_broadcast(pr, cx, 0);
50629118 928 cx->time += sleep_ticks;
ff69f2bb 929 return idle_time;
4f86d3a8
LB
930}
931
932static int c3_cpu_count;
933static DEFINE_SPINLOCK(c3_lock);
934
935/**
936 * acpi_idle_enter_bm - enters C3 with proper BM handling
937 * @dev: the target CPU
938 * @state: the state data
939 *
940 * If BM is detected, the deepest non-C3 idle state is entered instead.
941 */
942static int acpi_idle_enter_bm(struct cpuidle_device *dev,
943 struct cpuidle_state *state)
944{
945 struct acpi_processor *pr;
946 struct acpi_processor_cx *cx = cpuidle_get_statedata(state);
ff69f2bb 947 ktime_t kt1, kt2;
948 s64 idle_time;
949 s64 sleep_ticks = 0;
950
50629118 951
706546d0 952 pr = __get_cpu_var(processors);
4f86d3a8
LB
953
954 if (unlikely(!pr))
955 return 0;
956
e196441b
LB
957 if (acpi_idle_suspend)
958 return(acpi_idle_enter_c1(dev, state));
959
ddc081a1
VP
960 if (acpi_idle_bm_check()) {
961 if (dev->safe_state) {
addbad46 962 dev->last_state = dev->safe_state;
ddc081a1
VP
963 return dev->safe_state->enter(dev, dev->safe_state);
964 } else {
2e906655 965 local_irq_disable();
ddc081a1 966 acpi_safe_halt();
2e906655 967 local_irq_enable();
ddc081a1
VP
968 return 0;
969 }
970 }
971
4f86d3a8 972 local_irq_disable();
02cf4f98 973
d306ebc2
PV
974 if (cx->entry_method != ACPI_CSTATE_FFH) {
975 current_thread_info()->status &= ~TS_POLLING;
976 /*
977 * TS_POLLING-cleared state must be visible before we test
978 * NEED_RESCHED:
979 */
980 smp_mb();
4f86d3a8 981
02cf4f98
LB
982 if (unlikely(need_resched())) {
983 current_thread_info()->status |= TS_POLLING;
984 local_irq_enable();
985 return 0;
986 }
4f86d3a8
LB
987 }
988
996520c1
VP
989 acpi_unlazy_tlb(smp_processor_id());
990
50629118
VP
991 /* Tell the scheduler that we are going deep-idle: */
992 sched_clock_idle_sleep_event();
4f86d3a8
LB
993 /*
994 * Must be done before busmaster disable as we might need to
995 * access HPET !
996 */
7e275cc4 997 lapic_timer_state_broadcast(pr, cx, 1);
4f86d3a8 998
f461ddea 999 kt1 = ktime_get_real();
ddc081a1
VP
1000 /*
1001 * disable bus master
1002 * bm_check implies we need ARB_DIS
1003 * !bm_check implies we need cache flush
1004 * bm_control implies whether we can do ARB_DIS
1005 *
1006 * That leaves a case where bm_check is set and bm_control is
1007 * not set. In that case we cannot do much, we enter C3
1008 * without doing anything.
1009 */
1010 if (pr->flags.bm_check && pr->flags.bm_control) {
4f86d3a8
LB
1011 spin_lock(&c3_lock);
1012 c3_cpu_count++;
1013 /* Disable bus master arbitration when all CPUs are in C3 */
1014 if (c3_cpu_count == num_online_cpus())
50ffba1b 1015 acpi_write_bit_register(ACPI_BITREG_ARB_DISABLE, 1);
4f86d3a8 1016 spin_unlock(&c3_lock);
ddc081a1
VP
1017 } else if (!pr->flags.bm_check) {
1018 ACPI_FLUSH_CPU_CACHE();
1019 }
4f86d3a8 1020
ddc081a1 1021 acpi_idle_do_entry(cx);
4f86d3a8 1022
ddc081a1
VP
1023 /* Re-enable bus master arbitration */
1024 if (pr->flags.bm_check && pr->flags.bm_control) {
4f86d3a8 1025 spin_lock(&c3_lock);
50ffba1b 1026 acpi_write_bit_register(ACPI_BITREG_ARB_DISABLE, 0);
4f86d3a8
LB
1027 c3_cpu_count--;
1028 spin_unlock(&c3_lock);
1029 }
f461ddea
LB
1030 kt2 = ktime_get_real();
1031 idle_time = ktime_to_us(ktime_sub(kt2, kt1));
4f86d3a8 1032
ff69f2bb 1033 sleep_ticks = us_to_pm_timer_ticks(idle_time);
50629118
VP
1034 /* Tell the scheduler how much we idled: */
1035 sched_clock_idle_wakeup_event(sleep_ticks*PM_TIMER_TICK_NS);
4f86d3a8
LB
1036
1037 local_irq_enable();
02cf4f98
LB
1038 if (cx->entry_method != ACPI_CSTATE_FFH)
1039 current_thread_info()->status |= TS_POLLING;
4f86d3a8
LB
1040
1041 cx->usage++;
1042
7e275cc4 1043 lapic_timer_state_broadcast(pr, cx, 0);
50629118 1044 cx->time += sleep_ticks;
ff69f2bb 1045 return idle_time;
4f86d3a8
LB
1046}
1047
1048struct cpuidle_driver acpi_idle_driver = {
1049 .name = "acpi_idle",
1050 .owner = THIS_MODULE,
1051};
1052
1053/**
1054 * acpi_processor_setup_cpuidle - prepares and configures CPUIDLE
1055 * @pr: the ACPI processor
1056 */
1057static int acpi_processor_setup_cpuidle(struct acpi_processor *pr)
1058{
9a0b8415 1059 int i, count = CPUIDLE_DRIVER_STATE_START;
4f86d3a8
LB
1060 struct acpi_processor_cx *cx;
1061 struct cpuidle_state *state;
1062 struct cpuidle_device *dev = &pr->power.dev;
1063
1064 if (!pr->flags.power_setup_done)
1065 return -EINVAL;
1066
1067 if (pr->flags.power == 0) {
1068 return -EINVAL;
1069 }
1070
dcb84f33 1071 dev->cpu = pr->id;
4fcb2fcd
VP
1072 for (i = 0; i < CPUIDLE_STATE_MAX; i++) {
1073 dev->states[i].name[0] = '\0';
1074 dev->states[i].desc[0] = '\0';
1075 }
1076
615dfd93
LB
1077 if (max_cstate == 0)
1078 max_cstate = 1;
1079
4f86d3a8
LB
1080 for (i = 1; i < ACPI_PROCESSOR_MAX_POWER && i <= max_cstate; i++) {
1081 cx = &pr->power.states[i];
1082 state = &dev->states[count];
1083
1084 if (!cx->valid)
1085 continue;
1086
1087#ifdef CONFIG_HOTPLUG_CPU
1088 if ((cx->type != ACPI_STATE_C1) && (num_online_cpus() > 1) &&
1089 !pr->flags.has_cst &&
1090 !(acpi_gbl_FADT.flags & ACPI_FADT_C2_MP_SUPPORTED))
1091 continue;
1fec74a9 1092#endif
4f86d3a8
LB
1093 cpuidle_set_statedata(state, cx);
1094
1095 snprintf(state->name, CPUIDLE_NAME_LEN, "C%d", i);
4fcb2fcd 1096 strncpy(state->desc, cx->desc, CPUIDLE_DESC_LEN);
4f86d3a8 1097 state->exit_latency = cx->latency;
4963f620 1098 state->target_residency = cx->latency * latency_factor;
4f86d3a8
LB
1099 state->power_usage = cx->power;
1100
1101 state->flags = 0;
1102 switch (cx->type) {
1103 case ACPI_STATE_C1:
1104 state->flags |= CPUIDLE_FLAG_SHALLOW;
8e92b660
VP
1105 if (cx->entry_method == ACPI_CSTATE_FFH)
1106 state->flags |= CPUIDLE_FLAG_TIME_VALID;
1107
4f86d3a8 1108 state->enter = acpi_idle_enter_c1;
ddc081a1 1109 dev->safe_state = state;
4f86d3a8
LB
1110 break;
1111
1112 case ACPI_STATE_C2:
1113 state->flags |= CPUIDLE_FLAG_BALANCED;
1114 state->flags |= CPUIDLE_FLAG_TIME_VALID;
1115 state->enter = acpi_idle_enter_simple;
ddc081a1 1116 dev->safe_state = state;
4f86d3a8
LB
1117 break;
1118
1119 case ACPI_STATE_C3:
1120 state->flags |= CPUIDLE_FLAG_DEEP;
1121 state->flags |= CPUIDLE_FLAG_TIME_VALID;
1122 state->flags |= CPUIDLE_FLAG_CHECK_BM;
1123 state->enter = pr->flags.bm_check ?
1124 acpi_idle_enter_bm :
1125 acpi_idle_enter_simple;
1126 break;
1127 }
1128
1129 count++;
9a0b8415 1130 if (count == CPUIDLE_STATE_MAX)
1131 break;
4f86d3a8
LB
1132 }
1133
1134 dev->state_count = count;
1135
1136 if (!count)
1137 return -EINVAL;
1138
4f86d3a8
LB
1139 return 0;
1140}
1141
1142int acpi_processor_cst_has_changed(struct acpi_processor *pr)
1143{
dcb84f33 1144 int ret = 0;
4f86d3a8 1145
36a91358
VP
1146 if (boot_option_idle_override)
1147 return 0;
1148
4f86d3a8
LB
1149 if (!pr)
1150 return -EINVAL;
1151
1152 if (nocst) {
1153 return -ENODEV;
1154 }
1155
1156 if (!pr->flags.power_setup_done)
1157 return -ENODEV;
1158
1159 cpuidle_pause_and_lock();
1160 cpuidle_disable_device(&pr->power.dev);
1161 acpi_processor_get_power_info(pr);
dcb84f33
VP
1162 if (pr->flags.power) {
1163 acpi_processor_setup_cpuidle(pr);
1164 ret = cpuidle_enable_device(&pr->power.dev);
1165 }
4f86d3a8
LB
1166 cpuidle_resume_and_unlock();
1167
1168 return ret;
1169}
1170
7af8b660 1171int __cpuinit acpi_processor_power_init(struct acpi_processor *pr,
4be44fcd 1172 struct acpi_device *device)
1da177e4 1173{
4be44fcd 1174 acpi_status status = 0;
b6835052 1175 static int first_run;
b188e4ce 1176#ifdef CONFIG_ACPI_PROCFS
4be44fcd 1177 struct proc_dir_entry *entry = NULL;
b188e4ce 1178#endif
1da177e4 1179
36a91358
VP
1180 if (boot_option_idle_override)
1181 return 0;
1da177e4
LT
1182
1183 if (!first_run) {
c1e3b377
ZY
1184 if (idle_halt) {
1185 /*
1186 * When the boot option of "idle=halt" is added, halt
1187 * is used for CPU IDLE.
1188 * In such case C2/C3 is meaningless. So the max_cstate
1189 * is set to one.
1190 */
1191 max_cstate = 1;
1192 }
1da177e4 1193 dmi_check_system(processor_power_dmi_table);
c1c30634 1194 max_cstate = acpi_processor_cstate_check(max_cstate);
1da177e4 1195 if (max_cstate < ACPI_C_STATES_MAX)
4be44fcd
LB
1196 printk(KERN_NOTICE
1197 "ACPI: processor limited to max C-state %d\n",
1198 max_cstate);
1da177e4
LT
1199 first_run++;
1200 }
1201
02df8b93 1202 if (!pr)
d550d98d 1203 return -EINVAL;
02df8b93 1204
cee324b1 1205 if (acpi_gbl_FADT.cst_control && !nocst) {
4be44fcd 1206 status =
cee324b1 1207 acpi_os_write_port(acpi_gbl_FADT.smi_command, acpi_gbl_FADT.cst_control, 8);
1da177e4 1208 if (ACPI_FAILURE(status)) {
a6fc6720
TR
1209 ACPI_EXCEPTION((AE_INFO, status,
1210 "Notifying BIOS of _CST ability failed"));
1da177e4
LT
1211 }
1212 }
1213
1214 acpi_processor_get_power_info(pr);
4f86d3a8 1215 pr->flags.power_setup_done = 1;
1da177e4
LT
1216
1217 /*
1218 * Install the idle handler if processor power management is supported.
1219 * Note that we use previously set idle handler will be used on
1220 * platforms that only support C1.
1221 */
36a91358 1222 if (pr->flags.power) {
4f86d3a8 1223 acpi_processor_setup_cpuidle(pr);
4f86d3a8
LB
1224 if (cpuidle_register_device(&pr->power.dev))
1225 return -EIO;
1da177e4 1226 }
74cad4ee 1227#ifdef CONFIG_ACPI_PROCFS
1da177e4 1228 /* 'power' [R] */
cf7acfab
DL
1229 entry = proc_create_data(ACPI_PROCESSOR_FILE_POWER,
1230 S_IRUGO, acpi_device_dir(device),
1231 &acpi_processor_power_fops,
1232 acpi_driver_data(device));
1da177e4 1233 if (!entry)
a6fc6720 1234 return -EIO;
74cad4ee 1235#endif
d550d98d 1236 return 0;
1da177e4
LT
1237}
1238
4be44fcd
LB
1239int acpi_processor_power_exit(struct acpi_processor *pr,
1240 struct acpi_device *device)
1da177e4 1241{
36a91358
VP
1242 if (boot_option_idle_override)
1243 return 0;
1244
dcb84f33 1245 cpuidle_unregister_device(&pr->power.dev);
1da177e4
LT
1246 pr->flags.power_setup_done = 0;
1247
74cad4ee 1248#ifdef CONFIG_ACPI_PROCFS
1da177e4 1249 if (acpi_device_dir(device))
4be44fcd
LB
1250 remove_proc_entry(ACPI_PROCESSOR_FILE_POWER,
1251 acpi_device_dir(device));
74cad4ee 1252#endif
1da177e4 1253
d550d98d 1254 return 0;
1da177e4 1255}