/*
 * acpi-cpufreq.c - ACPI Processor P-States Driver
 *
 * Copyright (C) 2001, 2002 Andy Grover <andrew.grover@intel.com>
 * Copyright (C) 2001, 2002 Paul Diefenbaugh <paul.s.diefenbaugh@intel.com>
 * Copyright (C) 2002 - 2004 Dominik Brodowski <linux@brodo.de>
 * Copyright (C) 2006 Denis Sadykov <denis.m.sadykov@intel.com>
 *
 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or (at
 * your option) any later version.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA.
 *
 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 */

#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/smp.h>
#include <linux/sched.h>
#include <linux/cpufreq.h>
#include <linux/compiler.h>
#include <linux/dmi.h>
#include <linux/slab.h>

#include <linux/acpi.h>
#include <linux/io.h>
#include <linux/delay.h>
#include <linux/uaccess.h>

#include <acpi/processor.h>

#include <asm/msr.h>
#include <asm/processor.h>
#include <asm/cpufeature.h>

MODULE_AUTHOR("Paul Diefenbaugh, Dominik Brodowski");
MODULE_DESCRIPTION("ACPI Processor P-States Driver");
MODULE_LICENSE("GPL");

#define PFX "acpi-cpufreq: "

enum {
	UNDEFINED_CAPABLE = 0,
	SYSTEM_INTEL_MSR_CAPABLE,
	SYSTEM_AMD_MSR_CAPABLE,
	SYSTEM_IO_CAPABLE,
};

#define INTEL_MSR_RANGE		(0xffff)
#define AMD_MSR_RANGE		(0x7)

#define MSR_K7_HWCR_CPB_DIS	(1ULL << 25)

struct acpi_cpufreq_data {
	struct acpi_processor_performance *acpi_data;
	struct cpufreq_frequency_table *freq_table;
	unsigned int resume;
	unsigned int cpu_feature;
	cpumask_var_t freqdomain_cpus;
};

/* acpi_perf_data is a pointer to percpu data. */
static struct acpi_processor_performance __percpu *acpi_perf_data;

static struct cpufreq_driver acpi_cpufreq_driver;

static unsigned int acpi_pstate_strict;
static struct msr __percpu *msrs;

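/*
 * Return true if boost is currently enabled on @cpu, i.e. the
 * vendor-specific boost-disable bit (turbo disable on Intel, core
 * performance boost disable on AMD) is clear in the relevant MSR.
 */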
static bool boost_state(unsigned int cpu)
{
	u32 lo, hi;
	u64 msr;

	switch (boot_cpu_data.x86_vendor) {
	case X86_VENDOR_INTEL:
		rdmsr_on_cpu(cpu, MSR_IA32_MISC_ENABLE, &lo, &hi);
		msr = lo | ((u64)hi << 32);
		return !(msr & MSR_IA32_MISC_ENABLE_TURBO_DISABLE);
	case X86_VENDOR_AMD:
		rdmsr_on_cpu(cpu, MSR_K7_HWCR, &lo, &hi);
		msr = lo | ((u64)hi << 32);
		return !(msr & MSR_K7_HWCR_CPB_DIS);
	}
	return false;
}

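/*
 * Set or clear the boost-disable bit for all CPUs in @cpumask via a
 * read-modify-write of the vendor-specific MSR.
 */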
static void boost_set_msrs(bool enable, const struct cpumask *cpumask)
{
	u32 cpu;
	u32 msr_addr;
	u64 msr_mask;

	switch (boot_cpu_data.x86_vendor) {
	case X86_VENDOR_INTEL:
		msr_addr = MSR_IA32_MISC_ENABLE;
		msr_mask = MSR_IA32_MISC_ENABLE_TURBO_DISABLE;
		break;
	case X86_VENDOR_AMD:
		msr_addr = MSR_K7_HWCR;
		msr_mask = MSR_K7_HWCR_CPB_DIS;
		break;
	default:
		return;
	}

	rdmsr_on_cpus(cpumask, msr_addr, msrs);

	for_each_cpu(cpu, cpumask) {
		struct msr *reg = per_cpu_ptr(msrs, cpu);
		if (enable)
			reg->q &= ~msr_mask;
		else
			reg->q |= msr_mask;
	}

	wrmsr_on_cpus(cpumask, msr_addr, msrs);
}

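/*
 * Toggle boost on every online CPU; also wired up as the driver's
 * set_boost callback below.
 */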
static int _store_boost(int val)
{
	get_online_cpus();
	boost_set_msrs(val, cpu_online_mask);
	put_online_cpus();
	pr_debug("Core Boosting %sabled.\n", val ? "en" : "dis");

	return 0;
}

static ssize_t show_freqdomain_cpus(struct cpufreq_policy *policy, char *buf)
{
	struct acpi_cpufreq_data *data = policy->driver_data;

	return cpufreq_show_cpus(data->freqdomain_cpus, buf);
}

cpufreq_freq_attr_ro(freqdomain_cpus);

#ifdef CONFIG_X86_ACPI_CPUFREQ_CPB
static ssize_t store_boost(const char *buf, size_t count)
{
	int ret;
	unsigned long val = 0;

	if (!acpi_cpufreq_driver.boost_supported)
		return -EINVAL;

	ret = kstrtoul(buf, 10, &val);
	if (ret || (val > 1))
		return -EINVAL;

	_store_boost((int) val);

	return count;
}

static ssize_t store_cpb(struct cpufreq_policy *policy, const char *buf,
			 size_t count)
{
	return store_boost(buf, count);
}

static ssize_t show_cpb(struct cpufreq_policy *policy, char *buf)
{
	return sprintf(buf, "%u\n", acpi_cpufreq_driver.boost_enabled);
}

cpufreq_freq_attr_rw(cpb);
#endif

static int check_est_cpu(unsigned int cpuid)
{
	struct cpuinfo_x86 *cpu = &cpu_data(cpuid);

	return cpu_has(cpu, X86_FEATURE_EST);
}

static int check_amd_hwpstate_cpu(unsigned int cpuid)
{
	struct cpuinfo_x86 *cpu = &cpu_data(cpuid);

	return cpu_has(cpu, X86_FEATURE_HW_PSTATE);
}

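/*
 * The extract_*() helpers translate a raw status value (read back from an
 * I/O port or MSR) into a frequency in kHz by looking it up in the
 * ACPI-provided performance state table.
 */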
static unsigned extract_io(u32 value, struct acpi_cpufreq_data *data)
{
	struct acpi_processor_performance *perf;
	int i;

	perf = data->acpi_data;

	for (i = 0; i < perf->state_count; i++) {
		if (value == perf->states[i].status)
			return data->freq_table[i].frequency;
	}
	return 0;
}

static unsigned extract_msr(u32 msr, struct acpi_cpufreq_data *data)
{
	struct cpufreq_frequency_table *pos;
	struct acpi_processor_performance *perf;

	if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD)
		msr &= AMD_MSR_RANGE;
	else
		msr &= INTEL_MSR_RANGE;

	perf = data->acpi_data;

	cpufreq_for_each_entry(pos, data->freq_table)
		if (msr == perf->states[pos->driver_data].status)
			return pos->frequency;
	return data->freq_table[0].frequency;
}

static unsigned extract_freq(u32 val, struct acpi_cpufreq_data *data)
{
	switch (data->cpu_feature) {
	case SYSTEM_INTEL_MSR_CAPABLE:
	case SYSTEM_AMD_MSR_CAPABLE:
		return extract_msr(val, data);
	case SYSTEM_IO_CAPABLE:
		return extract_io(val, data);
	default:
		return 0;
	}
}

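/*
 * A drv_cmd bundles everything needed to access the P-state control
 * interface on a set of CPUs: the access method, the MSR or I/O port
 * address, the target CPU mask and the value to read or write.
 */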
struct msr_addr {
	u32 reg;
};

struct io_addr {
	u16 port;
	u8 bit_width;
};

struct drv_cmd {
	unsigned int type;
	const struct cpumask *mask;
	union {
		struct msr_addr msr;
		struct io_addr io;
	} addr;
	u32 val;
};

/* Called via smp_call_function_single(), on the target CPU */
static void do_drv_read(void *_cmd)
{
	struct drv_cmd *cmd = _cmd;
	u32 h;

	switch (cmd->type) {
	case SYSTEM_INTEL_MSR_CAPABLE:
	case SYSTEM_AMD_MSR_CAPABLE:
		rdmsr(cmd->addr.msr.reg, cmd->val, h);
		break;
	case SYSTEM_IO_CAPABLE:
		acpi_os_read_port((acpi_io_address)cmd->addr.io.port,
				&cmd->val,
				(u32)cmd->addr.io.bit_width);
		break;
	default:
		break;
	}
}

/* Called via smp_call_function_many(), on the target CPUs */
static void do_drv_write(void *_cmd)
{
	struct drv_cmd *cmd = _cmd;
	u32 lo, hi;

	switch (cmd->type) {
	case SYSTEM_INTEL_MSR_CAPABLE:
		rdmsr(cmd->addr.msr.reg, lo, hi);
		lo = (lo & ~INTEL_MSR_RANGE) | (cmd->val & INTEL_MSR_RANGE);
		wrmsr(cmd->addr.msr.reg, lo, hi);
		break;
	case SYSTEM_AMD_MSR_CAPABLE:
		wrmsr(cmd->addr.msr.reg, cmd->val, 0);
		break;
	case SYSTEM_IO_CAPABLE:
		acpi_os_write_port((acpi_io_address)cmd->addr.io.port,
				cmd->val,
				(u32)cmd->addr.io.bit_width);
		break;
	default:
		break;
	}
}

static void drv_read(struct drv_cmd *cmd)
{
	int err;
	cmd->val = 0;

	err = smp_call_function_any(cmd->mask, do_drv_read, cmd, 1);
	WARN_ON_ONCE(err);	/* smp_call_function_any() was buggy? */
}

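/*
 * Run do_drv_write() on every CPU in cmd->mask. The local CPU must be
 * handled directly because smp_call_function_many() skips the caller.
 */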
static void drv_write(struct drv_cmd *cmd)
{
	int this_cpu;

	this_cpu = get_cpu();
	if (cpumask_test_cpu(this_cpu, cmd->mask))
		do_drv_write(cmd);
	smp_call_function_many(cmd->mask, do_drv_write, cmd, 1);
	put_cpu();
}

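/* Read back the raw value of the P-state control register for the CPUs in @mask. */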
static u32
get_cur_val(const struct cpumask *mask, struct acpi_cpufreq_data *data)
{
	struct acpi_processor_performance *perf;
	struct drv_cmd cmd;

	if (unlikely(cpumask_empty(mask)))
		return 0;

	switch (data->cpu_feature) {
	case SYSTEM_INTEL_MSR_CAPABLE:
		cmd.type = SYSTEM_INTEL_MSR_CAPABLE;
		cmd.addr.msr.reg = MSR_IA32_PERF_CTL;
		break;
	case SYSTEM_AMD_MSR_CAPABLE:
		cmd.type = SYSTEM_AMD_MSR_CAPABLE;
		cmd.addr.msr.reg = MSR_AMD_PERF_CTL;
		break;
	case SYSTEM_IO_CAPABLE:
		cmd.type = SYSTEM_IO_CAPABLE;
		perf = data->acpi_data;
		cmd.addr.io.port = perf->control_register.address;
		cmd.addr.io.bit_width = perf->control_register.bit_width;
		break;
	default:
		return 0;
	}

	cmd.mask = mask;
	drv_read(&cmd);

	pr_debug("get_cur_val = %u\n", cmd.val);

	return cmd.val;
}

static unsigned int get_cur_freq_on_cpu(unsigned int cpu)
{
	struct acpi_cpufreq_data *data;
	struct cpufreq_policy *policy;
	unsigned int freq;
	unsigned int cached_freq;

	pr_debug("get_cur_freq_on_cpu (%d)\n", cpu);

	policy = cpufreq_cpu_get(cpu);
	if (unlikely(!policy))
		return 0;

	data = policy->driver_data;
	cpufreq_cpu_put(policy);
	if (unlikely(!data || !data->acpi_data || !data->freq_table))
		return 0;

	cached_freq = data->freq_table[data->acpi_data->state].frequency;
	freq = extract_freq(get_cur_val(cpumask_of(cpu), data), data);
	if (freq != cached_freq) {
		/*
		 * The dreaded BIOS frequency change behind our back.
		 * Force set the frequency on next target call.
		 */
		data->resume = 1;
	}

	pr_debug("cur freq = %u\n", freq);

	return freq;
}

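/*
 * Poll the hardware for up to about a millisecond (100 x 10us) to verify
 * that the requested frequency was actually reached; used only when the
 * acpi_pstate_strict module parameter is set.
 */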
static unsigned int check_freqs(const struct cpumask *mask, unsigned int freq,
				struct acpi_cpufreq_data *data)
{
	unsigned int cur_freq;
	unsigned int i;

	for (i = 0; i < 100; i++) {
		cur_freq = extract_freq(get_cur_val(mask, data), data);
		if (cur_freq == freq)
			return 1;
		udelay(10);
	}
	return 0;
}

static int acpi_cpufreq_target(struct cpufreq_policy *policy,
			       unsigned int index)
{
	struct acpi_cpufreq_data *data = policy->driver_data;
	struct acpi_processor_performance *perf;
	struct drv_cmd cmd;
	unsigned int next_perf_state = 0; /* Index into perf table */
	int result = 0;

	if (unlikely(data == NULL ||
	     data->acpi_data == NULL || data->freq_table == NULL)) {
		return -ENODEV;
	}

	perf = data->acpi_data;
	next_perf_state = data->freq_table[index].driver_data;
	if (perf->state == next_perf_state) {
		if (unlikely(data->resume)) {
			pr_debug("Called after resume, resetting to P%d\n",
				next_perf_state);
			data->resume = 0;
		} else {
			pr_debug("Already at target state (P%d)\n",
				next_perf_state);
			goto out;
		}
	}

	switch (data->cpu_feature) {
	case SYSTEM_INTEL_MSR_CAPABLE:
		cmd.type = SYSTEM_INTEL_MSR_CAPABLE;
		cmd.addr.msr.reg = MSR_IA32_PERF_CTL;
		cmd.val = (u32) perf->states[next_perf_state].control;
		break;
	case SYSTEM_AMD_MSR_CAPABLE:
		cmd.type = SYSTEM_AMD_MSR_CAPABLE;
		cmd.addr.msr.reg = MSR_AMD_PERF_CTL;
		cmd.val = (u32) perf->states[next_perf_state].control;
		break;
	case SYSTEM_IO_CAPABLE:
		cmd.type = SYSTEM_IO_CAPABLE;
		cmd.addr.io.port = perf->control_register.address;
		cmd.addr.io.bit_width = perf->control_register.bit_width;
		cmd.val = (u32) perf->states[next_perf_state].control;
		break;
	default:
		result = -ENODEV;
		goto out;
	}

	/* cpufreq holds the hotplug lock, so we are safe from here on */
	if (policy->shared_type != CPUFREQ_SHARED_TYPE_ANY)
		cmd.mask = policy->cpus;
	else
		cmd.mask = cpumask_of(policy->cpu);

	drv_write(&cmd);

	if (acpi_pstate_strict) {
		if (!check_freqs(cmd.mask, data->freq_table[index].frequency,
				 data)) {
			pr_debug("acpi_cpufreq_target failed (%d)\n",
				policy->cpu);
			result = -EAGAIN;
		}
	}

	if (!result)
		perf->state = next_perf_state;

out:
	return result;
}

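/*
 * Guess the current frequency by picking the table entry closest to the
 * measured cpu_khz, and record it as the assumed current P-state; used
 * when the current speed cannot be read back from the hardware.
 */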
static unsigned long
acpi_cpufreq_guess_freq(struct acpi_cpufreq_data *data, unsigned int cpu)
{
	struct acpi_processor_performance *perf = data->acpi_data;

	if (cpu_khz) {
		/* search the closest match to cpu_khz */
		unsigned int i;
		unsigned long freq;
		unsigned long freqn = perf->states[0].core_frequency * 1000;

		for (i = 0; i < (perf->state_count-1); i++) {
			freq = freqn;
			freqn = perf->states[i+1].core_frequency * 1000;
			if ((2 * cpu_khz) > (freqn + freq)) {
				perf->state = i;
				return freq;
			}
		}
		perf->state = perf->state_count-1;
		return freqn;
	} else {
		/* assume CPU is at P0... */
		perf->state = 0;
		return perf->states[0].core_frequency * 1000;
	}
}

static void free_acpi_perf_data(void)
{
	unsigned int i;

	/* Freeing a NULL pointer is OK, and alloc_percpu zeroes. */
	for_each_possible_cpu(i)
		free_cpumask_var(per_cpu_ptr(acpi_perf_data, i)
				 ->shared_cpu_map);
	free_percpu(acpi_perf_data);
}

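/*
 * CPU hotplug notifier: keeps each CPU's boost-disable bit consistent
 * with the global boost state as CPUs go up and down.
 */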
static int boost_notify(struct notifier_block *nb, unsigned long action,
			void *hcpu)
{
	unsigned cpu = (long)hcpu;
	const struct cpumask *cpumask;

	cpumask = get_cpu_mask(cpu);

	/*
	 * Clear the boost-disable bit on the CPU_DOWN path so that
	 * this cpu cannot block the remaining ones from boosting. On
	 * the CPU_UP path we simply keep the boost-disable flag in
	 * sync with the current global state.
	 */

	switch (action) {
	case CPU_UP_PREPARE:
	case CPU_UP_PREPARE_FROZEN:
		boost_set_msrs(acpi_cpufreq_driver.boost_enabled, cpumask);
		break;

	case CPU_DOWN_PREPARE:
	case CPU_DOWN_PREPARE_FROZEN:
		boost_set_msrs(1, cpumask);
		break;

	default:
		break;
	}

	return NOTIFY_OK;
}

static struct notifier_block boost_nb = {
	.notifier_call = boost_notify,
};

/*
 * acpi_cpufreq_early_init - initialize ACPI P-States library
 *
 * Initialize the ACPI P-States library (drivers/acpi/processor_perflib.c)
 * in order to determine correct frequency and voltage pairings. We can
 * do _PDC and _PSD and find out the processor dependency for the
 * actual init that will happen later...
 */
static int __init acpi_cpufreq_early_init(void)
{
	unsigned int i;
	pr_debug("acpi_cpufreq_early_init\n");

	acpi_perf_data = alloc_percpu(struct acpi_processor_performance);
	if (!acpi_perf_data) {
		pr_debug("Memory allocation error for acpi_perf_data.\n");
		return -ENOMEM;
	}
	for_each_possible_cpu(i) {
		if (!zalloc_cpumask_var_node(
			&per_cpu_ptr(acpi_perf_data, i)->shared_cpu_map,
			GFP_KERNEL, cpu_to_node(i))) {

			/* Freeing a NULL pointer is OK: alloc_percpu zeroes. */
			free_acpi_perf_data();
			return -ENOMEM;
		}
	}

	/* Do initialization in ACPI core */
	acpi_processor_preregister_performance(acpi_perf_data);
	return 0;
}

#ifdef CONFIG_SMP
/*
 * Some BIOSes do SW_ANY coordination internally, either set it up in hw
 * or do it in BIOS firmware and won't inform about it to OS. If not
 * detected, this has a side effect of making CPU run at a different speed
 * than OS intended it to run at. Detect it and handle it cleanly.
 */
static int bios_with_sw_any_bug;

static int sw_any_bug_found(const struct dmi_system_id *d)
{
	bios_with_sw_any_bug = 1;
	return 0;
}

static const struct dmi_system_id sw_any_bug_dmi_table[] = {
	{
		.callback = sw_any_bug_found,
		.ident = "Supermicro Server X6DLP",
		.matches = {
			DMI_MATCH(DMI_SYS_VENDOR, "Supermicro"),
			DMI_MATCH(DMI_BIOS_VERSION, "080010"),
			DMI_MATCH(DMI_PRODUCT_NAME, "X6DLP"),
		},
	},
	{ }
};

static int acpi_cpufreq_blacklist(struct cpuinfo_x86 *c)
{
	/* Intel Xeon Processor 7100 Series Specification Update
	 * http://www.intel.com/Assets/PDF/specupdate/314554.pdf
	 * AL30: A Machine Check Exception (MCE) Occurring during an
	 * Enhanced Intel SpeedStep Technology Ratio Change May Cause
	 * Both Processor Cores to Lock Up. */
	if (c->x86_vendor == X86_VENDOR_INTEL) {
		if ((c->x86 == 15) &&
		    (c->x86_model == 6) &&
		    (c->x86_mask == 8)) {
			printk(KERN_INFO "acpi-cpufreq: Intel(R) "
			    "Xeon(R) 7100 Errata AL30, processors may "
			    "lock up on frequency changes: disabling "
			    "acpi-cpufreq.\n");
			return -ENODEV;
		}
	}
	return 0;
}
#endif

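/*
 * Per-policy initialization: register with the ACPI perflib, work out the
 * control method (MSR vs. I/O port), build the frequency table and apply
 * the various BIOS workarounds.
 */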
static int acpi_cpufreq_cpu_init(struct cpufreq_policy *policy)
{
	unsigned int i;
	unsigned int valid_states = 0;
	unsigned int cpu = policy->cpu;
	struct acpi_cpufreq_data *data;
	unsigned int result = 0;
	struct cpuinfo_x86 *c = &cpu_data(policy->cpu);
	struct acpi_processor_performance *perf;
#ifdef CONFIG_SMP
	static int blacklisted;
#endif

	pr_debug("acpi_cpufreq_cpu_init\n");

#ifdef CONFIG_SMP
	if (blacklisted)
		return blacklisted;
	blacklisted = acpi_cpufreq_blacklist(c);
	if (blacklisted)
		return blacklisted;
#endif

	data = kzalloc(sizeof(*data), GFP_KERNEL);
	if (!data)
		return -ENOMEM;

	if (!zalloc_cpumask_var(&data->freqdomain_cpus, GFP_KERNEL)) {
		result = -ENOMEM;
		goto err_free;
	}

	data->acpi_data = per_cpu_ptr(acpi_perf_data, cpu);
	policy->driver_data = data;

	if (cpu_has(c, X86_FEATURE_CONSTANT_TSC))
		acpi_cpufreq_driver.flags |= CPUFREQ_CONST_LOOPS;

	result = acpi_processor_register_performance(data->acpi_data, cpu);
	if (result)
		goto err_free_mask;

	perf = data->acpi_data;
	policy->shared_type = perf->shared_type;

	/*
	 * Will let policy->cpus know about dependency only when software
	 * coordination is required.
	 */
	if (policy->shared_type == CPUFREQ_SHARED_TYPE_ALL ||
	    policy->shared_type == CPUFREQ_SHARED_TYPE_ANY) {
		cpumask_copy(policy->cpus, perf->shared_cpu_map);
	}
	cpumask_copy(data->freqdomain_cpus, perf->shared_cpu_map);

#ifdef CONFIG_SMP
	dmi_check_system(sw_any_bug_dmi_table);
	if (bios_with_sw_any_bug && !policy_is_shared(policy)) {
		policy->shared_type = CPUFREQ_SHARED_TYPE_ALL;
		cpumask_copy(policy->cpus, topology_core_cpumask(cpu));
	}

	if (check_amd_hwpstate_cpu(cpu) && !acpi_pstate_strict) {
		cpumask_clear(policy->cpus);
		cpumask_set_cpu(cpu, policy->cpus);
		cpumask_copy(data->freqdomain_cpus,
			     topology_sibling_cpumask(cpu));
		policy->shared_type = CPUFREQ_SHARED_TYPE_HW;
		pr_info_once(PFX "overriding BIOS provided _PSD data\n");
	}
#endif

	/* capability check */
	if (perf->state_count <= 1) {
		pr_debug("No P-States\n");
		result = -ENODEV;
		goto err_unreg;
	}

	if (perf->control_register.space_id != perf->status_register.space_id) {
		result = -ENODEV;
		goto err_unreg;
	}

	switch (perf->control_register.space_id) {
	case ACPI_ADR_SPACE_SYSTEM_IO:
		if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD &&
		    boot_cpu_data.x86 == 0xf) {
			pr_debug("AMD K8 systems must use native drivers.\n");
			result = -ENODEV;
			goto err_unreg;
		}
		pr_debug("SYSTEM IO addr space\n");
		data->cpu_feature = SYSTEM_IO_CAPABLE;
		break;
	case ACPI_ADR_SPACE_FIXED_HARDWARE:
		pr_debug("HARDWARE addr space\n");
		if (check_est_cpu(cpu)) {
			data->cpu_feature = SYSTEM_INTEL_MSR_CAPABLE;
			break;
		}
		if (check_amd_hwpstate_cpu(cpu)) {
			data->cpu_feature = SYSTEM_AMD_MSR_CAPABLE;
			break;
		}
		result = -ENODEV;
		goto err_unreg;
	default:
		pr_debug("Unknown addr space %d\n",
			 (u32) (perf->control_register.space_id));
		result = -ENODEV;
		goto err_unreg;
	}

	data->freq_table = kzalloc(sizeof(*data->freq_table) *
		    (perf->state_count+1), GFP_KERNEL);
	if (!data->freq_table) {
		result = -ENOMEM;
		goto err_unreg;
	}

	/* detect transition latency */
	policy->cpuinfo.transition_latency = 0;
	for (i = 0; i < perf->state_count; i++) {
		if ((perf->states[i].transition_latency * 1000) >
		    policy->cpuinfo.transition_latency)
			policy->cpuinfo.transition_latency =
			    perf->states[i].transition_latency * 1000;
	}

	/* Check for high latency (>20uS) from buggy BIOSes, like on T42 */
	if (perf->control_register.space_id == ACPI_ADR_SPACE_FIXED_HARDWARE &&
	    policy->cpuinfo.transition_latency > 20 * 1000) {
		policy->cpuinfo.transition_latency = 20 * 1000;
		printk_once(KERN_INFO
			    "P-state transition latency capped at 20 uS\n");
	}

	/* table init */
	for (i = 0; i < perf->state_count; i++) {
		if (i > 0 && perf->states[i].core_frequency >=
		    data->freq_table[valid_states-1].frequency / 1000)
			continue;

		data->freq_table[valid_states].driver_data = i;
		data->freq_table[valid_states].frequency =
		    perf->states[i].core_frequency * 1000;
		valid_states++;
	}
	data->freq_table[valid_states].frequency = CPUFREQ_TABLE_END;
	perf->state = 0;

	result = cpufreq_table_validate_and_show(policy, data->freq_table);
	if (result)
		goto err_freqfree;

	if (perf->states[0].core_frequency * 1000 != policy->cpuinfo.max_freq)
		printk(KERN_WARNING FW_WARN "P-state 0 is not max freq\n");

	switch (perf->control_register.space_id) {
	case ACPI_ADR_SPACE_SYSTEM_IO:
		/*
		 * The core will not set policy->cur, because
		 * cpufreq_driver->get is NULL, so we need to set it here.
		 * However, we have to guess it, because the current speed is
		 * unknown and not detectable via IO ports.
		 */
		policy->cur = acpi_cpufreq_guess_freq(data, policy->cpu);
		break;
	case ACPI_ADR_SPACE_FIXED_HARDWARE:
		acpi_cpufreq_driver.get = get_cur_freq_on_cpu;
		break;
	default:
		break;
	}

	/* notify BIOS that we exist */
	acpi_processor_notify_smm(THIS_MODULE);

	pr_debug("CPU%u - ACPI performance management activated.\n", cpu);
	for (i = 0; i < perf->state_count; i++)
		pr_debug("     %cP%d: %d MHz, %d mW, %d uS\n",
			(i == perf->state ? '*' : ' '), i,
			(u32) perf->states[i].core_frequency,
			(u32) perf->states[i].power,
			(u32) perf->states[i].transition_latency);

	/*
	 * the first call to ->target() should result in us actually
	 * writing something to the appropriate registers.
	 */
	data->resume = 1;

	return result;

err_freqfree:
	kfree(data->freq_table);
err_unreg:
	acpi_processor_unregister_performance(perf, cpu);
err_free_mask:
	free_cpumask_var(data->freqdomain_cpus);
err_free:
	kfree(data);
	policy->driver_data = NULL;

	return result;
}

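/*
 * Undo acpi_cpufreq_cpu_init(): deregister from the ACPI perflib and
 * free the per-policy data.
 */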
static int acpi_cpufreq_cpu_exit(struct cpufreq_policy *policy)
{
	struct acpi_cpufreq_data *data = policy->driver_data;

	pr_debug("acpi_cpufreq_cpu_exit\n");

	if (data) {
		policy->driver_data = NULL;
		acpi_processor_unregister_performance(data->acpi_data,
						      policy->cpu);
		free_cpumask_var(data->freqdomain_cpus);
		kfree(data->freq_table);
		kfree(data);
	}

	return 0;
}

static int acpi_cpufreq_resume(struct cpufreq_policy *policy)
{
	struct acpi_cpufreq_data *data = policy->driver_data;

	pr_debug("acpi_cpufreq_resume\n");

	data->resume = 1;

	return 0;
}

static struct freq_attr *acpi_cpufreq_attr[] = {
	&cpufreq_freq_attr_scaling_available_freqs,
	&freqdomain_cpus,
	NULL,	/* this is a placeholder for cpb, do not remove */
	NULL,
};

static struct cpufreq_driver acpi_cpufreq_driver = {
	.verify		= cpufreq_generic_frequency_table_verify,
	.target_index	= acpi_cpufreq_target,
	.bios_limit	= acpi_processor_get_bios_limit,
	.init		= acpi_cpufreq_cpu_init,
	.exit		= acpi_cpufreq_cpu_exit,
	.resume		= acpi_cpufreq_resume,
	.name		= "acpi-cpufreq",
	.attr		= acpi_cpufreq_attr,
	.set_boost	= _store_boost,
};

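/*
 * Advertise boost control when the CPU supports it (CPB on AMD, IDA on
 * Intel), and force every CPU to a consistent initial boost state.
 */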
static void __init acpi_cpufreq_boost_init(void)
{
	if (boot_cpu_has(X86_FEATURE_CPB) || boot_cpu_has(X86_FEATURE_IDA)) {
		msrs = msrs_alloc();

		if (!msrs)
			return;

		acpi_cpufreq_driver.boost_supported = true;
		acpi_cpufreq_driver.boost_enabled = boost_state(0);

		cpu_notifier_register_begin();

		/* Force all MSRs to the same value */
		boost_set_msrs(acpi_cpufreq_driver.boost_enabled,
			       cpu_online_mask);

		__register_cpu_notifier(&boost_nb);

		cpu_notifier_register_done();
	}
}

static void acpi_cpufreq_boost_exit(void)
{
	if (msrs) {
		unregister_cpu_notifier(&boost_nb);

		msrs_free(msrs);
		msrs = NULL;
	}
}

static int __init acpi_cpufreq_init(void)
{
	int ret;

	if (acpi_disabled)
		return -ENODEV;

	/* don't keep reloading if cpufreq_driver exists */
	if (cpufreq_get_current_driver())
		return -EEXIST;

	pr_debug("acpi_cpufreq_init\n");

	ret = acpi_cpufreq_early_init();
	if (ret)
		return ret;

#ifdef CONFIG_X86_ACPI_CPUFREQ_CPB
	/* this is a sysfs file with a strange name and an even stranger
	 * semantic - per CPU instantiation, but system global effect.
	 * Let's enable it only on AMD CPUs for compatibility reasons and
	 * only if configured. This is considered legacy code, which
	 * will probably be removed at some point in the future.
	 */
	if (check_amd_hwpstate_cpu(0)) {
		struct freq_attr **iter;

		pr_debug("adding sysfs entry for cpb\n");

		for (iter = acpi_cpufreq_attr; *iter != NULL; iter++)
			;

		/* make sure there is a terminator behind it */
		if (iter[1] == NULL)
			*iter = &cpb;
	}
#endif
	acpi_cpufreq_boost_init();

	ret = cpufreq_register_driver(&acpi_cpufreq_driver);
	if (ret) {
		free_acpi_perf_data();
		acpi_cpufreq_boost_exit();
	}
	return ret;
}

static void __exit acpi_cpufreq_exit(void)
{
	pr_debug("acpi_cpufreq_exit\n");

	acpi_cpufreq_boost_exit();

	cpufreq_unregister_driver(&acpi_cpufreq_driver);

	free_acpi_perf_data();
}

module_param(acpi_pstate_strict, uint, 0644);
MODULE_PARM_DESC(acpi_pstate_strict,
	"value 0 or non-zero. non-zero -> strict ACPI checks are "
	"performed during frequency changes.");

late_initcall(acpi_cpufreq_init);
module_exit(acpi_cpufreq_exit);

static const struct x86_cpu_id acpi_cpufreq_ids[] = {
	X86_FEATURE_MATCH(X86_FEATURE_ACPI),
	X86_FEATURE_MATCH(X86_FEATURE_HW_PSTATE),
	{}
};
MODULE_DEVICE_TABLE(x86cpu, acpi_cpufreq_ids);

static const struct acpi_device_id processor_device_ids[] = {
	{ACPI_PROCESSOR_OBJECT_HID, },
	{ACPI_PROCESSOR_DEVICE_HID, },
	{},
};
MODULE_DEVICE_TABLE(acpi, processor_device_ids);

MODULE_ALIAS("acpi");