]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - drivers/hwmon/coretemp.c
Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/viro/audit
[mirror_ubuntu-artful-kernel.git] / drivers / hwmon / coretemp.c
CommitLineData
bebe4678
RM
1/*
2 * coretemp.c - Linux kernel module for hardware monitoring
3 *
4 * Copyright (C) 2007 Rudolf Marek <r.marek@assembler.cz>
5 *
6 * Inspired from many hwmon drivers
7 *
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; version 2 of the License.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
20 * 02110-1301 USA.
21 */
22
f8bb8925
JP
23#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
24
bebe4678 25#include <linux/module.h>
bebe4678
RM
26#include <linux/init.h>
27#include <linux/slab.h>
28#include <linux/jiffies.h>
29#include <linux/hwmon.h>
30#include <linux/sysfs.h>
31#include <linux/hwmon-sysfs.h>
32#include <linux/err.h>
33#include <linux/mutex.h>
34#include <linux/list.h>
35#include <linux/platform_device.h>
36#include <linux/cpu.h>
1fe63ab4 37#include <linux/pci.h>
4cc45275 38#include <linux/smp.h>
a45a8c85 39#include <linux/moduleparam.h>
bebe4678
RM
40#include <asm/msr.h>
41#include <asm/processor.h>
42
43#define DRVNAME "coretemp"
44
a45a8c85
JD
45/*
46 * force_tjmax only matters when TjMax can't be read from the CPU itself.
47 * When set, it replaces the driver's suboptimal heuristic.
48 */
49static int force_tjmax;
50module_param_named(tjmax, force_tjmax, int, 0444);
51MODULE_PARM_DESC(tjmax, "TjMax value in degrees Celsius");
52
199e0de7
D
#define BASE_SYSFS_ATTR_NO	2	/* Sysfs Base attr no for coretemp */
#define NUM_REAL_CORES		16	/* Number of Real cores per cpu */
/*
 * Buffer size for one attribute name. The longest template is
 * "temp%d_crit_alarm"; with a two-digit index (the largest index is
 * MAX_CORE_DATA - 1) that is 17 characters plus the terminating NUL,
 * so 17 bytes would truncate the name.
 */
#define CORETEMP_NAME_LENGTH	19	/* String Length of attrs */
#define MAX_CORE_ATTRS		4	/* Maximum no of basic attrs */
#define TOTAL_ATTRS		(MAX_CORE_ATTRS + 1)
#define MAX_CORE_DATA		(NUM_REAL_CORES + BASE_SYSFS_ATTR_NO)
59
199e0de7
D
/* Physical package id and core id of a logical CPU, taken from cpu_data() */
#define TO_PHYS_ID(cpu)		(cpu_data(cpu).phys_proc_id)
#define TO_CORE_ID(cpu)		(cpu_data(cpu).cpu_core_id)
/* Index of a core's sensor: its core id shifted by BASE_SYSFS_ATTR_NO */
#define TO_ATTR_NO(cpu)		(TO_CORE_ID(cpu) + BASE_SYSFS_ATTR_NO)

/* Walk the siblings of @cpu; the loop body never runs without CONFIG_SMP */
#ifdef CONFIG_SMP
#define for_each_sibling(i, cpu)	for_each_cpu(i, cpu_sibling_mask(cpu))
#else
#define for_each_sibling(i, cpu)	for (i = 0; false; )
#endif
bebe4678
RM
69
70/*
199e0de7
D
71 * Per-Core Temperature Data
72 * @last_updated: The time when the current temperature value was updated
73 * earlier (in jiffies).
74 * @cpu_core_id: The CPU Core from which temperature values should be read
75 * This value is passed as "id" field to rdmsr/wrmsr functions.
76 * @status_reg: One of IA32_THERM_STATUS or IA32_PACKAGE_THERM_STATUS,
77 * from where the temperature values should be read.
c814a4c7 78 * @attr_size: Total number of pre-core attrs displayed in the sysfs.
199e0de7
D
79 * @is_pkg_data: If this is 1, the temp_data holds pkgtemp data.
80 * Otherwise, temp_data holds coretemp data.
81 * @valid: If this is 1, the current temperature is valid.
bebe4678 82 */
199e0de7 83struct temp_data {
bebe4678 84 int temp;
6369a288 85 int ttarget;
199e0de7
D
86 int tjmax;
87 unsigned long last_updated;
88 unsigned int cpu;
89 u32 cpu_core_id;
90 u32 status_reg;
c814a4c7 91 int attr_size;
199e0de7
D
92 bool is_pkg_data;
93 bool valid;
c814a4c7
D
94 struct sensor_device_attribute sd_attrs[TOTAL_ATTRS];
95 char attr_name[TOTAL_ATTRS][CORETEMP_NAME_LENGTH];
199e0de7 96 struct mutex update_lock;
bebe4678
RM
97};
98
199e0de7
D
99/* Platform Data per Physical CPU */
100struct platform_data {
101 struct device *hwmon_dev;
102 u16 phys_proc_id;
103 struct temp_data *core_data[MAX_CORE_DATA];
104 struct device_attribute name_attr;
105};
bebe4678 106
199e0de7
D
107struct pdev_entry {
108 struct list_head list;
109 struct platform_device *pdev;
199e0de7 110 u16 phys_proc_id;
199e0de7
D
111};
112
113static LIST_HEAD(pdev_list);
114static DEFINE_MUTEX(pdev_list_mutex);
115
116static ssize_t show_name(struct device *dev,
117 struct device_attribute *devattr, char *buf)
118{
119 return sprintf(buf, "%s\n", DRVNAME);
120}
121
122static ssize_t show_label(struct device *dev,
123 struct device_attribute *devattr, char *buf)
bebe4678 124{
bebe4678 125 struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
199e0de7
D
126 struct platform_data *pdata = dev_get_drvdata(dev);
127 struct temp_data *tdata = pdata->core_data[attr->index];
128
129 if (tdata->is_pkg_data)
130 return sprintf(buf, "Physical id %u\n", pdata->phys_proc_id);
bebe4678 131
199e0de7 132 return sprintf(buf, "Core %u\n", tdata->cpu_core_id);
bebe4678
RM
133}
134
199e0de7
D
135static ssize_t show_crit_alarm(struct device *dev,
136 struct device_attribute *devattr, char *buf)
bebe4678 137{
199e0de7
D
138 u32 eax, edx;
139 struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
140 struct platform_data *pdata = dev_get_drvdata(dev);
141 struct temp_data *tdata = pdata->core_data[attr->index];
142
143 rdmsr_on_cpu(tdata->cpu, tdata->status_reg, &eax, &edx);
144
145 return sprintf(buf, "%d\n", (eax >> 5) & 1);
bebe4678
RM
146}
147
199e0de7
D
148static ssize_t show_tjmax(struct device *dev,
149 struct device_attribute *devattr, char *buf)
bebe4678
RM
150{
151 struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
199e0de7 152 struct platform_data *pdata = dev_get_drvdata(dev);
bebe4678 153
199e0de7 154 return sprintf(buf, "%d\n", pdata->core_data[attr->index]->tjmax);
bebe4678
RM
155}
156
199e0de7
D
157static ssize_t show_ttarget(struct device *dev,
158 struct device_attribute *devattr, char *buf)
159{
160 struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
161 struct platform_data *pdata = dev_get_drvdata(dev);
bebe4678 162
199e0de7
D
163 return sprintf(buf, "%d\n", pdata->core_data[attr->index]->ttarget);
164}
bebe4678 165
199e0de7
D
166static ssize_t show_temp(struct device *dev,
167 struct device_attribute *devattr, char *buf)
bebe4678 168{
199e0de7
D
169 u32 eax, edx;
170 struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
171 struct platform_data *pdata = dev_get_drvdata(dev);
172 struct temp_data *tdata = pdata->core_data[attr->index];
bebe4678 173
199e0de7 174 mutex_lock(&tdata->update_lock);
bebe4678 175
199e0de7
D
176 /* Check whether the time interval has elapsed */
177 if (!tdata->valid || time_after(jiffies, tdata->last_updated + HZ)) {
178 rdmsr_on_cpu(tdata->cpu, tdata->status_reg, &eax, &edx);
179 tdata->valid = 0;
180 /* Check whether the data is valid */
bebe4678 181 if (eax & 0x80000000) {
199e0de7 182 tdata->temp = tdata->tjmax -
4cc45275 183 ((eax >> 16) & 0x7f) * 1000;
199e0de7 184 tdata->valid = 1;
bebe4678 185 }
199e0de7 186 tdata->last_updated = jiffies;
bebe4678
RM
187 }
188
199e0de7
D
189 mutex_unlock(&tdata->update_lock);
190 return tdata->valid ? sprintf(buf, "%d\n", tdata->temp) : -EAGAIN;
bebe4678
RM
191}
192
d6db23c7
JD
193static int __cpuinit adjust_tjmax(struct cpuinfo_x86 *c, u32 id,
194 struct device *dev)
118a8871
RM
195{
196 /* The 100C is default for both mobile and non mobile CPUs */
197
198 int tjmax = 100000;
eccfed42 199 int tjmax_ee = 85000;
708a62bc 200 int usemsr_ee = 1;
118a8871
RM
201 int err;
202 u32 eax, edx;
1fe63ab4 203 struct pci_dev *host_bridge;
118a8871
RM
204
205 /* Early chips have no MSR for TjMax */
206
4cc45275 207 if (c->x86_model == 0xf && c->x86_mask < 4)
708a62bc 208 usemsr_ee = 0;
118a8871 209
1fe63ab4 210 /* Atom CPUs */
708a62bc
RM
211
212 if (c->x86_model == 0x1c) {
213 usemsr_ee = 0;
1fe63ab4
YW
214
215 host_bridge = pci_get_bus_and_slot(0, PCI_DEVFN(0, 0));
216
217 if (host_bridge && host_bridge->vendor == PCI_VENDOR_ID_INTEL
218 && (host_bridge->device == 0xa000 /* NM10 based nettop */
219 || host_bridge->device == 0xa010)) /* NM10 based netbook */
220 tjmax = 100000;
221 else
222 tjmax = 90000;
223
224 pci_dev_put(host_bridge);
708a62bc
RM
225 }
226
4cc45275 227 if (c->x86_model > 0xe && usemsr_ee) {
eccfed42 228 u8 platform_id;
118a8871 229
4cc45275
GR
230 /*
231 * Now we can detect the mobile CPU using Intel provided table
232 * http://softwarecommunity.intel.com/Wiki/Mobility/720.htm
233 * For Core2 cores, check MSR 0x17, bit 28 1 = Mobile CPU
234 */
118a8871
RM
235 err = rdmsr_safe_on_cpu(id, 0x17, &eax, &edx);
236 if (err) {
237 dev_warn(dev,
238 "Unable to access MSR 0x17, assuming desktop"
239 " CPU\n");
708a62bc 240 usemsr_ee = 0;
eccfed42 241 } else if (c->x86_model < 0x17 && !(eax & 0x10000000)) {
4cc45275
GR
242 /*
243 * Trust bit 28 up to Penryn, I could not find any
244 * documentation on that; if you happen to know
245 * someone at Intel please ask
246 */
708a62bc 247 usemsr_ee = 0;
eccfed42
RM
248 } else {
249 /* Platform ID bits 52:50 (EDX starts at bit 32) */
250 platform_id = (edx >> 18) & 0x7;
251
4cc45275
GR
252 /*
253 * Mobile Penryn CPU seems to be platform ID 7 or 5
254 * (guesswork)
255 */
256 if (c->x86_model == 0x17 &&
257 (platform_id == 5 || platform_id == 7)) {
258 /*
259 * If MSR EE bit is set, set it to 90 degrees C,
260 * otherwise 105 degrees C
261 */
eccfed42
RM
262 tjmax_ee = 90000;
263 tjmax = 105000;
264 }
118a8871
RM
265 }
266 }
267
708a62bc 268 if (usemsr_ee) {
118a8871
RM
269 err = rdmsr_safe_on_cpu(id, 0xee, &eax, &edx);
270 if (err) {
271 dev_warn(dev,
272 "Unable to access MSR 0xEE, for Tjmax, left"
4d7a5644 273 " at default\n");
118a8871 274 } else if (eax & 0x40000000) {
eccfed42 275 tjmax = tjmax_ee;
118a8871 276 }
708a62bc 277 } else if (tjmax == 100000) {
4cc45275
GR
278 /*
279 * If we don't use msr EE it means we are desktop CPU
280 * (with exeception of Atom)
281 */
118a8871
RM
282 dev_warn(dev, "Using relative temperature scale!\n");
283 }
284
285 return tjmax;
286}
287
d6db23c7
JD
288static int __cpuinit get_tjmax(struct cpuinfo_x86 *c, u32 id,
289 struct device *dev)
a321cedb 290{
a321cedb
CE
291 int err;
292 u32 eax, edx;
293 u32 val;
294
4cc45275
GR
295 /*
296 * A new feature of current Intel(R) processors, the
297 * IA32_TEMPERATURE_TARGET contains the TjMax value
298 */
a321cedb
CE
299 err = rdmsr_safe_on_cpu(id, MSR_IA32_TEMPERATURE_TARGET, &eax, &edx);
300 if (err) {
6bf9e9b0
JD
301 if (c->x86_model > 0xe && c->x86_model != 0x1c)
302 dev_warn(dev, "Unable to read TjMax from CPU %u\n", id);
a321cedb
CE
303 } else {
304 val = (eax >> 16) & 0xff;
305 /*
306 * If the TjMax is not plausible, an assumption
307 * will be used
308 */
bb9973e4 309 if (val) {
6bf9e9b0 310 dev_dbg(dev, "TjMax is %d degrees C\n", val);
a321cedb
CE
311 return val * 1000;
312 }
313 }
314
a45a8c85
JD
315 if (force_tjmax) {
316 dev_notice(dev, "TjMax forced to %d degrees C by user\n",
317 force_tjmax);
318 return force_tjmax * 1000;
319 }
320
a321cedb
CE
321 /*
322 * An assumption is made for early CPUs and unreadable MSR.
4f5f71a7 323 * NOTE: the calculated value may not be correct.
a321cedb 324 */
4f5f71a7 325 return adjust_tjmax(c, id, dev);
a321cedb
CE
326}
327
d6db23c7
JD
328static int __devinit create_name_attr(struct platform_data *pdata,
329 struct device *dev)
199e0de7 330{
4258781a 331 sysfs_attr_init(&pdata->name_attr.attr);
199e0de7
D
332 pdata->name_attr.attr.name = "name";
333 pdata->name_attr.attr.mode = S_IRUGO;
334 pdata->name_attr.show = show_name;
335 return device_create_file(dev, &pdata->name_attr);
336}
bebe4678 337
d6db23c7
JD
338static int __cpuinit create_core_attrs(struct temp_data *tdata,
339 struct device *dev, int attr_no)
199e0de7
D
340{
341 int err, i;
e3204ed3 342 static ssize_t (*const rd_ptr[TOTAL_ATTRS]) (struct device *dev,
199e0de7 343 struct device_attribute *devattr, char *buf) = {
c814a4c7 344 show_label, show_crit_alarm, show_temp, show_tjmax,
f4af6fd6 345 show_ttarget };
e3204ed3 346 static const char *const names[TOTAL_ATTRS] = {
199e0de7 347 "temp%d_label", "temp%d_crit_alarm",
c814a4c7 348 "temp%d_input", "temp%d_crit",
f4af6fd6 349 "temp%d_max" };
199e0de7 350
c814a4c7 351 for (i = 0; i < tdata->attr_size; i++) {
199e0de7
D
352 snprintf(tdata->attr_name[i], CORETEMP_NAME_LENGTH, names[i],
353 attr_no);
4258781a 354 sysfs_attr_init(&tdata->sd_attrs[i].dev_attr.attr);
199e0de7
D
355 tdata->sd_attrs[i].dev_attr.attr.name = tdata->attr_name[i];
356 tdata->sd_attrs[i].dev_attr.attr.mode = S_IRUGO;
357 tdata->sd_attrs[i].dev_attr.show = rd_ptr[i];
199e0de7
D
358 tdata->sd_attrs[i].index = attr_no;
359 err = device_create_file(dev, &tdata->sd_attrs[i].dev_attr);
360 if (err)
361 goto exit_free;
bebe4678 362 }
199e0de7
D
363 return 0;
364
365exit_free:
366 while (--i >= 0)
367 device_remove_file(dev, &tdata->sd_attrs[i].dev_attr);
368 return err;
369}
370
199e0de7 371
0eb9782a 372static int __cpuinit chk_ucode_version(unsigned int cpu)
199e0de7 373{
0eb9782a 374 struct cpuinfo_x86 *c = &cpu_data(cpu);
67f363b1 375
199e0de7
D
376 /*
377 * Check if we have problem with errata AE18 of Core processors:
378 * Readings might stop update when processor visited too deep sleep,
379 * fixed for stepping D0 (6EC).
380 */
ca8bc8dc
AK
381 if (c->x86_model == 0xe && c->x86_mask < 0xc && c->microcode < 0x39) {
382 pr_err("Errata AE18 not fixed, update BIOS or "
383 "microcode of the CPU!\n");
384 return -ENODEV;
67f363b1 385 }
199e0de7
D
386 return 0;
387}
388
d6db23c7 389static struct platform_device __cpuinit *coretemp_get_pdev(unsigned int cpu)
199e0de7
D
390{
391 u16 phys_proc_id = TO_PHYS_ID(cpu);
392 struct pdev_entry *p;
393
394 mutex_lock(&pdev_list_mutex);
395
396 list_for_each_entry(p, &pdev_list, list)
397 if (p->phys_proc_id == phys_proc_id) {
398 mutex_unlock(&pdev_list_mutex);
399 return p->pdev;
400 }
401
402 mutex_unlock(&pdev_list_mutex);
403 return NULL;
404}
405
d6db23c7
JD
406static struct temp_data __cpuinit *init_temp_data(unsigned int cpu,
407 int pkg_flag)
199e0de7
D
408{
409 struct temp_data *tdata;
410
411 tdata = kzalloc(sizeof(struct temp_data), GFP_KERNEL);
412 if (!tdata)
413 return NULL;
414
415 tdata->status_reg = pkg_flag ? MSR_IA32_PACKAGE_THERM_STATUS :
416 MSR_IA32_THERM_STATUS;
417 tdata->is_pkg_data = pkg_flag;
418 tdata->cpu = cpu;
419 tdata->cpu_core_id = TO_CORE_ID(cpu);
c814a4c7 420 tdata->attr_size = MAX_CORE_ATTRS;
199e0de7
D
421 mutex_init(&tdata->update_lock);
422 return tdata;
423}
67f363b1 424
d6db23c7 425static int __cpuinit create_core_data(struct platform_device *pdev,
199e0de7
D
426 unsigned int cpu, int pkg_flag)
427{
428 struct temp_data *tdata;
2f1c3db0 429 struct platform_data *pdata = platform_get_drvdata(pdev);
199e0de7
D
430 struct cpuinfo_x86 *c = &cpu_data(cpu);
431 u32 eax, edx;
432 int err, attr_no;
bebe4678 433
a321cedb 434 /*
199e0de7
D
435 * Find attr number for sysfs:
436 * We map the attr number to core id of the CPU
437 * The attr number is always core id + 2
438 * The Pkgtemp will always show up as temp1_*, if available
a321cedb 439 */
199e0de7 440 attr_no = pkg_flag ? 1 : TO_ATTR_NO(cpu);
6369a288 441
199e0de7
D
442 if (attr_no > MAX_CORE_DATA - 1)
443 return -ERANGE;
444
f4e0bcf0
GR
445 /*
446 * Provide a single set of attributes for all HT siblings of a core
447 * to avoid duplicate sensors (the processor ID and core ID of all
6777b9e4
GR
448 * HT siblings of a core are the same).
449 * Skip if a HT sibling of this core is already registered.
f4e0bcf0
GR
450 * This is not an error.
451 */
199e0de7
D
452 if (pdata->core_data[attr_no] != NULL)
453 return 0;
6369a288 454
199e0de7
D
455 tdata = init_temp_data(cpu, pkg_flag);
456 if (!tdata)
457 return -ENOMEM;
bebe4678 458
199e0de7
D
459 /* Test if we can access the status register */
460 err = rdmsr_safe_on_cpu(cpu, tdata->status_reg, &eax, &edx);
461 if (err)
462 goto exit_free;
463
464 /* We can access status register. Get Critical Temperature */
6bf9e9b0 465 tdata->tjmax = get_tjmax(c, cpu, &pdev->dev);
199e0de7 466
c814a4c7 467 /*
f4af6fd6
GR
468 * Read the still undocumented bits 8:15 of IA32_TEMPERATURE_TARGET.
469 * The target temperature is available on older CPUs but not in this
470 * register. Atoms don't have the register at all.
c814a4c7 471 */
f4af6fd6
GR
472 if (c->x86_model > 0xe && c->x86_model != 0x1c) {
473 err = rdmsr_safe_on_cpu(cpu, MSR_IA32_TEMPERATURE_TARGET,
474 &eax, &edx);
475 if (!err) {
476 tdata->ttarget
477 = tdata->tjmax - ((eax >> 8) & 0xff) * 1000;
478 tdata->attr_size++;
479 }
c814a4c7
D
480 }
481
199e0de7
D
482 pdata->core_data[attr_no] = tdata;
483
484 /* Create sysfs interfaces */
485 err = create_core_attrs(tdata, &pdev->dev, attr_no);
486 if (err)
487 goto exit_free;
bebe4678
RM
488
489 return 0;
199e0de7 490exit_free:
20ecb499 491 pdata->core_data[attr_no] = NULL;
199e0de7
D
492 kfree(tdata);
493 return err;
494}
495
d6db23c7 496static void __cpuinit coretemp_add_core(unsigned int cpu, int pkg_flag)
199e0de7 497{
199e0de7
D
498 struct platform_device *pdev = coretemp_get_pdev(cpu);
499 int err;
500
501 if (!pdev)
502 return;
503
2f1c3db0 504 err = create_core_data(pdev, cpu, pkg_flag);
199e0de7
D
505 if (err)
506 dev_err(&pdev->dev, "Adding Core %u failed\n", cpu);
507}
508
509static void coretemp_remove_core(struct platform_data *pdata,
510 struct device *dev, int indx)
511{
512 int i;
513 struct temp_data *tdata = pdata->core_data[indx];
514
515 /* Remove the sysfs attributes */
c814a4c7 516 for (i = 0; i < tdata->attr_size; i++)
199e0de7
D
517 device_remove_file(dev, &tdata->sd_attrs[i].dev_attr);
518
519 kfree(pdata->core_data[indx]);
520 pdata->core_data[indx] = NULL;
521}
522
523static int __devinit coretemp_probe(struct platform_device *pdev)
524{
525 struct platform_data *pdata;
526 int err;
bebe4678 527
199e0de7
D
528 /* Initialize the per-package data structures */
529 pdata = kzalloc(sizeof(struct platform_data), GFP_KERNEL);
530 if (!pdata)
531 return -ENOMEM;
532
533 err = create_name_attr(pdata, &pdev->dev);
534 if (err)
535 goto exit_free;
536
b3a242a6 537 pdata->phys_proc_id = pdev->id;
199e0de7
D
538 platform_set_drvdata(pdev, pdata);
539
540 pdata->hwmon_dev = hwmon_device_register(&pdev->dev);
541 if (IS_ERR(pdata->hwmon_dev)) {
542 err = PTR_ERR(pdata->hwmon_dev);
543 dev_err(&pdev->dev, "Class registration failed (%d)\n", err);
544 goto exit_name;
545 }
546 return 0;
547
548exit_name:
549 device_remove_file(&pdev->dev, &pdata->name_attr);
550 platform_set_drvdata(pdev, NULL);
bebe4678 551exit_free:
199e0de7 552 kfree(pdata);
bebe4678
RM
553 return err;
554}
555
556static int __devexit coretemp_remove(struct platform_device *pdev)
557{
199e0de7
D
558 struct platform_data *pdata = platform_get_drvdata(pdev);
559 int i;
bebe4678 560
199e0de7
D
561 for (i = MAX_CORE_DATA - 1; i >= 0; --i)
562 if (pdata->core_data[i])
563 coretemp_remove_core(pdata, &pdev->dev, i);
564
565 device_remove_file(&pdev->dev, &pdata->name_attr);
566 hwmon_device_unregister(pdata->hwmon_dev);
bebe4678 567 platform_set_drvdata(pdev, NULL);
199e0de7 568 kfree(pdata);
bebe4678
RM
569 return 0;
570}
571
572static struct platform_driver coretemp_driver = {
573 .driver = {
574 .owner = THIS_MODULE,
575 .name = DRVNAME,
576 },
577 .probe = coretemp_probe,
578 .remove = __devexit_p(coretemp_remove),
579};
580
bebe4678
RM
581static int __cpuinit coretemp_device_add(unsigned int cpu)
582{
583 int err;
584 struct platform_device *pdev;
585 struct pdev_entry *pdev_entry;
d883b9f0
JD
586
587 mutex_lock(&pdev_list_mutex);
588
b3a242a6 589 pdev = platform_device_alloc(DRVNAME, TO_PHYS_ID(cpu));
bebe4678
RM
590 if (!pdev) {
591 err = -ENOMEM;
f8bb8925 592 pr_err("Device allocation failed\n");
bebe4678
RM
593 goto exit;
594 }
595
596 pdev_entry = kzalloc(sizeof(struct pdev_entry), GFP_KERNEL);
597 if (!pdev_entry) {
598 err = -ENOMEM;
599 goto exit_device_put;
600 }
601
602 err = platform_device_add(pdev);
603 if (err) {
f8bb8925 604 pr_err("Device addition failed (%d)\n", err);
bebe4678
RM
605 goto exit_device_free;
606 }
607
608 pdev_entry->pdev = pdev;
0eb9782a 609 pdev_entry->phys_proc_id = pdev->id;
199e0de7 610
bebe4678
RM
611 list_add_tail(&pdev_entry->list, &pdev_list);
612 mutex_unlock(&pdev_list_mutex);
613
614 return 0;
615
616exit_device_free:
617 kfree(pdev_entry);
618exit_device_put:
619 platform_device_put(pdev);
620exit:
d883b9f0 621 mutex_unlock(&pdev_list_mutex);
bebe4678
RM
622 return err;
623}
624
d6db23c7 625static void __cpuinit coretemp_device_remove(unsigned int cpu)
bebe4678 626{
199e0de7
D
627 struct pdev_entry *p, *n;
628 u16 phys_proc_id = TO_PHYS_ID(cpu);
e40cc4bd 629
bebe4678 630 mutex_lock(&pdev_list_mutex);
199e0de7
D
631 list_for_each_entry_safe(p, n, &pdev_list, list) {
632 if (p->phys_proc_id != phys_proc_id)
e40cc4bd 633 continue;
e40cc4bd
JB
634 platform_device_unregister(p->pdev);
635 list_del(&p->list);
e40cc4bd 636 kfree(p);
bebe4678
RM
637 }
638 mutex_unlock(&pdev_list_mutex);
639}
640
d6db23c7 641static bool __cpuinit is_any_core_online(struct platform_data *pdata)
199e0de7
D
642{
643 int i;
644
645 /* Find online cores, except pkgtemp data */
646 for (i = MAX_CORE_DATA - 1; i >= 0; --i) {
647 if (pdata->core_data[i] &&
648 !pdata->core_data[i]->is_pkg_data) {
649 return true;
650 }
651 }
652 return false;
653}
654
655static void __cpuinit get_core_online(unsigned int cpu)
656{
657 struct cpuinfo_x86 *c = &cpu_data(cpu);
658 struct platform_device *pdev = coretemp_get_pdev(cpu);
659 int err;
660
661 /*
662 * CPUID.06H.EAX[0] indicates whether the CPU has thermal
663 * sensors. We check this bit only, all the early CPUs
664 * without thermal sensors will be filtered out.
665 */
666 if (!cpu_has(c, X86_FEATURE_DTS))
667 return;
668
669 if (!pdev) {
0eb9782a
JD
670 /* Check the microcode version of the CPU */
671 if (chk_ucode_version(cpu))
672 return;
673
199e0de7
D
674 /*
675 * Alright, we have DTS support.
676 * We are bringing the _first_ core in this pkg
677 * online. So, initialize per-pkg data structures and
678 * then bring this core online.
679 */
680 err = coretemp_device_add(cpu);
681 if (err)
682 return;
683 /*
684 * Check whether pkgtemp support is available.
685 * If so, add interfaces for pkgtemp.
686 */
687 if (cpu_has(c, X86_FEATURE_PTS))
688 coretemp_add_core(cpu, 1);
689 }
690 /*
691 * Physical CPU device already exists.
692 * So, just add interfaces for this core.
693 */
694 coretemp_add_core(cpu, 0);
695}
696
697static void __cpuinit put_core_offline(unsigned int cpu)
698{
699 int i, indx;
700 struct platform_data *pdata;
701 struct platform_device *pdev = coretemp_get_pdev(cpu);
702
703 /* If the physical CPU device does not exist, just return */
704 if (!pdev)
705 return;
706
707 pdata = platform_get_drvdata(pdev);
708
709 indx = TO_ATTR_NO(cpu);
710
711 if (pdata->core_data[indx] && pdata->core_data[indx]->cpu == cpu)
712 coretemp_remove_core(pdata, &pdev->dev, indx);
713
f4e0bcf0 714 /*
6777b9e4
GR
715 * If a HT sibling of a core is taken offline, but another HT sibling
716 * of the same core is still online, register the alternate sibling.
717 * This ensures that exactly one set of attributes is provided as long
718 * as at least one HT sibling of a core is online.
f4e0bcf0 719 */
bb74e8ca 720 for_each_sibling(i, cpu) {
199e0de7
D
721 if (i != cpu) {
722 get_core_online(i);
f4e0bcf0
GR
723 /*
724 * Display temperature sensor data for one HT sibling
725 * per core only, so abort the loop after one such
726 * sibling has been found.
727 */
199e0de7
D
728 break;
729 }
730 }
731 /*
732 * If all cores in this pkg are offline, remove the device.
733 * coretemp_device_remove calls unregister_platform_device,
734 * which in turn calls coretemp_remove. This removes the
735 * pkgtemp entry and does other clean ups.
736 */
737 if (!is_any_core_online(pdata))
738 coretemp_device_remove(cpu);
739}
740
ba7c1927 741static int __cpuinit coretemp_cpu_callback(struct notifier_block *nfb,
bebe4678
RM
742 unsigned long action, void *hcpu)
743{
744 unsigned int cpu = (unsigned long) hcpu;
745
746 switch (action) {
747 case CPU_ONLINE:
561d9a96 748 case CPU_DOWN_FAILED:
199e0de7 749 get_core_online(cpu);
bebe4678 750 break;
561d9a96 751 case CPU_DOWN_PREPARE:
199e0de7 752 put_core_offline(cpu);
bebe4678
RM
753 break;
754 }
755 return NOTIFY_OK;
756}
757
ba7c1927 758static struct notifier_block coretemp_cpu_notifier __refdata = {
bebe4678
RM
759 .notifier_call = coretemp_cpu_callback,
760};
bebe4678
RM
761
762static int __init coretemp_init(void)
763{
764 int i, err = -ENODEV;
bebe4678 765
bebe4678 766 /* quick check if we run Intel */
92cb7612 767 if (cpu_data(0).x86_vendor != X86_VENDOR_INTEL)
bebe4678
RM
768 goto exit;
769
770 err = platform_driver_register(&coretemp_driver);
771 if (err)
772 goto exit;
773
a4659053 774 for_each_online_cpu(i)
199e0de7 775 get_core_online(i);
89a3fd35
JB
776
777#ifndef CONFIG_HOTPLUG_CPU
bebe4678
RM
778 if (list_empty(&pdev_list)) {
779 err = -ENODEV;
780 goto exit_driver_unreg;
781 }
89a3fd35 782#endif
bebe4678 783
bebe4678 784 register_hotcpu_notifier(&coretemp_cpu_notifier);
bebe4678
RM
785 return 0;
786
0dca94ba 787#ifndef CONFIG_HOTPLUG_CPU
89a3fd35 788exit_driver_unreg:
bebe4678 789 platform_driver_unregister(&coretemp_driver);
0dca94ba 790#endif
bebe4678
RM
791exit:
792 return err;
793}
794
795static void __exit coretemp_exit(void)
796{
797 struct pdev_entry *p, *n;
17c10d61 798
bebe4678 799 unregister_hotcpu_notifier(&coretemp_cpu_notifier);
bebe4678
RM
800 mutex_lock(&pdev_list_mutex);
801 list_for_each_entry_safe(p, n, &pdev_list, list) {
802 platform_device_unregister(p->pdev);
803 list_del(&p->list);
804 kfree(p);
805 }
806 mutex_unlock(&pdev_list_mutex);
807 platform_driver_unregister(&coretemp_driver);
808}
809
810MODULE_AUTHOR("Rudolf Marek <r.marek@assembler.cz>");
811MODULE_DESCRIPTION("Intel Core temperature monitor");
812MODULE_LICENSE("GPL");
813
814module_init(coretemp_init)
815module_exit(coretemp_exit)