coretemp.c 21 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838
  1. /*
  2. * coretemp.c - Linux kernel module for hardware monitoring
  3. *
  4. * Copyright (C) 2007 Rudolf Marek <r.marek@assembler.cz>
  5. *
  6. * Inspired from many hwmon drivers
  7. *
  8. * This program is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU General Public License as published by
  10. * the Free Software Foundation; version 2 of the License.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
  20. * 02110-1301 USA.
  21. */
  22. #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
  23. #include <linux/module.h>
  24. #include <linux/init.h>
  25. #include <linux/slab.h>
  26. #include <linux/jiffies.h>
  27. #include <linux/hwmon.h>
  28. #include <linux/sysfs.h>
  29. #include <linux/hwmon-sysfs.h>
  30. #include <linux/err.h>
  31. #include <linux/mutex.h>
  32. #include <linux/list.h>
  33. #include <linux/platform_device.h>
  34. #include <linux/cpu.h>
  35. #include <linux/pci.h>
  36. #include <linux/smp.h>
  37. #include <linux/moduleparam.h>
  38. #include <asm/msr.h>
  39. #include <asm/processor.h>
  40. #define DRVNAME "coretemp"
  41. /*
  42. * force_tjmax only matters when TjMax can't be read from the CPU itself.
  43. * When set, it replaces the driver's suboptimal heuristic.
  44. */
  45. static int force_tjmax;
  46. module_param_named(tjmax, force_tjmax, int, 0444);
  47. MODULE_PARM_DESC(tjmax, "TjMax value in degrees Celsius");
  /*
   * Sysfs numbering and table sizing.
   *
   * temp1_* is used for the package sensor; per-core sensors are numbered
   * "core id + BASE_SYSFS_ATTR_NO", so the first core shows up as temp2_*.
   */
  #define BASE_SYSFS_ATTR_NO 2 /* Sysfs Base attr no for coretemp */
  #define NUM_REAL_CORES 16 /* Number of Real cores per cpu */
  #define CORETEMP_NAME_LENGTH 17 /* String Length of attrs */
  #define MAX_CORE_ATTRS 4 /* Maximum no of basic attrs */
  #define TOTAL_ATTRS (MAX_CORE_ATTRS + 1)
  #define MAX_CORE_DATA (NUM_REAL_CORES + BASE_SYSFS_ATTR_NO)

  /*
   * CPU topology helpers. Without CONFIG_SMP the CPU number doubles as both
   * the package id and the core id, and there are no HT siblings to walk.
   */
  #ifdef CONFIG_SMP
  #define TO_PHYS_ID(cpu) (cpu_data(cpu).phys_proc_id)
  #define TO_CORE_ID(cpu) (cpu_data(cpu).cpu_core_id)
  #define for_each_sibling(i, cpu) for_each_cpu(i, cpu_sibling_mask(cpu))
  #else
  #define TO_PHYS_ID(cpu) (cpu)
  #define TO_CORE_ID(cpu) (cpu)
  #define for_each_sibling(i, cpu) for (i = 0; false; )
  #endif

  /*
   * Slot in platform_data.core_data[] and sysfs attribute number of a core.
   * Defined once for SMP and UP so both follow the "core id + 2" rule; the
   * former UP definition mapped the only core to temp0_*.
   */
  #define TO_ATTR_NO(cpu) (TO_CORE_ID(cpu) + BASE_SYSFS_ATTR_NO)
  65. /*
  66. * Per-Core Temperature Data
  67. * @last_updated: The time when the current temperature value was updated
  68. * earlier (in jiffies).
  69. * @cpu_core_id: The CPU Core from which temperature values should be read
  70. * This value is passed as "id" field to rdmsr/wrmsr functions.
  71. * @status_reg: One of IA32_THERM_STATUS or IA32_PACKAGE_THERM_STATUS,
  72. * from where the temperature values should be read.
  73. * @attr_size: Total number of pre-core attrs displayed in the sysfs.
  74. * @is_pkg_data: If this is 1, the temp_data holds pkgtemp data.
  75. * Otherwise, temp_data holds coretemp data.
  76. * @valid: If this is 1, the current temperature is valid.
  77. */
  78. struct temp_data {
  79. int temp;
  80. int ttarget;
  81. int tjmax;
  82. unsigned long last_updated;
  83. unsigned int cpu;
  84. u32 cpu_core_id;
  85. u32 status_reg;
  86. int attr_size;
  87. bool is_pkg_data;
  88. bool valid;
  89. struct sensor_device_attribute sd_attrs[TOTAL_ATTRS];
  90. char attr_name[TOTAL_ATTRS][CORETEMP_NAME_LENGTH];
  91. struct mutex update_lock;
  92. };
  93. /* Platform Data per Physical CPU */
  94. struct platform_data {
  95. struct device *hwmon_dev;
  96. u16 phys_proc_id;
  97. struct temp_data *core_data[MAX_CORE_DATA];
  98. struct device_attribute name_attr;
  99. };
  100. struct pdev_entry {
  101. struct list_head list;
  102. struct platform_device *pdev;
  103. u16 phys_proc_id;
  104. };
  /* All platform devices created by this driver; guarded by pdev_list_mutex */
  static LIST_HEAD(pdev_list);
  static DEFINE_MUTEX(pdev_list_mutex);
  107. static ssize_t show_name(struct device *dev,
  108. struct device_attribute *devattr, char *buf)
  109. {
  110. return sprintf(buf, "%s\n", DRVNAME);
  111. }
  112. static ssize_t show_label(struct device *dev,
  113. struct device_attribute *devattr, char *buf)
  114. {
  115. struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
  116. struct platform_data *pdata = dev_get_drvdata(dev);
  117. struct temp_data *tdata = pdata->core_data[attr->index];
  118. if (tdata->is_pkg_data)
  119. return sprintf(buf, "Physical id %u\n", pdata->phys_proc_id);
  120. return sprintf(buf, "Core %u\n", tdata->cpu_core_id);
  121. }
  122. static ssize_t show_crit_alarm(struct device *dev,
  123. struct device_attribute *devattr, char *buf)
  124. {
  125. u32 eax, edx;
  126. struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
  127. struct platform_data *pdata = dev_get_drvdata(dev);
  128. struct temp_data *tdata = pdata->core_data[attr->index];
  129. rdmsr_on_cpu(tdata->cpu, tdata->status_reg, &eax, &edx);
  130. return sprintf(buf, "%d\n", (eax >> 5) & 1);
  131. }
  132. static ssize_t show_tjmax(struct device *dev,
  133. struct device_attribute *devattr, char *buf)
  134. {
  135. struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
  136. struct platform_data *pdata = dev_get_drvdata(dev);
  137. return sprintf(buf, "%d\n", pdata->core_data[attr->index]->tjmax);
  138. }
  139. static ssize_t show_ttarget(struct device *dev,
  140. struct device_attribute *devattr, char *buf)
  141. {
  142. struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
  143. struct platform_data *pdata = dev_get_drvdata(dev);
  144. return sprintf(buf, "%d\n", pdata->core_data[attr->index]->ttarget);
  145. }
  146. static ssize_t show_temp(struct device *dev,
  147. struct device_attribute *devattr, char *buf)
  148. {
  149. u32 eax, edx;
  150. struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
  151. struct platform_data *pdata = dev_get_drvdata(dev);
  152. struct temp_data *tdata = pdata->core_data[attr->index];
  153. mutex_lock(&tdata->update_lock);
  154. /* Check whether the time interval has elapsed */
  155. if (!tdata->valid || time_after(jiffies, tdata->last_updated + HZ)) {
  156. rdmsr_on_cpu(tdata->cpu, tdata->status_reg, &eax, &edx);
  157. tdata->valid = 0;
  158. /* Check whether the data is valid */
  159. if (eax & 0x80000000) {
  160. tdata->temp = tdata->tjmax -
  161. ((eax >> 16) & 0x7f) * 1000;
  162. tdata->valid = 1;
  163. }
  164. tdata->last_updated = jiffies;
  165. }
  166. mutex_unlock(&tdata->update_lock);
  167. return tdata->valid ? sprintf(buf, "%d\n", tdata->temp) : -EAGAIN;
  168. }
  169. static int adjust_tjmax(struct cpuinfo_x86 *c, u32 id, struct device *dev)
  170. {
  171. /* The 100C is default for both mobile and non mobile CPUs */
  172. int tjmax = 100000;
  173. int tjmax_ee = 85000;
  174. int usemsr_ee = 1;
  175. int err;
  176. u32 eax, edx;
  177. struct pci_dev *host_bridge;
  178. /* Early chips have no MSR for TjMax */
  179. if (c->x86_model == 0xf && c->x86_mask < 4)
  180. usemsr_ee = 0;
  181. /* Atom CPUs */
  182. if (c->x86_model == 0x1c) {
  183. usemsr_ee = 0;
  184. host_bridge = pci_get_bus_and_slot(0, PCI_DEVFN(0, 0));
  185. if (host_bridge && host_bridge->vendor == PCI_VENDOR_ID_INTEL
  186. && (host_bridge->device == 0xa000 /* NM10 based nettop */
  187. || host_bridge->device == 0xa010)) /* NM10 based netbook */
  188. tjmax = 100000;
  189. else
  190. tjmax = 90000;
  191. pci_dev_put(host_bridge);
  192. }
  193. if (c->x86_model > 0xe && usemsr_ee) {
  194. u8 platform_id;
  195. /*
  196. * Now we can detect the mobile CPU using Intel provided table
  197. * http://softwarecommunity.intel.com/Wiki/Mobility/720.htm
  198. * For Core2 cores, check MSR 0x17, bit 28 1 = Mobile CPU
  199. */
  200. err = rdmsr_safe_on_cpu(id, 0x17, &eax, &edx);
  201. if (err) {
  202. dev_warn(dev,
  203. "Unable to access MSR 0x17, assuming desktop"
  204. " CPU\n");
  205. usemsr_ee = 0;
  206. } else if (c->x86_model < 0x17 && !(eax & 0x10000000)) {
  207. /*
  208. * Trust bit 28 up to Penryn, I could not find any
  209. * documentation on that; if you happen to know
  210. * someone at Intel please ask
  211. */
  212. usemsr_ee = 0;
  213. } else {
  214. /* Platform ID bits 52:50 (EDX starts at bit 32) */
  215. platform_id = (edx >> 18) & 0x7;
  216. /*
  217. * Mobile Penryn CPU seems to be platform ID 7 or 5
  218. * (guesswork)
  219. */
  220. if (c->x86_model == 0x17 &&
  221. (platform_id == 5 || platform_id == 7)) {
  222. /*
  223. * If MSR EE bit is set, set it to 90 degrees C,
  224. * otherwise 105 degrees C
  225. */
  226. tjmax_ee = 90000;
  227. tjmax = 105000;
  228. }
  229. }
  230. }
  231. if (usemsr_ee) {
  232. err = rdmsr_safe_on_cpu(id, 0xee, &eax, &edx);
  233. if (err) {
  234. dev_warn(dev,
  235. "Unable to access MSR 0xEE, for Tjmax, left"
  236. " at default\n");
  237. } else if (eax & 0x40000000) {
  238. tjmax = tjmax_ee;
  239. }
  240. } else if (tjmax == 100000) {
  241. /*
  242. * If we don't use msr EE it means we are desktop CPU
  243. * (with exeception of Atom)
  244. */
  245. dev_warn(dev, "Using relative temperature scale!\n");
  246. }
  247. return tjmax;
  248. }
  249. static int get_tjmax(struct cpuinfo_x86 *c, u32 id, struct device *dev)
  250. {
  251. int err;
  252. u32 eax, edx;
  253. u32 val;
  254. /*
  255. * A new feature of current Intel(R) processors, the
  256. * IA32_TEMPERATURE_TARGET contains the TjMax value
  257. */
  258. err = rdmsr_safe_on_cpu(id, MSR_IA32_TEMPERATURE_TARGET, &eax, &edx);
  259. if (err) {
  260. if (c->x86_model > 0xe && c->x86_model != 0x1c)
  261. dev_warn(dev, "Unable to read TjMax from CPU %u\n", id);
  262. } else {
  263. val = (eax >> 16) & 0xff;
  264. /*
  265. * If the TjMax is not plausible, an assumption
  266. * will be used
  267. */
  268. if (val) {
  269. dev_dbg(dev, "TjMax is %d degrees C\n", val);
  270. return val * 1000;
  271. }
  272. }
  273. if (force_tjmax) {
  274. dev_notice(dev, "TjMax forced to %d degrees C by user\n",
  275. force_tjmax);
  276. return force_tjmax * 1000;
  277. }
  278. /*
  279. * An assumption is made for early CPUs and unreadable MSR.
  280. * NOTE: the calculated value may not be correct.
  281. */
  282. return adjust_tjmax(c, id, dev);
  283. }
  284. static void __devinit get_ucode_rev_on_cpu(void *edx)
  285. {
  286. u32 eax;
  287. wrmsr(MSR_IA32_UCODE_REV, 0, 0);
  288. sync_core();
  289. rdmsr(MSR_IA32_UCODE_REV, eax, *(u32 *)edx);
  290. }
  291. static int create_name_attr(struct platform_data *pdata, struct device *dev)
  292. {
  293. sysfs_attr_init(&pdata->name_attr.attr);
  294. pdata->name_attr.attr.name = "name";
  295. pdata->name_attr.attr.mode = S_IRUGO;
  296. pdata->name_attr.show = show_name;
  297. return device_create_file(dev, &pdata->name_attr);
  298. }
  299. static int create_core_attrs(struct temp_data *tdata, struct device *dev,
  300. int attr_no)
  301. {
  302. int err, i;
  303. static ssize_t (*rd_ptr[TOTAL_ATTRS]) (struct device *dev,
  304. struct device_attribute *devattr, char *buf) = {
  305. show_label, show_crit_alarm, show_temp, show_tjmax,
  306. show_ttarget };
  307. static const char *names[TOTAL_ATTRS] = {
  308. "temp%d_label", "temp%d_crit_alarm",
  309. "temp%d_input", "temp%d_crit",
  310. "temp%d_max" };
  311. for (i = 0; i < tdata->attr_size; i++) {
  312. snprintf(tdata->attr_name[i], CORETEMP_NAME_LENGTH, names[i],
  313. attr_no);
  314. sysfs_attr_init(&tdata->sd_attrs[i].dev_attr.attr);
  315. tdata->sd_attrs[i].dev_attr.attr.name = tdata->attr_name[i];
  316. tdata->sd_attrs[i].dev_attr.attr.mode = S_IRUGO;
  317. tdata->sd_attrs[i].dev_attr.show = rd_ptr[i];
  318. tdata->sd_attrs[i].index = attr_no;
  319. err = device_create_file(dev, &tdata->sd_attrs[i].dev_attr);
  320. if (err)
  321. goto exit_free;
  322. }
  323. return 0;
  324. exit_free:
  325. while (--i >= 0)
  326. device_remove_file(dev, &tdata->sd_attrs[i].dev_attr);
  327. return err;
  328. }
  329. static int __devinit chk_ucode_version(struct platform_device *pdev)
  330. {
  331. struct cpuinfo_x86 *c = &cpu_data(pdev->id);
  332. int err;
  333. u32 edx;
  334. /*
  335. * Check if we have problem with errata AE18 of Core processors:
  336. * Readings might stop update when processor visited too deep sleep,
  337. * fixed for stepping D0 (6EC).
  338. */
  339. if (c->x86_model == 0xe && c->x86_mask < 0xc) {
  340. /* check for microcode update */
  341. err = smp_call_function_single(pdev->id, get_ucode_rev_on_cpu,
  342. &edx, 1);
  343. if (err) {
  344. dev_err(&pdev->dev,
  345. "Cannot determine microcode revision of "
  346. "CPU#%u (%d)!\n", pdev->id, err);
  347. return -ENODEV;
  348. } else if (edx < 0x39) {
  349. dev_err(&pdev->dev,
  350. "Errata AE18 not fixed, update BIOS or "
  351. "microcode of the CPU!\n");
  352. return -ENODEV;
  353. }
  354. }
  355. return 0;
  356. }
  357. static struct platform_device *coretemp_get_pdev(unsigned int cpu)
  358. {
  359. u16 phys_proc_id = TO_PHYS_ID(cpu);
  360. struct pdev_entry *p;
  361. mutex_lock(&pdev_list_mutex);
  362. list_for_each_entry(p, &pdev_list, list)
  363. if (p->phys_proc_id == phys_proc_id) {
  364. mutex_unlock(&pdev_list_mutex);
  365. return p->pdev;
  366. }
  367. mutex_unlock(&pdev_list_mutex);
  368. return NULL;
  369. }
  370. static struct temp_data *init_temp_data(unsigned int cpu, int pkg_flag)
  371. {
  372. struct temp_data *tdata;
  373. tdata = kzalloc(sizeof(struct temp_data), GFP_KERNEL);
  374. if (!tdata)
  375. return NULL;
  376. tdata->status_reg = pkg_flag ? MSR_IA32_PACKAGE_THERM_STATUS :
  377. MSR_IA32_THERM_STATUS;
  378. tdata->is_pkg_data = pkg_flag;
  379. tdata->cpu = cpu;
  380. tdata->cpu_core_id = TO_CORE_ID(cpu);
  381. tdata->attr_size = MAX_CORE_ATTRS;
  382. mutex_init(&tdata->update_lock);
  383. return tdata;
  384. }
  385. static int create_core_data(struct platform_data *pdata,
  386. struct platform_device *pdev,
  387. unsigned int cpu, int pkg_flag)
  388. {
  389. struct temp_data *tdata;
  390. struct cpuinfo_x86 *c = &cpu_data(cpu);
  391. u32 eax, edx;
  392. int err, attr_no;
  393. /*
  394. * Find attr number for sysfs:
  395. * We map the attr number to core id of the CPU
  396. * The attr number is always core id + 2
  397. * The Pkgtemp will always show up as temp1_*, if available
  398. */
  399. attr_no = pkg_flag ? 1 : TO_ATTR_NO(cpu);
  400. if (attr_no > MAX_CORE_DATA - 1)
  401. return -ERANGE;
  402. /*
  403. * Provide a single set of attributes for all HT siblings of a core
  404. * to avoid duplicate sensors (the processor ID and core ID of all
  405. * HT siblings of a core are the same).
  406. * Skip if a HT sibling of this core is already registered.
  407. * This is not an error.
  408. */
  409. if (pdata->core_data[attr_no] != NULL)
  410. return 0;
  411. tdata = init_temp_data(cpu, pkg_flag);
  412. if (!tdata)
  413. return -ENOMEM;
  414. /* Test if we can access the status register */
  415. err = rdmsr_safe_on_cpu(cpu, tdata->status_reg, &eax, &edx);
  416. if (err)
  417. goto exit_free;
  418. /* We can access status register. Get Critical Temperature */
  419. tdata->tjmax = get_tjmax(c, cpu, &pdev->dev);
  420. /*
  421. * Read the still undocumented bits 8:15 of IA32_TEMPERATURE_TARGET.
  422. * The target temperature is available on older CPUs but not in this
  423. * register. Atoms don't have the register at all.
  424. */
  425. if (c->x86_model > 0xe && c->x86_model != 0x1c) {
  426. err = rdmsr_safe_on_cpu(cpu, MSR_IA32_TEMPERATURE_TARGET,
  427. &eax, &edx);
  428. if (!err) {
  429. tdata->ttarget
  430. = tdata->tjmax - ((eax >> 8) & 0xff) * 1000;
  431. tdata->attr_size++;
  432. }
  433. }
  434. pdata->core_data[attr_no] = tdata;
  435. /* Create sysfs interfaces */
  436. err = create_core_attrs(tdata, &pdev->dev, attr_no);
  437. if (err)
  438. goto exit_free;
  439. return 0;
  440. exit_free:
  441. kfree(tdata);
  442. return err;
  443. }
  444. static void coretemp_add_core(unsigned int cpu, int pkg_flag)
  445. {
  446. struct platform_data *pdata;
  447. struct platform_device *pdev = coretemp_get_pdev(cpu);
  448. int err;
  449. if (!pdev)
  450. return;
  451. pdata = platform_get_drvdata(pdev);
  452. err = create_core_data(pdata, pdev, cpu, pkg_flag);
  453. if (err)
  454. dev_err(&pdev->dev, "Adding Core %u failed\n", cpu);
  455. }
  456. static void coretemp_remove_core(struct platform_data *pdata,
  457. struct device *dev, int indx)
  458. {
  459. int i;
  460. struct temp_data *tdata = pdata->core_data[indx];
  461. /* Remove the sysfs attributes */
  462. for (i = 0; i < tdata->attr_size; i++)
  463. device_remove_file(dev, &tdata->sd_attrs[i].dev_attr);
  464. kfree(pdata->core_data[indx]);
  465. pdata->core_data[indx] = NULL;
  466. }
  467. static int __devinit coretemp_probe(struct platform_device *pdev)
  468. {
  469. struct platform_data *pdata;
  470. int err;
  471. /* Check the microcode version of the CPU */
  472. err = chk_ucode_version(pdev);
  473. if (err)
  474. return err;
  475. /* Initialize the per-package data structures */
  476. pdata = kzalloc(sizeof(struct platform_data), GFP_KERNEL);
  477. if (!pdata)
  478. return -ENOMEM;
  479. err = create_name_attr(pdata, &pdev->dev);
  480. if (err)
  481. goto exit_free;
  482. pdata->phys_proc_id = pdev->id;
  483. platform_set_drvdata(pdev, pdata);
  484. pdata->hwmon_dev = hwmon_device_register(&pdev->dev);
  485. if (IS_ERR(pdata->hwmon_dev)) {
  486. err = PTR_ERR(pdata->hwmon_dev);
  487. dev_err(&pdev->dev, "Class registration failed (%d)\n", err);
  488. goto exit_name;
  489. }
  490. return 0;
  491. exit_name:
  492. device_remove_file(&pdev->dev, &pdata->name_attr);
  493. platform_set_drvdata(pdev, NULL);
  494. exit_free:
  495. kfree(pdata);
  496. return err;
  497. }
  498. static int __devexit coretemp_remove(struct platform_device *pdev)
  499. {
  500. struct platform_data *pdata = platform_get_drvdata(pdev);
  501. int i;
  502. for (i = MAX_CORE_DATA - 1; i >= 0; --i)
  503. if (pdata->core_data[i])
  504. coretemp_remove_core(pdata, &pdev->dev, i);
  505. device_remove_file(&pdev->dev, &pdata->name_attr);
  506. hwmon_device_unregister(pdata->hwmon_dev);
  507. platform_set_drvdata(pdev, NULL);
  508. kfree(pdata);
  509. return 0;
  510. }
  511. static struct platform_driver coretemp_driver = {
  512. .driver = {
  513. .owner = THIS_MODULE,
  514. .name = DRVNAME,
  515. },
  516. .probe = coretemp_probe,
  517. .remove = __devexit_p(coretemp_remove),
  518. };
  519. static int __cpuinit coretemp_device_add(unsigned int cpu)
  520. {
  521. int err;
  522. struct platform_device *pdev;
  523. struct pdev_entry *pdev_entry;
  524. mutex_lock(&pdev_list_mutex);
  525. pdev = platform_device_alloc(DRVNAME, TO_PHYS_ID(cpu));
  526. if (!pdev) {
  527. err = -ENOMEM;
  528. pr_err("Device allocation failed\n");
  529. goto exit;
  530. }
  531. pdev_entry = kzalloc(sizeof(struct pdev_entry), GFP_KERNEL);
  532. if (!pdev_entry) {
  533. err = -ENOMEM;
  534. goto exit_device_put;
  535. }
  536. err = platform_device_add(pdev);
  537. if (err) {
  538. pr_err("Device addition failed (%d)\n", err);
  539. goto exit_device_free;
  540. }
  541. pdev_entry->pdev = pdev;
  542. pdev_entry->phys_proc_id = TO_PHYS_ID(cpu);
  543. list_add_tail(&pdev_entry->list, &pdev_list);
  544. mutex_unlock(&pdev_list_mutex);
  545. return 0;
  546. exit_device_free:
  547. kfree(pdev_entry);
  548. exit_device_put:
  549. platform_device_put(pdev);
  550. exit:
  551. mutex_unlock(&pdev_list_mutex);
  552. return err;
  553. }
  554. static void coretemp_device_remove(unsigned int cpu)
  555. {
  556. struct pdev_entry *p, *n;
  557. u16 phys_proc_id = TO_PHYS_ID(cpu);
  558. mutex_lock(&pdev_list_mutex);
  559. list_for_each_entry_safe(p, n, &pdev_list, list) {
  560. if (p->phys_proc_id != phys_proc_id)
  561. continue;
  562. platform_device_unregister(p->pdev);
  563. list_del(&p->list);
  564. kfree(p);
  565. }
  566. mutex_unlock(&pdev_list_mutex);
  567. }
  568. static bool is_any_core_online(struct platform_data *pdata)
  569. {
  570. int i;
  571. /* Find online cores, except pkgtemp data */
  572. for (i = MAX_CORE_DATA - 1; i >= 0; --i) {
  573. if (pdata->core_data[i] &&
  574. !pdata->core_data[i]->is_pkg_data) {
  575. return true;
  576. }
  577. }
  578. return false;
  579. }
  580. static void __cpuinit get_core_online(unsigned int cpu)
  581. {
  582. struct cpuinfo_x86 *c = &cpu_data(cpu);
  583. struct platform_device *pdev = coretemp_get_pdev(cpu);
  584. int err;
  585. /*
  586. * CPUID.06H.EAX[0] indicates whether the CPU has thermal
  587. * sensors. We check this bit only, all the early CPUs
  588. * without thermal sensors will be filtered out.
  589. */
  590. if (!cpu_has(c, X86_FEATURE_DTS))
  591. return;
  592. if (!pdev) {
  593. /*
  594. * Alright, we have DTS support.
  595. * We are bringing the _first_ core in this pkg
  596. * online. So, initialize per-pkg data structures and
  597. * then bring this core online.
  598. */
  599. err = coretemp_device_add(cpu);
  600. if (err)
  601. return;
  602. /*
  603. * Check whether pkgtemp support is available.
  604. * If so, add interfaces for pkgtemp.
  605. */
  606. if (cpu_has(c, X86_FEATURE_PTS))
  607. coretemp_add_core(cpu, 1);
  608. }
  609. /*
  610. * Physical CPU device already exists.
  611. * So, just add interfaces for this core.
  612. */
  613. coretemp_add_core(cpu, 0);
  614. }
  615. static void __cpuinit put_core_offline(unsigned int cpu)
  616. {
  617. int i, indx;
  618. struct platform_data *pdata;
  619. struct platform_device *pdev = coretemp_get_pdev(cpu);
  620. /* If the physical CPU device does not exist, just return */
  621. if (!pdev)
  622. return;
  623. pdata = platform_get_drvdata(pdev);
  624. indx = TO_ATTR_NO(cpu);
  625. if (pdata->core_data[indx] && pdata->core_data[indx]->cpu == cpu)
  626. coretemp_remove_core(pdata, &pdev->dev, indx);
  627. /*
  628. * If a HT sibling of a core is taken offline, but another HT sibling
  629. * of the same core is still online, register the alternate sibling.
  630. * This ensures that exactly one set of attributes is provided as long
  631. * as at least one HT sibling of a core is online.
  632. */
  633. for_each_sibling(i, cpu) {
  634. if (i != cpu) {
  635. get_core_online(i);
  636. /*
  637. * Display temperature sensor data for one HT sibling
  638. * per core only, so abort the loop after one such
  639. * sibling has been found.
  640. */
  641. break;
  642. }
  643. }
  644. /*
  645. * If all cores in this pkg are offline, remove the device.
  646. * coretemp_device_remove calls unregister_platform_device,
  647. * which in turn calls coretemp_remove. This removes the
  648. * pkgtemp entry and does other clean ups.
  649. */
  650. if (!is_any_core_online(pdata))
  651. coretemp_device_remove(cpu);
  652. }
  653. static int __cpuinit coretemp_cpu_callback(struct notifier_block *nfb,
  654. unsigned long action, void *hcpu)
  655. {
  656. unsigned int cpu = (unsigned long) hcpu;
  657. switch (action) {
  658. case CPU_ONLINE:
  659. case CPU_DOWN_FAILED:
  660. get_core_online(cpu);
  661. break;
  662. case CPU_DOWN_PREPARE:
  663. put_core_offline(cpu);
  664. break;
  665. }
  666. return NOTIFY_OK;
  667. }
  668. static struct notifier_block coretemp_cpu_notifier __refdata = {
  669. .notifier_call = coretemp_cpu_callback,
  670. };
  671. static int __init coretemp_init(void)
  672. {
  673. int i, err = -ENODEV;
  674. /* quick check if we run Intel */
  675. if (cpu_data(0).x86_vendor != X86_VENDOR_INTEL)
  676. goto exit;
  677. err = platform_driver_register(&coretemp_driver);
  678. if (err)
  679. goto exit;
  680. for_each_online_cpu(i)
  681. get_core_online(i);
  682. #ifndef CONFIG_HOTPLUG_CPU
  683. if (list_empty(&pdev_list)) {
  684. err = -ENODEV;
  685. goto exit_driver_unreg;
  686. }
  687. #endif
  688. register_hotcpu_notifier(&coretemp_cpu_notifier);
  689. return 0;
  690. #ifndef CONFIG_HOTPLUG_CPU
  691. exit_driver_unreg:
  692. platform_driver_unregister(&coretemp_driver);
  693. #endif
  694. exit:
  695. return err;
  696. }
  697. static void __exit coretemp_exit(void)
  698. {
  699. struct pdev_entry *p, *n;
  700. unregister_hotcpu_notifier(&coretemp_cpu_notifier);
  701. mutex_lock(&pdev_list_mutex);
  702. list_for_each_entry_safe(p, n, &pdev_list, list) {
  703. platform_device_unregister(p->pdev);
  704. list_del(&p->list);
  705. kfree(p);
  706. }
  707. mutex_unlock(&pdev_list_mutex);
  708. platform_driver_unregister(&coretemp_driver);
  709. }
  710. MODULE_AUTHOR("Rudolf Marek <r.marek@assembler.cz>");
  711. MODULE_DESCRIPTION("Intel Core temperature monitor");
  712. MODULE_LICENSE("GPL");
  713. module_init(coretemp_init)
  714. module_exit(coretemp_exit)