|  | // SPDX-License-Identifier: GPL-2.0-only | 
|  | /* | 
|  | * coretemp.c - Linux kernel module for hardware monitoring | 
|  | * | 
|  | * Copyright (C) 2007 Rudolf Marek <r.marek@assembler.cz> | 
|  | * | 
|  | * Inspired from many hwmon drivers | 
|  | */ | 
|  |  | 
|  | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt | 
|  |  | 
|  | #include <linux/module.h> | 
|  | #include <linux/init.h> | 
|  | #include <linux/slab.h> | 
|  | #include <linux/jiffies.h> | 
|  | #include <linux/hwmon.h> | 
|  | #include <linux/sysfs.h> | 
|  | #include <linux/hwmon-sysfs.h> | 
|  | #include <linux/err.h> | 
|  | #include <linux/mutex.h> | 
|  | #include <linux/list.h> | 
|  | #include <linux/platform_device.h> | 
|  | #include <linux/cpu.h> | 
|  | #include <linux/smp.h> | 
|  | #include <linux/moduleparam.h> | 
|  | #include <linux/pci.h> | 
|  | #include <asm/msr.h> | 
|  | #include <asm/processor.h> | 
|  | #include <asm/cpu_device_id.h> | 
|  | #include <linux/sched/isolation.h> | 
|  |  | 
|  | #define DRVNAME	"coretemp" | 
|  |  | 
|  | /* | 
|  | * force_tjmax only matters when TjMax can't be read from the CPU itself. | 
|  | * When set, it replaces the driver's suboptimal heuristic. | 
|  | */ | 
|  | static int force_tjmax; | 
|  | module_param_named(tjmax, force_tjmax, int, 0444); | 
|  | MODULE_PARM_DESC(tjmax, "TjMax value in degrees Celsius"); | 
|  |  | 
|  | #define NUM_REAL_CORES		512	/* Number of Real cores per cpu */ | 
|  | #define CORETEMP_NAME_LENGTH	28	/* String Length of attrs */ | 
|  |  | 
|  | enum coretemp_attr_index { | 
|  | ATTR_LABEL, | 
|  | ATTR_CRIT_ALARM, | 
|  | ATTR_TEMP, | 
|  | ATTR_TJMAX, | 
|  | ATTR_TTARGET, | 
|  | MAX_CORE_ATTRS = ATTR_TJMAX + 1,	/* Maximum no of basic attrs */ | 
|  | TOTAL_ATTRS = ATTR_TTARGET + 1		/* Maximum no of possible attrs */ | 
|  | }; | 
|  |  | 
|  | #ifdef CONFIG_SMP | 
|  | #define for_each_sibling(i, cpu) \ | 
|  | for_each_cpu(i, topology_sibling_cpumask(cpu)) | 
|  | #else | 
|  | #define for_each_sibling(i, cpu)	for (i = 0; false; ) | 
|  | #endif | 
|  |  | 
|  | /* | 
|  | * Per-Core Temperature Data | 
|  | * @tjmax: The static tjmax value when tjmax cannot be retrieved from | 
|  | *		IA32_TEMPERATURE_TARGET MSR. | 
|  | * @last_updated: The time when the current temperature value was updated | 
|  | *		earlier (in jiffies). | 
|  | * @cpu_core_id: The CPU Core from which temperature values should be read | 
|  | *		This value is passed as "id" field to rdmsr/wrmsr functions. | 
|  | * @status_reg: One of IA32_THERM_STATUS or IA32_PACKAGE_THERM_STATUS, | 
|  | *		from where the temperature values should be read. | 
|  | * @attr_size:  Total number of pre-core attrs displayed in the sysfs. | 
|  | */ | 
|  | struct temp_data { | 
|  | int temp; | 
|  | int tjmax; | 
|  | unsigned long last_updated; | 
|  | unsigned int cpu; | 
|  | int index; | 
|  | u32 cpu_core_id; | 
|  | u32 status_reg; | 
|  | int attr_size; | 
|  | struct device_attribute sd_attrs[TOTAL_ATTRS]; | 
|  | char attr_name[TOTAL_ATTRS][CORETEMP_NAME_LENGTH]; | 
|  | struct attribute *attrs[TOTAL_ATTRS + 1]; | 
|  | struct attribute_group attr_group; | 
|  | struct mutex update_lock; | 
|  | }; | 
|  |  | 
|  | /* Platform Data per Physical CPU */ | 
|  | struct platform_data { | 
|  | struct device		*hwmon_dev; | 
|  | u16			pkg_id; | 
|  | int			nr_cores; | 
|  | struct ida		ida; | 
|  | struct cpumask		cpumask; | 
|  | struct temp_data	*pkg_data; | 
|  | struct temp_data	**core_data; | 
|  | struct device_attribute name_attr; | 
|  | }; | 
|  |  | 
|  | struct tjmax_pci { | 
|  | unsigned int device; | 
|  | int tjmax; | 
|  | }; | 
|  |  | 
|  | static const struct tjmax_pci tjmax_pci_table[] = { | 
|  | { 0x0708, 110000 },	/* CE41x0 (Sodaville ) */ | 
|  | { 0x0c72, 102000 },	/* Atom S1240 (Centerton) */ | 
|  | { 0x0c73, 95000 },	/* Atom S1220 (Centerton) */ | 
|  | { 0x0c75, 95000 },	/* Atom S1260 (Centerton) */ | 
|  | }; | 
|  |  | 
|  | struct tjmax { | 
|  | char const *id; | 
|  | int tjmax; | 
|  | }; | 
|  |  | 
|  | static const struct tjmax tjmax_table[] = { | 
|  | { "CPU  230", 100000 },		/* Model 0x1c, stepping 2	*/ | 
|  | { "CPU  330", 125000 },		/* Model 0x1c, stepping 2	*/ | 
|  | }; | 
|  |  | 
|  | struct tjmax_model { | 
|  | u8 model; | 
|  | u8 mask; | 
|  | int tjmax; | 
|  | }; | 
|  |  | 
|  | #define ANY 0xff | 
|  |  | 
|  | static const struct tjmax_model tjmax_model_table[] = { | 
|  | { 0x1c, 10, 100000 },	/* D4xx, K4xx, N4xx, D5xx, K5xx, N5xx */ | 
|  | { 0x1c, ANY, 90000 },	/* Z5xx, N2xx, possibly others | 
|  | * Note: Also matches 230 and 330, | 
|  | * which are covered by tjmax_table | 
|  | */ | 
|  | { 0x26, ANY, 90000 },	/* Atom Tunnel Creek (Exx), Lincroft (Z6xx) | 
|  | * Note: TjMax for E6xxT is 110C, but CPU type | 
|  | * is undetectable by software | 
|  | */ | 
|  | { 0x27, ANY, 90000 },	/* Atom Medfield (Z2460) */ | 
|  | { 0x35, ANY, 90000 },	/* Atom Clover Trail/Cloverview (Z27x0) */ | 
|  | { 0x36, ANY, 100000 },	/* Atom Cedar Trail/Cedarview (N2xxx, D2xxx) | 
|  | * Also matches S12x0 (stepping 9), covered by | 
|  | * PCI table | 
|  | */ | 
|  | }; | 
|  |  | 
|  | static bool is_pkg_temp_data(struct temp_data *tdata) | 
|  | { | 
|  | return tdata->index < 0; | 
|  | } | 
|  |  | 
|  | static int adjust_tjmax(struct cpuinfo_x86 *c, u32 id, struct device *dev) | 
|  | { | 
|  | /* The 100C is default for both mobile and non mobile CPUs */ | 
|  |  | 
|  | int tjmax = 100000; | 
|  | int tjmax_ee = 85000; | 
|  | int usemsr_ee = 1; | 
|  | int err; | 
|  | u32 eax, edx; | 
|  | int i; | 
|  | u16 devfn = PCI_DEVFN(0, 0); | 
|  | struct pci_dev *host_bridge = pci_get_domain_bus_and_slot(0, 0, devfn); | 
|  |  | 
|  | /* | 
|  | * Explicit tjmax table entries override heuristics. | 
|  | * First try PCI host bridge IDs, followed by model ID strings | 
|  | * and model/stepping information. | 
|  | */ | 
|  | if (host_bridge && host_bridge->vendor == PCI_VENDOR_ID_INTEL) { | 
|  | for (i = 0; i < ARRAY_SIZE(tjmax_pci_table); i++) { | 
|  | if (host_bridge->device == tjmax_pci_table[i].device) { | 
|  | pci_dev_put(host_bridge); | 
|  | return tjmax_pci_table[i].tjmax; | 
|  | } | 
|  | } | 
|  | } | 
|  | pci_dev_put(host_bridge); | 
|  |  | 
|  | for (i = 0; i < ARRAY_SIZE(tjmax_table); i++) { | 
|  | if (strstr(c->x86_model_id, tjmax_table[i].id)) | 
|  | return tjmax_table[i].tjmax; | 
|  | } | 
|  |  | 
|  | for (i = 0; i < ARRAY_SIZE(tjmax_model_table); i++) { | 
|  | const struct tjmax_model *tm = &tjmax_model_table[i]; | 
|  | if (c->x86_model == tm->model && | 
|  | (tm->mask == ANY || c->x86_stepping == tm->mask)) | 
|  | return tm->tjmax; | 
|  | } | 
|  |  | 
|  | /* Early chips have no MSR for TjMax */ | 
|  |  | 
|  | if (c->x86_model == 0xf && c->x86_stepping < 4) | 
|  | usemsr_ee = 0; | 
|  |  | 
|  | if (c->x86_model > 0xe && usemsr_ee) { | 
|  | u8 platform_id; | 
|  |  | 
|  | /* | 
|  | * Now we can detect the mobile CPU using Intel provided table | 
|  | * http://softwarecommunity.intel.com/Wiki/Mobility/720.htm | 
|  | * For Core2 cores, check MSR 0x17, bit 28 1 = Mobile CPU | 
|  | */ | 
|  | err = rdmsr_safe_on_cpu(id, 0x17, &eax, &edx); | 
|  | if (err) { | 
|  | dev_warn(dev, | 
|  | "Unable to access MSR 0x17, assuming desktop" | 
|  | " CPU\n"); | 
|  | usemsr_ee = 0; | 
|  | } else if (c->x86_model < 0x17 && !(eax & 0x10000000)) { | 
|  | /* | 
|  | * Trust bit 28 up to Penryn, I could not find any | 
|  | * documentation on that; if you happen to know | 
|  | * someone at Intel please ask | 
|  | */ | 
|  | usemsr_ee = 0; | 
|  | } else { | 
|  | /* Platform ID bits 52:50 (EDX starts at bit 32) */ | 
|  | platform_id = (edx >> 18) & 0x7; | 
|  |  | 
|  | /* | 
|  | * Mobile Penryn CPU seems to be platform ID 7 or 5 | 
|  | * (guesswork) | 
|  | */ | 
|  | if (c->x86_model == 0x17 && | 
|  | (platform_id == 5 || platform_id == 7)) { | 
|  | /* | 
|  | * If MSR EE bit is set, set it to 90 degrees C, | 
|  | * otherwise 105 degrees C | 
|  | */ | 
|  | tjmax_ee = 90000; | 
|  | tjmax = 105000; | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | if (usemsr_ee) { | 
|  | err = rdmsr_safe_on_cpu(id, 0xee, &eax, &edx); | 
|  | if (err) { | 
|  | dev_warn(dev, | 
|  | "Unable to access MSR 0xEE, for Tjmax, left" | 
|  | " at default\n"); | 
|  | } else if (eax & 0x40000000) { | 
|  | tjmax = tjmax_ee; | 
|  | } | 
|  | } else if (tjmax == 100000) { | 
|  | /* | 
|  | * If we don't use msr EE it means we are desktop CPU | 
|  | * (with exeception of Atom) | 
|  | */ | 
|  | dev_warn(dev, "Using relative temperature scale!\n"); | 
|  | } | 
|  |  | 
|  | return tjmax; | 
|  | } | 
|  |  | 
|  | static bool cpu_has_tjmax(struct cpuinfo_x86 *c) | 
|  | { | 
|  | u8 model = c->x86_model; | 
|  |  | 
|  | return model > 0xe && | 
|  | model != 0x1c && | 
|  | model != 0x26 && | 
|  | model != 0x27 && | 
|  | model != 0x35 && | 
|  | model != 0x36; | 
|  | } | 
|  |  | 
|  | static int get_tjmax(struct temp_data *tdata, struct device *dev) | 
|  | { | 
|  | struct cpuinfo_x86 *c = &cpu_data(tdata->cpu); | 
|  | int err; | 
|  | u32 eax, edx; | 
|  | u32 val; | 
|  |  | 
|  | /* use static tjmax once it is set */ | 
|  | if (tdata->tjmax) | 
|  | return tdata->tjmax; | 
|  |  | 
|  | /* | 
|  | * A new feature of current Intel(R) processors, the | 
|  | * IA32_TEMPERATURE_TARGET contains the TjMax value | 
|  | */ | 
|  | err = rdmsr_safe_on_cpu(tdata->cpu, MSR_IA32_TEMPERATURE_TARGET, &eax, &edx); | 
|  | if (err) { | 
|  | if (cpu_has_tjmax(c)) | 
|  | dev_warn(dev, "Unable to read TjMax from CPU %u\n", tdata->cpu); | 
|  | } else { | 
|  | val = (eax >> 16) & 0xff; | 
|  | if (val) | 
|  | return val * 1000; | 
|  | } | 
|  |  | 
|  | if (force_tjmax) { | 
|  | dev_notice(dev, "TjMax forced to %d degrees C by user\n", | 
|  | force_tjmax); | 
|  | tdata->tjmax = force_tjmax * 1000; | 
|  | } else { | 
|  | /* | 
|  | * An assumption is made for early CPUs and unreadable MSR. | 
|  | * NOTE: the calculated value may not be correct. | 
|  | */ | 
|  | tdata->tjmax = adjust_tjmax(c, tdata->cpu, dev); | 
|  | } | 
|  | return tdata->tjmax; | 
|  | } | 
|  |  | 
|  | static int get_ttarget(struct temp_data *tdata, struct device *dev) | 
|  | { | 
|  | u32 eax, edx; | 
|  | int tjmax, ttarget_offset, ret; | 
|  |  | 
|  | /* | 
|  | * ttarget is valid only if tjmax can be retrieved from | 
|  | * MSR_IA32_TEMPERATURE_TARGET | 
|  | */ | 
|  | if (tdata->tjmax) | 
|  | return -ENODEV; | 
|  |  | 
|  | ret = rdmsr_safe_on_cpu(tdata->cpu, MSR_IA32_TEMPERATURE_TARGET, &eax, &edx); | 
|  | if (ret) | 
|  | return ret; | 
|  |  | 
|  | tjmax = (eax >> 16) & 0xff; | 
|  |  | 
|  | /* Read the still undocumented bits 8:15 of IA32_TEMPERATURE_TARGET. */ | 
|  | ttarget_offset = (eax >> 8) & 0xff; | 
|  |  | 
|  | return (tjmax - ttarget_offset) * 1000; | 
|  | } | 
|  |  | 
|  | /* Keep track of how many zone pointers we allocated in init() */ | 
|  | static int max_zones __read_mostly; | 
|  | /* Array of zone pointers. Serialized by cpu hotplug lock */ | 
|  | static struct platform_device **zone_devices; | 
|  |  | 
|  | static ssize_t show_label(struct device *dev, | 
|  | struct device_attribute *devattr, char *buf) | 
|  | { | 
|  | struct platform_data *pdata = dev_get_drvdata(dev); | 
|  | struct temp_data *tdata = container_of(devattr, struct temp_data, sd_attrs[ATTR_LABEL]); | 
|  |  | 
|  | if (is_pkg_temp_data(tdata)) | 
|  | return sprintf(buf, "Package id %u\n", pdata->pkg_id); | 
|  |  | 
|  | return sprintf(buf, "Core %u\n", tdata->cpu_core_id); | 
|  | } | 
|  |  | 
|  | static ssize_t show_crit_alarm(struct device *dev, | 
|  | struct device_attribute *devattr, char *buf) | 
|  | { | 
|  | u32 eax, edx; | 
|  | struct temp_data *tdata = container_of(devattr, struct temp_data, | 
|  | sd_attrs[ATTR_CRIT_ALARM]); | 
|  |  | 
|  | mutex_lock(&tdata->update_lock); | 
|  | rdmsr_on_cpu(tdata->cpu, tdata->status_reg, &eax, &edx); | 
|  | mutex_unlock(&tdata->update_lock); | 
|  |  | 
|  | return sprintf(buf, "%d\n", (eax >> 5) & 1); | 
|  | } | 
|  |  | 
|  | static ssize_t show_tjmax(struct device *dev, | 
|  | struct device_attribute *devattr, char *buf) | 
|  | { | 
|  | struct temp_data *tdata = container_of(devattr, struct temp_data, sd_attrs[ATTR_TJMAX]); | 
|  | int tjmax; | 
|  |  | 
|  | mutex_lock(&tdata->update_lock); | 
|  | tjmax = get_tjmax(tdata, dev); | 
|  | mutex_unlock(&tdata->update_lock); | 
|  |  | 
|  | return sprintf(buf, "%d\n", tjmax); | 
|  | } | 
|  |  | 
|  | static ssize_t show_ttarget(struct device *dev, | 
|  | struct device_attribute *devattr, char *buf) | 
|  | { | 
|  | struct temp_data *tdata = container_of(devattr, struct temp_data, sd_attrs[ATTR_TTARGET]); | 
|  | int ttarget; | 
|  |  | 
|  | mutex_lock(&tdata->update_lock); | 
|  | ttarget = get_ttarget(tdata, dev); | 
|  | mutex_unlock(&tdata->update_lock); | 
|  |  | 
|  | if (ttarget < 0) | 
|  | return ttarget; | 
|  | return sprintf(buf, "%d\n", ttarget); | 
|  | } | 
|  |  | 
|  | static ssize_t show_temp(struct device *dev, | 
|  | struct device_attribute *devattr, char *buf) | 
|  | { | 
|  | u32 eax, edx; | 
|  | struct temp_data *tdata = container_of(devattr, struct temp_data, sd_attrs[ATTR_TEMP]); | 
|  | int tjmax; | 
|  |  | 
|  | mutex_lock(&tdata->update_lock); | 
|  |  | 
|  | tjmax = get_tjmax(tdata, dev); | 
|  | /* Check whether the time interval has elapsed */ | 
|  | if (time_after(jiffies, tdata->last_updated + HZ)) { | 
|  | rdmsr_on_cpu(tdata->cpu, tdata->status_reg, &eax, &edx); | 
|  | /* | 
|  | * Ignore the valid bit. In all observed cases the register | 
|  | * value is either low or zero if the valid bit is 0. | 
|  | * Return it instead of reporting an error which doesn't | 
|  | * really help at all. | 
|  | */ | 
|  | tdata->temp = tjmax - ((eax >> 16) & 0xff) * 1000; | 
|  | tdata->last_updated = jiffies; | 
|  | } | 
|  |  | 
|  | mutex_unlock(&tdata->update_lock); | 
|  | return sprintf(buf, "%d\n", tdata->temp); | 
|  | } | 
|  |  | 
|  | static int create_core_attrs(struct temp_data *tdata, struct device *dev) | 
|  | { | 
|  | int i; | 
|  | static ssize_t (*const rd_ptr[TOTAL_ATTRS]) (struct device *dev, | 
|  | struct device_attribute *devattr, char *buf) = { | 
|  | show_label, show_crit_alarm, show_temp, show_tjmax, | 
|  | show_ttarget }; | 
|  | static const char *const suffixes[TOTAL_ATTRS] = { | 
|  | "label", "crit_alarm", "input", "crit", "max" | 
|  | }; | 
|  |  | 
|  | for (i = 0; i < tdata->attr_size; i++) { | 
|  | /* | 
|  | * We map the attr number to core id of the CPU | 
|  | * The attr number is always core id + 2 | 
|  | * The Pkgtemp will always show up as temp1_*, if available | 
|  | */ | 
|  | int attr_no = is_pkg_temp_data(tdata) ? 1 : tdata->cpu_core_id + 2; | 
|  |  | 
|  | snprintf(tdata->attr_name[i], CORETEMP_NAME_LENGTH, | 
|  | "temp%d_%s", attr_no, suffixes[i]); | 
|  | sysfs_attr_init(&tdata->sd_attrs[i].attr); | 
|  | tdata->sd_attrs[i].attr.name = tdata->attr_name[i]; | 
|  | tdata->sd_attrs[i].attr.mode = 0444; | 
|  | tdata->sd_attrs[i].show = rd_ptr[i]; | 
|  | tdata->attrs[i] = &tdata->sd_attrs[i].attr; | 
|  | } | 
|  | tdata->attr_group.attrs = tdata->attrs; | 
|  | return sysfs_create_group(&dev->kobj, &tdata->attr_group); | 
|  | } | 
|  |  | 
|  |  | 
|  | static int chk_ucode_version(unsigned int cpu) | 
|  | { | 
|  | struct cpuinfo_x86 *c = &cpu_data(cpu); | 
|  |  | 
|  | /* | 
|  | * Check if we have problem with errata AE18 of Core processors: | 
|  | * Readings might stop update when processor visited too deep sleep, | 
|  | * fixed for stepping D0 (6EC). | 
|  | */ | 
|  | if (c->x86_model == 0xe && c->x86_stepping < 0xc && c->microcode < 0x39) { | 
|  | pr_err("Errata AE18 not fixed, update BIOS or microcode of the CPU!\n"); | 
|  | return -ENODEV; | 
|  | } | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static struct platform_device *coretemp_get_pdev(unsigned int cpu) | 
|  | { | 
|  | int id = topology_logical_die_id(cpu); | 
|  |  | 
|  | if (id >= 0 && id < max_zones) | 
|  | return zone_devices[id]; | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | static struct temp_data * | 
|  | init_temp_data(struct platform_data *pdata, unsigned int cpu, int pkg_flag) | 
|  | { | 
|  | struct temp_data *tdata; | 
|  |  | 
|  | if (!pdata->core_data) { | 
|  | /* | 
|  | * TODO: | 
|  | * The information of actual possible cores in a package is broken for now. | 
|  | * Will replace hardcoded NUM_REAL_CORES with actual per package core count | 
|  | * when this information becomes available. | 
|  | */ | 
|  | pdata->nr_cores = NUM_REAL_CORES; | 
|  | pdata->core_data = kcalloc(pdata->nr_cores, sizeof(struct temp_data *), | 
|  | GFP_KERNEL); | 
|  | if (!pdata->core_data) | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | tdata = kzalloc(sizeof(struct temp_data), GFP_KERNEL); | 
|  | if (!tdata) | 
|  | return NULL; | 
|  |  | 
|  | if (pkg_flag) { | 
|  | pdata->pkg_data = tdata; | 
|  | /* Use tdata->index as indicator of package temp data */ | 
|  | tdata->index = -1; | 
|  | } else { | 
|  | tdata->index = ida_alloc_max(&pdata->ida, pdata->nr_cores - 1, GFP_KERNEL); | 
|  | if (tdata->index < 0) { | 
|  | kfree(tdata); | 
|  | return NULL; | 
|  | } | 
|  | pdata->core_data[tdata->index] = tdata; | 
|  | } | 
|  |  | 
|  | tdata->status_reg = pkg_flag ? MSR_IA32_PACKAGE_THERM_STATUS : | 
|  | MSR_IA32_THERM_STATUS; | 
|  | tdata->cpu = cpu; | 
|  | tdata->cpu_core_id = topology_core_id(cpu); | 
|  | tdata->attr_size = MAX_CORE_ATTRS; | 
|  | mutex_init(&tdata->update_lock); | 
|  | return tdata; | 
|  | } | 
|  |  | 
|  | static void destroy_temp_data(struct platform_data *pdata, struct temp_data *tdata) | 
|  | { | 
|  | if (is_pkg_temp_data(tdata)) { | 
|  | pdata->pkg_data = NULL; | 
|  | kfree(pdata->core_data); | 
|  | pdata->core_data = NULL; | 
|  | pdata->nr_cores = 0; | 
|  | } else { | 
|  | pdata->core_data[tdata->index] = NULL; | 
|  | ida_free(&pdata->ida, tdata->index); | 
|  | } | 
|  | kfree(tdata); | 
|  | } | 
|  |  | 
|  | static struct temp_data *get_temp_data(struct platform_data *pdata, int cpu) | 
|  | { | 
|  | int i; | 
|  |  | 
|  | /* cpu < 0 means get pkg temp_data */ | 
|  | if (cpu < 0) | 
|  | return pdata->pkg_data; | 
|  |  | 
|  | for (i = 0; i < pdata->nr_cores; i++) { | 
|  | if (pdata->core_data[i] && | 
|  | pdata->core_data[i]->cpu_core_id == topology_core_id(cpu)) | 
|  | return pdata->core_data[i]; | 
|  | } | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | static int create_core_data(struct platform_device *pdev, unsigned int cpu, | 
|  | int pkg_flag) | 
|  | { | 
|  | struct temp_data *tdata; | 
|  | struct platform_data *pdata = platform_get_drvdata(pdev); | 
|  | struct cpuinfo_x86 *c = &cpu_data(cpu); | 
|  | u32 eax, edx; | 
|  | int err; | 
|  |  | 
|  | if (!housekeeping_cpu(cpu, HK_TYPE_MISC)) | 
|  | return 0; | 
|  |  | 
|  | tdata = init_temp_data(pdata, cpu, pkg_flag); | 
|  | if (!tdata) | 
|  | return -ENOMEM; | 
|  |  | 
|  | /* Test if we can access the status register */ | 
|  | err = rdmsr_safe_on_cpu(cpu, tdata->status_reg, &eax, &edx); | 
|  | if (err) | 
|  | goto err; | 
|  |  | 
|  | /* Make sure tdata->tjmax is a valid indicator for dynamic/static tjmax */ | 
|  | get_tjmax(tdata, &pdev->dev); | 
|  |  | 
|  | /* | 
|  | * The target temperature is available on older CPUs but not in the | 
|  | * MSR_IA32_TEMPERATURE_TARGET register. Atoms don't have the register | 
|  | * at all. | 
|  | */ | 
|  | if (c->x86_model > 0xe && c->x86_model != 0x1c) | 
|  | if (get_ttarget(tdata, &pdev->dev) >= 0) | 
|  | tdata->attr_size++; | 
|  |  | 
|  | /* Create sysfs interfaces */ | 
|  | err = create_core_attrs(tdata, pdata->hwmon_dev); | 
|  | if (err) | 
|  | goto err; | 
|  |  | 
|  | return 0; | 
|  |  | 
|  | err: | 
|  | destroy_temp_data(pdata, tdata); | 
|  | return err; | 
|  | } | 
|  |  | 
|  | static void | 
|  | coretemp_add_core(struct platform_device *pdev, unsigned int cpu, int pkg_flag) | 
|  | { | 
|  | if (create_core_data(pdev, cpu, pkg_flag)) | 
|  | dev_err(&pdev->dev, "Adding Core %u failed\n", cpu); | 
|  | } | 
|  |  | 
|  | static void coretemp_remove_core(struct platform_data *pdata, struct temp_data *tdata) | 
|  | { | 
|  | /* if we errored on add then this is already gone */ | 
|  | if (!tdata) | 
|  | return; | 
|  |  | 
|  | /* Remove the sysfs attributes */ | 
|  | sysfs_remove_group(&pdata->hwmon_dev->kobj, &tdata->attr_group); | 
|  |  | 
|  | destroy_temp_data(pdata, tdata); | 
|  | } | 
|  |  | 
|  | static int coretemp_device_add(int zoneid) | 
|  | { | 
|  | struct platform_device *pdev; | 
|  | struct platform_data *pdata; | 
|  | int err; | 
|  |  | 
|  | /* Initialize the per-zone data structures */ | 
|  | pdata = kzalloc(sizeof(*pdata), GFP_KERNEL); | 
|  | if (!pdata) | 
|  | return -ENOMEM; | 
|  |  | 
|  | pdata->pkg_id = zoneid; | 
|  | ida_init(&pdata->ida); | 
|  |  | 
|  | pdev = platform_device_alloc(DRVNAME, zoneid); | 
|  | if (!pdev) { | 
|  | err = -ENOMEM; | 
|  | goto err_free_pdata; | 
|  | } | 
|  |  | 
|  | err = platform_device_add(pdev); | 
|  | if (err) | 
|  | goto err_put_dev; | 
|  |  | 
|  | platform_set_drvdata(pdev, pdata); | 
|  | zone_devices[zoneid] = pdev; | 
|  | return 0; | 
|  |  | 
|  | err_put_dev: | 
|  | platform_device_put(pdev); | 
|  | err_free_pdata: | 
|  | kfree(pdata); | 
|  | return err; | 
|  | } | 
|  |  | 
|  | static void coretemp_device_remove(int zoneid) | 
|  | { | 
|  | struct platform_device *pdev = zone_devices[zoneid]; | 
|  | struct platform_data *pdata = platform_get_drvdata(pdev); | 
|  |  | 
|  | ida_destroy(&pdata->ida); | 
|  | kfree(pdata); | 
|  | platform_device_unregister(pdev); | 
|  | } | 
|  |  | 
|  | static int coretemp_cpu_online(unsigned int cpu) | 
|  | { | 
|  | struct platform_device *pdev = coretemp_get_pdev(cpu); | 
|  | struct cpuinfo_x86 *c = &cpu_data(cpu); | 
|  | struct platform_data *pdata; | 
|  |  | 
|  | /* | 
|  | * Don't execute this on resume as the offline callback did | 
|  | * not get executed on suspend. | 
|  | */ | 
|  | if (cpuhp_tasks_frozen) | 
|  | return 0; | 
|  |  | 
|  | /* | 
|  | * CPUID.06H.EAX[0] indicates whether the CPU has thermal | 
|  | * sensors. We check this bit only, all the early CPUs | 
|  | * without thermal sensors will be filtered out. | 
|  | */ | 
|  | if (!cpu_has(c, X86_FEATURE_DTHERM)) | 
|  | return -ENODEV; | 
|  |  | 
|  | pdata = platform_get_drvdata(pdev); | 
|  | if (!pdata->hwmon_dev) { | 
|  | struct device *hwmon; | 
|  |  | 
|  | /* Check the microcode version of the CPU */ | 
|  | if (chk_ucode_version(cpu)) | 
|  | return -EINVAL; | 
|  |  | 
|  | /* | 
|  | * Alright, we have DTS support. | 
|  | * We are bringing the _first_ core in this pkg | 
|  | * online. So, initialize per-pkg data structures and | 
|  | * then bring this core online. | 
|  | */ | 
|  | hwmon = hwmon_device_register_with_groups(&pdev->dev, DRVNAME, | 
|  | pdata, NULL); | 
|  | if (IS_ERR(hwmon)) | 
|  | return PTR_ERR(hwmon); | 
|  | pdata->hwmon_dev = hwmon; | 
|  |  | 
|  | /* | 
|  | * Check whether pkgtemp support is available. | 
|  | * If so, add interfaces for pkgtemp. | 
|  | */ | 
|  | if (cpu_has(c, X86_FEATURE_PTS)) | 
|  | coretemp_add_core(pdev, cpu, 1); | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Check whether a thread sibling is already online. If not add the | 
|  | * interface for this CPU core. | 
|  | */ | 
|  | if (!cpumask_intersects(&pdata->cpumask, topology_sibling_cpumask(cpu))) | 
|  | coretemp_add_core(pdev, cpu, 0); | 
|  |  | 
|  | cpumask_set_cpu(cpu, &pdata->cpumask); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static int coretemp_cpu_offline(unsigned int cpu) | 
|  | { | 
|  | struct platform_device *pdev = coretemp_get_pdev(cpu); | 
|  | struct platform_data *pd; | 
|  | struct temp_data *tdata; | 
|  | int target; | 
|  |  | 
|  | /* No need to tear down any interfaces for suspend */ | 
|  | if (cpuhp_tasks_frozen) | 
|  | return 0; | 
|  |  | 
|  | /* If the physical CPU device does not exist, just return */ | 
|  | pd = platform_get_drvdata(pdev); | 
|  | if (!pd->hwmon_dev) | 
|  | return 0; | 
|  |  | 
|  | tdata = get_temp_data(pd, cpu); | 
|  |  | 
|  | cpumask_clear_cpu(cpu, &pd->cpumask); | 
|  |  | 
|  | /* | 
|  | * If this is the last thread sibling, remove the CPU core | 
|  | * interface, If there is still a sibling online, transfer the | 
|  | * target cpu of that core interface to it. | 
|  | */ | 
|  | target = cpumask_any_and(&pd->cpumask, topology_sibling_cpumask(cpu)); | 
|  | if (target >= nr_cpu_ids) { | 
|  | coretemp_remove_core(pd, tdata); | 
|  | } else if (tdata && tdata->cpu == cpu) { | 
|  | mutex_lock(&tdata->update_lock); | 
|  | tdata->cpu = target; | 
|  | mutex_unlock(&tdata->update_lock); | 
|  | } | 
|  |  | 
|  | /* | 
|  | * If all cores in this pkg are offline, remove the interface. | 
|  | */ | 
|  | tdata = get_temp_data(pd, -1); | 
|  | if (cpumask_empty(&pd->cpumask)) { | 
|  | if (tdata) | 
|  | coretemp_remove_core(pd, tdata); | 
|  | hwmon_device_unregister(pd->hwmon_dev); | 
|  | pd->hwmon_dev = NULL; | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * Check whether this core is the target for the package | 
|  | * interface. We need to assign it to some other cpu. | 
|  | */ | 
|  | if (tdata && tdata->cpu == cpu) { | 
|  | target = cpumask_first(&pd->cpumask); | 
|  | mutex_lock(&tdata->update_lock); | 
|  | tdata->cpu = target; | 
|  | mutex_unlock(&tdata->update_lock); | 
|  | } | 
|  | return 0; | 
|  | } | 
|  | static const struct x86_cpu_id __initconst coretemp_ids[] = { | 
|  | X86_MATCH_VENDOR_FEATURE(INTEL, X86_FEATURE_DTHERM, NULL), | 
|  | {} | 
|  | }; | 
|  | MODULE_DEVICE_TABLE(x86cpu, coretemp_ids); | 
|  |  | 
|  | static enum cpuhp_state coretemp_hp_online; | 
|  |  | 
|  | static int __init coretemp_init(void) | 
|  | { | 
|  | int i, err; | 
|  |  | 
|  | /* | 
|  | * CPUID.06H.EAX[0] indicates whether the CPU has thermal | 
|  | * sensors. We check this bit only, all the early CPUs | 
|  | * without thermal sensors will be filtered out. | 
|  | */ | 
|  | if (!x86_match_cpu(coretemp_ids)) | 
|  | return -ENODEV; | 
|  |  | 
|  | max_zones = topology_max_packages() * topology_max_dies_per_package(); | 
|  | zone_devices = kcalloc(max_zones, sizeof(struct platform_device *), | 
|  | GFP_KERNEL); | 
|  | if (!zone_devices) | 
|  | return -ENOMEM; | 
|  |  | 
|  | for (i = 0; i < max_zones; i++) { | 
|  | err = coretemp_device_add(i); | 
|  | if (err) | 
|  | goto outzone; | 
|  | } | 
|  |  | 
|  | err = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "hwmon/coretemp:online", | 
|  | coretemp_cpu_online, coretemp_cpu_offline); | 
|  | if (err < 0) | 
|  | goto outzone; | 
|  | coretemp_hp_online = err; | 
|  | return 0; | 
|  |  | 
|  | outzone: | 
|  | while (i--) | 
|  | coretemp_device_remove(i); | 
|  | kfree(zone_devices); | 
|  | return err; | 
|  | } | 
|  | module_init(coretemp_init) | 
|  |  | 
|  | static void __exit coretemp_exit(void) | 
|  | { | 
|  | int i; | 
|  |  | 
|  | cpuhp_remove_state(coretemp_hp_online); | 
|  | for (i = 0; i < max_zones; i++) | 
|  | coretemp_device_remove(i); | 
|  | kfree(zone_devices); | 
|  | } | 
|  | module_exit(coretemp_exit) | 
|  |  | 
|  | MODULE_AUTHOR("Rudolf Marek <r.marek@assembler.cz>"); | 
|  | MODULE_DESCRIPTION("Intel Core temperature monitor"); | 
|  | MODULE_LICENSE("GPL"); |