k10temp.c 10.9 KB
Newer Older
1
/*
2
 * k10temp.c - AMD Family 10h/11h/12h/14h/15h/16h processor hardware monitoring
3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
 *
 * Copyright (c) 2009 Clemens Ladisch <clemens@ladisch.de>
 *
 *
 * This driver is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This driver is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 * See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this driver; if not, see <http://www.gnu.org/licenses/>.
 */

#include <linux/err.h>
#include <linux/hwmon.h>
#include <linux/hwmon-sysfs.h>
#include <linux/init.h>
#include <linux/module.h>
#include <linux/pci.h>
26
#include <asm/amd_nb.h>
27 28
#include <asm/processor.h>

29
/* Module metadata. */
MODULE_AUTHOR("Clemens Ladisch <clemens@ladisch.de>");
MODULE_DESCRIPTION("AMD Family 10h+ CPU core temperature monitor");
MODULE_LICENSE("GPL");

/*
 * "force" module parameter (mode 0444): when set, k10temp_probe() still
 * binds to a processor that has_erratum_319() reports as unreliable and
 * only prints a warning instead of refusing to load.
 */
static bool force;
module_param(force, bool, 0444);
MODULE_PARM_DESC(force, "force loading on processors with erratum 319");

37 38 39
/*
 * Provide lock for writing to NB_SMU_IND_ADDR.
 *
 * amd_nb_index_read() writes an index register and then reads the matching
 * data register; this mutex keeps that two-step sequence from being
 * interleaved with another reader's index write.
 */
static DEFINE_MUTEX(nb_smu_ind_mutex);

40 41 42 43
/*
 * Fallback PCI device IDs, defined here only when the included headers do
 * not already provide them. All three are referenced by k10temp_id_table.
 */
#ifndef PCI_DEVICE_ID_AMD_15H_M70H_NB_F3
#define PCI_DEVICE_ID_AMD_15H_M70H_NB_F3	0x15b3
#endif

#ifndef PCI_DEVICE_ID_AMD_17H_DF_F3
#define PCI_DEVICE_ID_AMD_17H_DF_F3	0x1463
#endif

#ifndef PCI_DEVICE_ID_AMD_17H_M10H_DF_F3
#define PCI_DEVICE_ID_AMD_17H_M10H_DF_F3	0x15eb
#endif

52 53 54 55 56 57 58 59 60 61
/*
 * CPUID function 0x80000001, EBX: package type field.
 * Used by has_erratum_319() to tell the processor socket apart.
 */
#define CPUID_PKGTYPE_MASK	0xf0000000
#define CPUID_PKGTYPE_F		0x00000000
#define CPUID_PKGTYPE_AM2R2_AM3	0x10000000

/* DRAM controller (PCI function 2); DDR3_MODE is a flag in this register */
#define REG_DCT0_CONFIG_HIGH		0x094
#define  DDR3_MODE			0x00000100

/* Miscellaneous control (PCI function 3) */

/* Hardware thermal control register and its enable flag */
#define REG_HARDWARE_THERMAL_CONTROL	0x64
#define  HTC_ENABLE			0x00000001

/* Reported temperature register, decoded by get_raw_temp() */
#define REG_REPORTED_TEMPERATURE	0xa4

/* Northbridge capabilities register and its "HTC present" flag */
#define REG_NORTHBRIDGE_CAPABILITIES	0xe8
#define  NB_CAP_HTC			0x00000400

70
/*
 * For F15h M60h and M70h, REG_HARDWARE_THERMAL_CONTROL and
 * REG_REPORTED_TEMPERATURE have been moved to
 *   D0F0xBC_xD820_0C64 [Hardware Temperature Control]
 *   D0F0xBC_xD820_0CA4 [Reported Temperature Control]
 * The driver reaches them through amd_nb_index_read().
 */
#define F15H_M60H_HARDWARE_TEMP_CTRL_OFFSET	0xd8200c64
#define F15H_M60H_REPORTED_TEMP_CTRL_OFFSET	0xd8200ca4

/* F17h M01h: reported temperature register, accessed through SMN */
#define F17H_M01H_REPORTED_TEMP_CTRL_OFFSET	0x00059800

82 83
struct k10temp_data {
	struct pci_dev *pdev;
84
	void (*read_htcreg)(struct pci_dev *pdev, u32 *regval);
85
	void (*read_tempreg)(struct pci_dev *pdev, u32 *regval);
86
	int temp_offset;
87
	u32 temp_adjust_mask;
88
	bool show_tdie;
89 90 91 92 93 94 95 96 97
};

/*
 * One row of tctl_offset_table: a temperature offset that applies to a
 * particular processor.
 */
struct tctl_offset {
	/* Compared against boot_cpu_data.x86 (the CPU family) in the probe */
	u8 model;
	/* Substring searched for in boot_cpu_data.x86_model_id */
	const char *id;
	/* Value stored in k10temp_data.temp_offset on a match */
	int offset;
};

/*
 * Known per-processor temperature offsets.
 *
 * k10temp_probe() scans this table top to bottom, matches each id as a
 * substring of the CPU model string and stops at the first hit. Entry order
 * therefore matters: a longer name such as "... 1950X" has to stay ahead of
 * its prefix "... 1950".
 */
static const struct tctl_offset tctl_offset_table[] = {
	{ .model = 0x17, .id = "AMD Ryzen 5 1600X", .offset = 20000 },
	{ .model = 0x17, .id = "AMD Ryzen 7 1700X", .offset = 20000 },
	{ .model = 0x17, .id = "AMD Ryzen 7 1800X", .offset = 20000 },
	{ .model = 0x17, .id = "AMD Ryzen 7 2700X", .offset = 10000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 1950X", .offset = 27000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 1920X", .offset = 27000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 1900X", .offset = 27000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 1950", .offset = 10000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 1920", .offset = 10000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 1910", .offset = 10000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 2950X", .offset = 27000 },
	{ .model = 0x17, .id = "AMD Ryzen Threadripper 2990WX", .offset = 27000 },
};

112 113 114 115 116
/*
 * Read the hardware thermal control register directly from the PCI
 * configuration space of @pdev and store it in *@regval.
 */
static void read_htcreg_pci(struct pci_dev *pdev, u32 *regval)
{
	pci_read_config_dword(pdev, REG_HARDWARE_THERMAL_CONTROL, regval);
}

117 118 119 120 121 122 123
/*
 * Read the reported temperature register directly from the PCI
 * configuration space of @pdev and store it in *@regval.
 */
static void read_tempreg_pci(struct pci_dev *pdev, u32 *regval)
{
	pci_read_config_dword(pdev, REG_REPORTED_TEMPERATURE, regval);
}

/*
 * Indirect register read through an index/data register pair.
 *
 * @pdev:   device whose bus is used for the config accesses
 * @devfn:  device/function on that bus that hosts the register pair
 * @base:   config-space address of the index register; the data register
 *          is read from @base + 4
 * @offset: value written to the index register to select the target
 * @val:    receives the dword read from the data register
 *
 * The write/read sequence is performed under nb_smu_ind_mutex so that the
 * index cannot be changed between the two steps.
 */
static void amd_nb_index_read(struct pci_dev *pdev, unsigned int devfn,
			      unsigned int base, int offset, u32 *val)
{
	struct pci_bus *bus = pdev->bus;
	const unsigned int data_reg = base + 4;

	mutex_lock(&nb_smu_ind_mutex);
	pci_bus_write_config_dword(bus, devfn, base, offset);
	pci_bus_read_config_dword(bus, devfn, data_reg, val);
	mutex_unlock(&nb_smu_ind_mutex);
}

133 134 135 136 137 138
/*
 * Read the hardware temperature control register on F15h M60h/M70h, where
 * it is reached indirectly via the index register at 0xb8 of device 0,
 * function 0 on @pdev's bus.
 */
static void read_htcreg_nb_f15(struct pci_dev *pdev, u32 *regval)
{
	const unsigned int host_devfn = PCI_DEVFN(0, 0);
	const unsigned int index_reg = 0xb8;

	amd_nb_index_read(pdev, host_devfn, index_reg,
			  F15H_M60H_HARDWARE_TEMP_CTRL_OFFSET, regval);
}

139 140 141 142 143 144
/*
 * Read the reported temperature register on F15h M60h/M70h, where it is
 * reached indirectly via the index register at 0xb8 of device 0,
 * function 0 on @pdev's bus.
 */
static void read_tempreg_nb_f15(struct pci_dev *pdev, u32 *regval)
{
	const unsigned int host_devfn = PCI_DEVFN(0, 0);
	const unsigned int index_reg = 0xb8;

	amd_nb_index_read(pdev, host_devfn, index_reg,
			  F15H_M60H_REPORTED_TEMP_CTRL_OFFSET, regval);
}

145 146
/*
 * Read the F17h reported temperature register through SMN.
 *
 * @pdev:   device used to look up the node id for the SMN access
 * @regval: receives the register value
 *
 * A non-zero return from amd_smn_read() is treated as failure. In that case
 * *@regval is set to 0, so callers such as get_raw_temp() never decode an
 * uninitialized stack value into a temperature.
 */
static void read_tempreg_nb_f17(struct pci_dev *pdev, u32 *regval)
{
	if (amd_smn_read(amd_pci_dev_to_node_id(pdev),
			 F17H_M01H_REPORTED_TEMP_CTRL_OFFSET, regval))
		*regval = 0;
}

151
static unsigned int get_raw_temp(struct k10temp_data *data)
152
{
153
	unsigned int temp;
154
	u32 regval;
155 156 157

	data->read_tempreg(data->pdev, &regval);
	temp = (regval >> 21) * 125;
158 159
	if (regval & data->temp_adjust_mask)
		temp -= 49000;
160 161 162 163 164 165 166 167 168
	return temp;
}

static ssize_t temp1_input_show(struct device *dev,
				struct device_attribute *attr, char *buf)
{
	struct k10temp_data *data = dev_get_drvdata(dev);
	unsigned int temp = get_raw_temp(data);

169 170 171 172
	if (temp > data->temp_offset)
		temp -= data->temp_offset;
	else
		temp = 0;
173 174

	return sprintf(buf, "%u\n", temp);
175 176
}

177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193
/*
 * sysfs show handler for temp2_input: the raw temperature as returned by
 * get_raw_temp(), without the per-processor offset applied.
 */
static ssize_t temp2_input_show(struct device *dev,
				struct device_attribute *devattr, char *buf)
{
	return sprintf(buf, "%u\n", get_raw_temp(dev_get_drvdata(dev)));
}

static ssize_t temp_label_show(struct device *dev,
			       struct device_attribute *devattr, char *buf)
{
	struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);

	return sprintf(buf, "%s\n", attr->index ? "Tctl" : "Tdie");
}

194 195
/* sysfs show handler for temp1_max: always reports the constant 70000. */
static ssize_t temp1_max_show(struct device *dev,
			      struct device_attribute *attr, char *buf)
{
	const int max_temp = 70 * 1000;

	return sprintf(buf, "%d\n", max_temp);
}

static ssize_t show_temp_crit(struct device *dev,
			      struct device_attribute *devattr, char *buf)
{
	struct sensor_device_attribute *attr = to_sensor_dev_attr(devattr);
204
	struct k10temp_data *data = dev_get_drvdata(dev);
205 206 207 208
	int show_hyst = attr->index;
	u32 regval;
	int value;

209
	data->read_htcreg(data->pdev, &regval);
210 211 212 213 214 215
	value = ((regval >> 16) & 0x7f) * 500 + 52000;
	if (show_hyst)
		value -= ((regval >> 24) & 0xf) * 500;
	return sprintf(buf, "%d\n", value);
}

216 217
/*
 * sysfs attribute objects. All are read-only (mode 0444); the index
 * argument of the SENSOR_DEVICE_ATTR entries is what the shared show
 * handlers use to tell their attributes apart.
 */

/* temp1: offset-corrected temperature, fixed maximum, critical limits */
static DEVICE_ATTR_RO(temp1_input);
static DEVICE_ATTR_RO(temp1_max);
static SENSOR_DEVICE_ATTR(temp1_crit, 0444, show_temp_crit, NULL, 0);
static SENSOR_DEVICE_ATTR(temp1_crit_hyst, 0444, show_temp_crit, NULL, 1);
static SENSOR_DEVICE_ATTR(temp1_label, 0444, temp_label_show, NULL, 0);

/* temp2: raw temperature and its label */
static DEVICE_ATTR_RO(temp2_input);
static SENSOR_DEVICE_ATTR(temp2_label, 0444, temp_label_show, NULL, 1);

225 226 227 228
static umode_t k10temp_is_visible(struct kobject *kobj,
				  struct attribute *attr, int index)
{
	struct device *dev = container_of(kobj, struct device, kobj);
229 230
	struct k10temp_data *data = dev_get_drvdata(dev);
	struct pci_dev *pdev = data->pdev;
231
	u32 reg;
232

233 234 235 236 237
	switch (index) {
	case 0 ... 1:	/* temp1_input, temp1_max */
	default:
		break;
	case 2 ... 3:	/* temp1_crit, temp1_crit_hyst */
238 239
		if (!data->read_htcreg)
			return 0;
240 241

		pci_read_config_dword(pdev, REG_NORTHBRIDGE_CAPABILITIES,
242 243 244 245 246 247
				      &reg);
		if (!(reg & NB_CAP_HTC))
			return 0;

		data->read_htcreg(data->pdev, &reg);
		if (!(reg & HTC_ENABLE))
248
			return 0;
249 250 251 252 253
		break;
	case 4 ... 6:	/* temp1_label, temp2_input, temp2_label */
		if (!data->show_tdie)
			return 0;
		break;
254 255 256 257 258 259 260 261 262
	}
	return attr->mode;
}

static struct attribute *k10temp_attrs[] = {
	&dev_attr_temp1_input.attr,
	&dev_attr_temp1_max.attr,
	&sensor_dev_attr_temp1_crit.dev_attr.attr,
	&sensor_dev_attr_temp1_crit_hyst.dev_attr.attr,
263 264 265
	&sensor_dev_attr_temp1_label.dev_attr.attr,
	&dev_attr_temp2_input.attr,
	&sensor_dev_attr_temp2_label.dev_attr.attr,
266 267 268 269 270 271 272 273
	NULL
};

/*
 * Attribute group tying k10temp_attrs[] to its visibility callback.
 * __ATTRIBUTE_GROUPS() wraps it into the k10temp_groups list that
 * k10temp_probe() passes to the hwmon registration call.
 */
static const struct attribute_group k10temp_group = {
	.attrs = k10temp_attrs,
	.is_visible = k10temp_is_visible,
};
__ATTRIBUTE_GROUPS(k10temp);
274

B
Bill Pemberton 已提交
275
static bool has_erratum_319(struct pci_dev *pdev)
276
{
277 278 279 280 281
	u32 pkg_type, reg_dram_cfg;

	if (boot_cpu_data.x86 != 0x10)
		return false;

282
	/*
283 284
	 * Erratum 319: The thermal sensor of Socket F/AM2+ processors
	 *              may be unreliable.
285
	 */
286 287 288 289 290 291
	pkg_type = cpuid_ebx(0x80000001) & CPUID_PKGTYPE_MASK;
	if (pkg_type == CPUID_PKGTYPE_F)
		return true;
	if (pkg_type != CPUID_PKGTYPE_AM2R2_AM3)
		return false;

292
	/* DDR3 memory implies socket AM3, which is good */
293 294 295
	pci_bus_read_config_dword(pdev->bus,
				  PCI_DEVFN(PCI_SLOT(pdev->devfn), 2),
				  REG_DCT0_CONFIG_HIGH, &reg_dram_cfg);
296 297 298 299 300 301 302 303 304 305
	if (reg_dram_cfg & DDR3_MODE)
		return false;

	/*
	 * Unfortunately it is possible to run a socket AM3 CPU with DDR2
	 * memory. We blacklist all the cores which do exist in socket AM2+
	 * format. It still isn't perfect, as RB-C2 cores exist in both AM2+
	 * and AM3 formats, but that's the best we can do.
	 */
	return boot_cpu_data.x86_model < 4 ||
306
	       (boot_cpu_data.x86_model == 4 && boot_cpu_data.x86_stepping <= 2);
307 308
}

B
Bill Pemberton 已提交
309
static int k10temp_probe(struct pci_dev *pdev,
310 311
				   const struct pci_device_id *id)
{
312
	int unreliable = has_erratum_319(pdev);
313
	struct device *dev = &pdev->dev;
314
	struct k10temp_data *data;
315
	struct device *hwmon_dev;
316
	int i;
317

318 319 320 321 322 323 324
	if (unreliable) {
		if (!force) {
			dev_err(dev,
				"unreliable CPU thermal sensor; monitoring disabled\n");
			return -ENODEV;
		}
		dev_warn(dev,
325
			 "unreliable CPU thermal sensor; check erratum 319\n");
326
	}
327

328 329 330 331 332 333 334
	data = devm_kzalloc(dev, sizeof(*data), GFP_KERNEL);
	if (!data)
		return -ENOMEM;

	data->pdev = pdev;

	if (boot_cpu_data.x86 == 0x15 && (boot_cpu_data.x86_model == 0x60 ||
335
					  boot_cpu_data.x86_model == 0x70)) {
336
		data->read_htcreg = read_htcreg_nb_f15;
337
		data->read_tempreg = read_tempreg_nb_f15;
338 339
	} else if (boot_cpu_data.x86 == 0x17) {
		data->temp_adjust_mask = 0x80000;
340
		data->read_tempreg = read_tempreg_nb_f17;
341
		data->show_tdie = true;
342
	} else {
343
		data->read_htcreg = read_htcreg_pci;
344
		data->read_tempreg = read_tempreg_pci;
345
	}
346

347 348 349 350 351 352 353 354 355 356
	for (i = 0; i < ARRAY_SIZE(tctl_offset_table); i++) {
		const struct tctl_offset *entry = &tctl_offset_table[i];

		if (boot_cpu_data.x86 == entry->model &&
		    strstr(boot_cpu_data.x86_model_id, entry->id)) {
			data->temp_offset = entry->offset;
			break;
		}
	}

357
	hwmon_dev = devm_hwmon_device_register_with_groups(dev, "k10temp", data,
358 359
							   k10temp_groups);
	return PTR_ERR_OR_ZERO(hwmon_dev);
360 361
}

362
static const struct pci_device_id k10temp_id_table[] = {
363 364
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_10H_NB_MISC) },
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_11H_NB_MISC) },
365
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_CNB17H_F3) },
366
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_15H_NB_F3) },
367
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_15H_M10H_F3) },
368
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_15H_M30H_NB_F3) },
369
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_15H_M60H_NB_F3) },
370
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_15H_M70H_NB_F3) },
371
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_16H_NB_F3) },
372
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_16H_M30H_NB_F3) },
373
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_17H_DF_F3) },
374
	{ PCI_VDEVICE(AMD, PCI_DEVICE_ID_AMD_17H_M10H_DF_F3) },
375 376 377 378 379 380 381 382 383 384
	{}
};
MODULE_DEVICE_TABLE(pci, k10temp_id_table);

/*
 * PCI driver description: binds k10temp_probe() to the devices listed in
 * k10temp_id_table. No remove callback is set; the probe only uses
 * devm_* managed allocations and registration.
 */
static struct pci_driver k10temp_driver = {
	.name = "k10temp",
	.id_table = k10temp_id_table,
	.probe = k10temp_probe,
};

A
Axel Lin 已提交
385
/* Generate the module init/exit boilerplate that registers k10temp_driver. */
module_pci_driver(k10temp_driver);