aspm.c 26.4 KB
Newer Older
S
Shaohua Li 已提交
1 2
/*
 * File:	drivers/pci/pcie/aspm.c
 * Enabling PCIe link L0s/L1 state and Clock Power Management
 *
 * Copyright (C) 2007 Intel
 * Copyright (C) Zhang Yanmin (yanmin.zhang@intel.com)
 * Copyright (C) Shaohua Li (shaohua.li@intel.com)
 */

#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/moduleparam.h>
#include <linux/pci.h>
#include <linux/pci_regs.h>
#include <linux/errno.h>
#include <linux/pm.h>
#include <linux/init.h>
#include <linux/slab.h>
19
#include <linux/jiffies.h>
20
#include <linux/delay.h>
S
Shaohua Li 已提交
21 22 23 24 25 26 27 28
#include <linux/pci-aspm.h>
#include "../pci.h"

/*
 * Override any previously defined module parameter prefix so that the
 * parameters declared in this file are named "pcie_aspm.<param>".
 */
#ifdef MODULE_PARAM_PREFIX
#undef MODULE_PARAM_PREFIX
#endif
#define MODULE_PARAM_PREFIX "pcie_aspm."

29 30 31 32 33 34 35
/*
 * Software bitmask describing the ASPM states of a link.
 * Note: those are not register definitions; pcie_config_aspm_link()
 * converts them to PCI_EXP_LNKCTL_ASPM_* register values.
 */
#define ASPM_STATE_L0S_UP	(1)	/* Upstream direction L0s state */
#define ASPM_STATE_L0S_DW	(2)	/* Downstream direction L0s state */
#define ASPM_STATE_L1		(4)	/* L1 state */
#define ASPM_STATE_L0S		(ASPM_STATE_L0S_UP | ASPM_STATE_L0S_DW)
#define ASPM_STATE_ALL		(ASPM_STATE_L0S | ASPM_STATE_L1)

36 37 38
/* A pair of latencies, one per ASPM state, both expressed in nanoseconds */
struct aspm_latency {
	u32 l0s;	/* L0s latency (nsec) */
	u32 l1;		/* L1 latency (nsec) */
};

struct pcie_link_state {
42
	struct pci_dev *pdev;		/* Upstream component of the Link */
43
	struct pcie_link_state *root;	/* pointer to the root port link */
44 45 46 47
	struct pcie_link_state *parent;	/* pointer to the parent Link state */
	struct list_head sibling;	/* node in link_list */
	struct list_head children;	/* list of child link states */
	struct list_head link;		/* node in parent's children list */
S
Shaohua Li 已提交
48 49

	/* ASPM state */
50 51 52 53 54
	u32 aspm_support:3;		/* Supported ASPM state */
	u32 aspm_enabled:3;		/* Enabled ASPM state */
	u32 aspm_capable:3;		/* Capable ASPM state with latency */
	u32 aspm_default:3;		/* Default ASPM state by BIOS */
	u32 aspm_disable:3;		/* Disabled ASPM state */
55

56 57 58 59 60
	/* Clock PM state */
	u32 clkpm_capable:1;		/* Clock PM capable? */
	u32 clkpm_enabled:1;		/* Current Clock PM state */
	u32 clkpm_default:1;		/* Default Clock PM state by BIOS */

61 62 63
	/* Exit latencies */
	struct aspm_latency latency_up;	/* Upstream direction exit latency */
	struct aspm_latency latency_dw;	/* Downstream direction exit latency */
S
Shaohua Li 已提交
64
	/*
65 66
	 * Endpoint acceptable latencies. A pcie downstream port only
	 * has one slot under it, so at most there are 8 functions.
S
Shaohua Li 已提交
67
	 */
68
	struct aspm_latency acceptable[8];
S
Shaohua Li 已提交
69 70
};

M
Matthew Garrett 已提交
71
static int aspm_disabled, aspm_force;
72
static bool aspm_support_enabled = true;
S
Shaohua Li 已提交
73 74 75 76 77 78
static DEFINE_MUTEX(aspm_lock);
static LIST_HEAD(link_list);

/* Policy identifiers; they double as indexes into policy_str[] */
#define POLICY_DEFAULT 0	/* BIOS default setting */
#define POLICY_PERFORMANCE 1	/* high performance */
#define POLICY_POWERSAVE 2	/* high power saving */

/* Initial policy is selected at build time through Kconfig */
#if defined(CONFIG_PCIEASPM_PERFORMANCE)
static int aspm_policy = POLICY_PERFORMANCE;
#elif defined(CONFIG_PCIEASPM_POWERSAVE)
static int aspm_policy = POLICY_POWERSAVE;
#else
static int aspm_policy;		/* zero, i.e. POLICY_DEFAULT */
#endif

/* Names accepted and shown by the "policy" module parameter */
static const char *policy_str[] = {
	[POLICY_DEFAULT] = "default",
	[POLICY_PERFORMANCE] = "performance",
	[POLICY_POWERSAVE] = "powersave"
};

/* Longest time, in jiffies, to wait for link retraining to finish */
#define LINK_RETRAIN_TIMEOUT HZ

96
static int policy_to_aspm_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
97 98 99 100 101 102 103
{
	switch (aspm_policy) {
	case POLICY_PERFORMANCE:
		/* Disable ASPM and Clock PM */
		return 0;
	case POLICY_POWERSAVE:
		/* Enable ASPM L0s/L1 */
104
		return ASPM_STATE_ALL;
S
Shaohua Li 已提交
105
	case POLICY_DEFAULT:
106
		return link->aspm_default;
S
Shaohua Li 已提交
107 108 109 110
	}
	return 0;
}

111
static int policy_to_clkpm_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
112 113 114 115 116 117 118 119 120
{
	switch (aspm_policy) {
	case POLICY_PERFORMANCE:
		/* Disable ASPM and Clock PM */
		return 0;
	case POLICY_POWERSAVE:
		/* Disable Clock PM */
		return 1;
	case POLICY_DEFAULT:
121
		return link->clkpm_default;
S
Shaohua Li 已提交
122 123 124 125
	}
	return 0;
}

K
Kenji Kaneshige 已提交
126
static void pcie_set_clkpm_nocheck(struct pcie_link_state *link, int enable)
S
Shaohua Li 已提交
127
{
128 129
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
130
	u32 val = enable ? PCI_EXP_LNKCTL_CLKREQ_EN : 0;
S
Shaohua Li 已提交
131

132 133 134 135
	list_for_each_entry(child, &linkbus->devices, bus_list)
		pcie_capability_clear_and_set_word(child, PCI_EXP_LNKCTL,
						   PCI_EXP_LNKCTL_CLKREQ_EN,
						   val);
136
	link->clkpm_enabled = !!enable;
S
Shaohua Li 已提交
137 138
}

K
Kenji Kaneshige 已提交
139 140 141 142
/*
 * Set the Clock PM state of @link, silently refusing to enable it on a
 * link that is not Clock PM capable and skipping redundant updates.
 */
static void pcie_set_clkpm(struct pcie_link_state *link, int enable)
{
	int wanted = enable;

	/* A link that is not Clock PM capable can only be switched off */
	if (wanted && !link->clkpm_capable)
		wanted = 0;

	/* Only touch the hardware when the state really changes */
	if (link->clkpm_enabled != wanted)
		pcie_set_clkpm_nocheck(link, wanted);
}

150
static void pcie_clkpm_cap_init(struct pcie_link_state *link, int blacklist)
S
Shaohua Li 已提交
151
{
152
	int capable = 1, enabled = 1;
S
Shaohua Li 已提交
153 154
	u32 reg32;
	u16 reg16;
155 156
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
S
Shaohua Li 已提交
157 158

	/* All functions should have the same cap and state, take the worst */
159
	list_for_each_entry(child, &linkbus->devices, bus_list) {
160
		pcie_capability_read_dword(child, PCI_EXP_LNKCAP, &reg32);
S
Shaohua Li 已提交
161 162 163 164 165
		if (!(reg32 & PCI_EXP_LNKCAP_CLKPM)) {
			capable = 0;
			enabled = 0;
			break;
		}
166
		pcie_capability_read_word(child, PCI_EXP_LNKCTL, &reg16);
S
Shaohua Li 已提交
167 168 169
		if (!(reg16 & PCI_EXP_LNKCTL_CLKREQ_EN))
			enabled = 0;
	}
170 171
	link->clkpm_enabled = enabled;
	link->clkpm_default = enabled;
172
	link->clkpm_capable = (blacklist) ? 0 : capable;
173 174
}

S
Shaohua Li 已提交
175 176 177 178 179
/*
 * pcie_aspm_configure_common_clock: check if the 2 ends of a link
 *   could use common clock. If they are, configure them to use the
 *   common clock. That will reduce the ASPM state exit latency.
 */
180
static void pcie_aspm_configure_common_clock(struct pcie_link_state *link)
S
Shaohua Li 已提交
181
{
182
	int same_clock = 1;
183
	u16 reg16, parent_reg, child_reg[8];
184
	unsigned long start_jiffies;
185 186
	struct pci_dev *child, *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
S
Shaohua Li 已提交
187
	/*
188
	 * All functions of a slot should have the same Slot Clock
S
Shaohua Li 已提交
189
	 * Configuration, so just check one function
190 191
	 */
	child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
K
Kenji Kaneshige 已提交
192
	BUG_ON(!pci_is_pcie(child));
S
Shaohua Li 已提交
193 194

	/* Check downstream component if bit Slot Clock Configuration is 1 */
195
	pcie_capability_read_word(child, PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
196 197 198 199
	if (!(reg16 & PCI_EXP_LNKSTA_SLC))
		same_clock = 0;

	/* Check upstream component if bit Slot Clock Configuration is 1 */
200
	pcie_capability_read_word(parent, PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
201 202 203 204
	if (!(reg16 & PCI_EXP_LNKSTA_SLC))
		same_clock = 0;

	/* Configure downstream component, all functions */
205
	list_for_each_entry(child, &linkbus->devices, bus_list) {
206
		pcie_capability_read_word(child, PCI_EXP_LNKCTL, &reg16);
207
		child_reg[PCI_FUNC(child->devfn)] = reg16;
S
Shaohua Li 已提交
208 209 210 211
		if (same_clock)
			reg16 |= PCI_EXP_LNKCTL_CCC;
		else
			reg16 &= ~PCI_EXP_LNKCTL_CCC;
212
		pcie_capability_write_word(child, PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
213 214 215
	}

	/* Configure upstream component */
216
	pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &reg16);
217
	parent_reg = reg16;
S
Shaohua Li 已提交
218 219 220 221
	if (same_clock)
		reg16 |= PCI_EXP_LNKCTL_CCC;
	else
		reg16 &= ~PCI_EXP_LNKCTL_CCC;
222
	pcie_capability_write_word(parent, PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
223

224
	/* Retrain link */
S
Shaohua Li 已提交
225
	reg16 |= PCI_EXP_LNKCTL_RL;
226
	pcie_capability_write_word(parent, PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
227

228
	/* Wait for link training end. Break out after waiting for timeout */
229
	start_jiffies = jiffies;
230
	for (;;) {
231
		pcie_capability_read_word(parent, PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
232 233
		if (!(reg16 & PCI_EXP_LNKSTA_LT))
			break;
234 235 236
		if (time_after(jiffies, start_jiffies + LINK_RETRAIN_TIMEOUT))
			break;
		msleep(1);
S
Shaohua Li 已提交
237
	}
238 239 240 241
	if (!(reg16 & PCI_EXP_LNKSTA_LT))
		return;

	/* Training failed. Restore common clock configurations */
242
	dev_err(&parent->dev, "ASPM: Could not configure common clock\n");
243 244 245 246
	list_for_each_entry(child, &linkbus->devices, bus_list)
		pcie_capability_write_word(child, PCI_EXP_LNKCTL,
					   child_reg[PCI_FUNC(child->devfn)]);
	pcie_capability_write_word(parent, PCI_EXP_LNKCTL, parent_reg);
S
Shaohua Li 已提交
247 248
}

249 250
/*
 * Translate an L0s exit latency encoding into nanoseconds.
 * Encoding 0x7 is reported as 5000ns ("> 4us"); any other encoding
 * yields 64ns shifted left by the encoding.
 */
static u32 calc_l0s_latency(u32 encoding)
{
	if (encoding != 0x7)
		return 64 << encoding;

	return 5 * 1000;	/* > 4us */
}
S
Shaohua Li 已提交
256

257 258 259 260 261 262
/*
 * Translate an L0s acceptable latency encoding into nanoseconds.
 * Encoding 0x7 yields the largest u32 value; any other encoding
 * yields 64ns shifted left by the encoding.
 */
static u32 calc_l0s_acceptable(u32 encoding)
{
	if (encoding != 0x7)
		return 64 << encoding;

	return -1U;
}

265 266
/*
 * Translate an L1 exit latency encoding into nanoseconds.
 * Encoding 0x7 is reported as 65000ns ("> 64us"); any other encoding
 * yields 1000ns shifted left by the encoding.
 */
static u32 calc_l1_latency(u32 encoding)
{
	if (encoding != 0x7)
		return 1000 << encoding;

	return 65 * 1000;	/* > 64us */
}
S
Shaohua Li 已提交
272

273 274 275 276 277 278
/*
 * Translate an L1 acceptable latency encoding into nanoseconds.
 * Encoding 0x7 yields the largest u32 value; any other encoding
 * yields 1000ns shifted left by the encoding.
 */
static u32 calc_l1_acceptable(u32 encoding)
{
	if (encoding != 0x7)
		return 1000 << encoding;

	return -1U;
}

281 282 283 284 285 286 287 288 289
/*
 * Raw ASPM fields of one device, as filled in by pcie_get_aspm_reg()
 * from the Link Capabilities and Link Control registers.
 */
struct aspm_register_info {
	u32 support:2;			/* ASPM support field of LNKCAP */
	u32 enabled:2;			/* ASPM control field of LNKCTL */
	u32 latency_encoding_l0s;	/* L0s exit latency encoding (LNKCAP) */
	u32 latency_encoding_l1;	/* L1 exit latency encoding (LNKCAP) */
};

static void pcie_get_aspm_reg(struct pci_dev *pdev,
			      struct aspm_register_info *info)
S
Shaohua Li 已提交
290 291
{
	u16 reg16;
292
	u32 reg32;
S
Shaohua Li 已提交
293

294
	pcie_capability_read_dword(pdev, PCI_EXP_LNKCAP, &reg32);
295 296 297
	info->support = (reg32 & PCI_EXP_LNKCAP_ASPMS) >> 10;
	info->latency_encoding_l0s = (reg32 & PCI_EXP_LNKCAP_L0SEL) >> 12;
	info->latency_encoding_l1  = (reg32 & PCI_EXP_LNKCAP_L1EL) >> 15;
298
	pcie_capability_read_word(pdev, PCI_EXP_LNKCTL, &reg16);
299
	info->enabled = reg16 & PCI_EXP_LNKCTL_ASPMC;
S
Shaohua Li 已提交
300 301
}

302 303
static void pcie_aspm_check_latency(struct pci_dev *endpoint)
{
304
	u32 latency, l1_switch_latency = 0;
305 306 307 308 309 310 311 312 313 314 315 316
	struct aspm_latency *acceptable;
	struct pcie_link_state *link;

	/* Device not in D0 doesn't need latency check */
	if ((endpoint->current_state != PCI_D0) &&
	    (endpoint->current_state != PCI_UNKNOWN))
		return;

	link = endpoint->bus->self->link_state;
	acceptable = &link->acceptable[PCI_FUNC(endpoint->devfn)];

	while (link) {
317 318 319 320 321 322 323 324 325
		/* Check upstream direction L0s latency */
		if ((link->aspm_capable & ASPM_STATE_L0S_UP) &&
		    (link->latency_up.l0s > acceptable->l0s))
			link->aspm_capable &= ~ASPM_STATE_L0S_UP;

		/* Check downstream direction L0s latency */
		if ((link->aspm_capable & ASPM_STATE_L0S_DW) &&
		    (link->latency_dw.l0s > acceptable->l0s))
			link->aspm_capable &= ~ASPM_STATE_L0S_DW;
326 327 328 329 330
		/*
		 * Check L1 latency.
		 * Every switch on the path to root complex need 1
		 * more microsecond for L1. Spec doesn't mention L0s.
		 */
331 332 333 334
		latency = max_t(u32, link->latency_up.l1, link->latency_dw.l1);
		if ((link->aspm_capable & ASPM_STATE_L1) &&
		    (latency + l1_switch_latency > acceptable->l1))
			link->aspm_capable &= ~ASPM_STATE_L1;
335 336 337 338 339 340
		l1_switch_latency += 1000;

		link = link->parent;
	}
}

341
static void pcie_aspm_cap_init(struct pcie_link_state *link, int blacklist)
S
Shaohua Li 已提交
342
{
343 344
	struct pci_dev *child, *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
345
	struct aspm_register_info upreg, dwreg;
S
Shaohua Li 已提交
346

347
	if (blacklist) {
348
		/* Set enabled/disable so that we will disable ASPM later */
349 350
		link->aspm_enabled = ASPM_STATE_ALL;
		link->aspm_disable = ASPM_STATE_ALL;
351 352 353 354 355 356
		return;
	}

	/* Configure common clock before checking latencies */
	pcie_aspm_configure_common_clock(link);

357 358
	/* Get upstream/downstream components' register state */
	pcie_get_aspm_reg(parent, &upreg);
359
	child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384
	pcie_get_aspm_reg(child, &dwreg);

	/*
	 * Setup L0s state
	 *
	 * Note that we must not enable L0s in either direction on a
	 * given link unless components on both sides of the link each
	 * support L0s.
	 */
	if (dwreg.support & upreg.support & PCIE_LINK_STATE_L0S)
		link->aspm_support |= ASPM_STATE_L0S;
	if (dwreg.enabled & PCIE_LINK_STATE_L0S)
		link->aspm_enabled |= ASPM_STATE_L0S_UP;
	if (upreg.enabled & PCIE_LINK_STATE_L0S)
		link->aspm_enabled |= ASPM_STATE_L0S_DW;
	link->latency_up.l0s = calc_l0s_latency(upreg.latency_encoding_l0s);
	link->latency_dw.l0s = calc_l0s_latency(dwreg.latency_encoding_l0s);

	/* Setup L1 state */
	if (upreg.support & dwreg.support & PCIE_LINK_STATE_L1)
		link->aspm_support |= ASPM_STATE_L1;
	if (upreg.enabled & dwreg.enabled & PCIE_LINK_STATE_L1)
		link->aspm_enabled |= ASPM_STATE_L1;
	link->latency_up.l1 = calc_l1_latency(upreg.latency_encoding_l1);
	link->latency_dw.l1 = calc_l1_latency(dwreg.latency_encoding_l1);
385

386 387
	/* Save default state */
	link->aspm_default = link->aspm_enabled;
388 389 390

	/* Setup initial capable state. Will be updated later */
	link->aspm_capable = link->aspm_support;
391 392 393 394 395
	/*
	 * If the downstream component has pci bridge function, don't
	 * do ASPM for now.
	 */
	list_for_each_entry(child, &linkbus->devices, bus_list) {
396
		if (pci_pcie_type(child) == PCI_EXP_TYPE_PCI_BRIDGE) {
397
			link->aspm_disable = ASPM_STATE_ALL;
398 399 400
			break;
		}
	}
401

402
	/* Get and check endpoint acceptable latencies */
403
	list_for_each_entry(child, &linkbus->devices, bus_list) {
404
		u32 reg32, encoding;
405
		struct aspm_latency *acceptable =
406
			&link->acceptable[PCI_FUNC(child->devfn)];
S
Shaohua Li 已提交
407

408 409
		if (pci_pcie_type(child) != PCI_EXP_TYPE_ENDPOINT &&
		    pci_pcie_type(child) != PCI_EXP_TYPE_LEG_END)
S
Shaohua Li 已提交
410 411
			continue;

412
		pcie_capability_read_dword(child, PCI_EXP_DEVCAP, &reg32);
413
		/* Calculate endpoint L0s acceptable latency */
414 415
		encoding = (reg32 & PCI_EXP_DEVCAP_L0S) >> 6;
		acceptable->l0s = calc_l0s_acceptable(encoding);
416 417 418 419 420
		/* Calculate endpoint L1 acceptable latency */
		encoding = (reg32 & PCI_EXP_DEVCAP_L1) >> 9;
		acceptable->l1 = calc_l1_acceptable(encoding);

		pcie_aspm_check_latency(child);
S
Shaohua Li 已提交
421 422 423
	}
}

424
/* Replace the ASPM control field of @pdev's Link Control register by @val */
static void pcie_config_aspm_dev(struct pci_dev *pdev, u32 val)
{
	pcie_capability_clear_and_set_word(pdev,
					   PCI_EXP_LNKCTL,
					   PCI_EXP_LNKCTL_ASPMC,
					   val);
}

430
/*
 * Bring @link into the requested ASPM @state (ASPM_STATE_* mask), after
 * masking out states the link is not capable of or that are disabled.
 */
static void pcie_config_aspm_link(struct pcie_link_state *link, u32 state)
{
	struct pci_dev *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
	struct pci_dev *child;
	u32 up_val = 0, dw_val = 0;

	/* Nothing to do if the link is already in the requested state */
	state &= (link->aspm_capable & ~link->aspm_disable);
	if (link->aspm_enabled == state)
		return;

	/*
	 * Convert ASPM state to register values. Upstream direction L0s
	 * is programmed into the downstream component and vice versa.
	 */
	if (state & ASPM_STATE_L0S_UP)
		dw_val |= PCI_EXP_LNKCTL_ASPM_L0S;
	if (state & ASPM_STATE_L0S_DW)
		up_val |= PCI_EXP_LNKCTL_ASPM_L0S;
	if (state & ASPM_STATE_L1) {
		up_val |= PCI_EXP_LNKCTL_ASPM_L1;
		dw_val |= PCI_EXP_LNKCTL_ASPM_L1;
	}

	/*
	 * Spec 2.0 suggests all functions should be configured the
	 * same setting for ASPM. When enabling L1 the upstream component
	 * goes first, then the downstream one; when disabling L1 the
	 * order is reversed. Spec doesn't mention L0S.
	 */
	if (state & ASPM_STATE_L1)
		pcie_config_aspm_dev(parent, up_val);

	list_for_each_entry(child, &linkbus->devices, bus_list) {
		pcie_config_aspm_dev(child, dw_val);
	}

	if (!(state & ASPM_STATE_L1))
		pcie_config_aspm_dev(parent, up_val);

	link->aspm_enabled = state;
}

465
static void pcie_config_aspm_path(struct pcie_link_state *link)
S
Shaohua Li 已提交
466
{
467 468 469
	while (link) {
		pcie_config_aspm_link(link, policy_to_aspm_state(link));
		link = link->parent;
470
	}
S
Shaohua Li 已提交
471 472
}

473
static void free_link_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
474
{
475 476
	link->pdev->link_state = NULL;
	kfree(link);
S
Shaohua Li 已提交
477 478
}

479 480
static int pcie_aspm_sanity_check(struct pci_dev *pdev)
{
481
	struct pci_dev *child;
482
	u32 reg32;
483

484
	/*
485
	 * Some functions in a slot might not all be PCIe functions,
486
	 * very strange. Disable ASPM for the whole slot
487
	 */
488
	list_for_each_entry(child, &pdev->subordinate->devices, bus_list) {
489
		if (!pci_is_pcie(child))
490
			return -EINVAL;
491 492 493 494 495 496 497 498 499 500

		/*
		 * If ASPM is disabled then we're not going to change
		 * the BIOS state. It's safe to continue even if it's a
		 * pre-1.1 device
		 */

		if (aspm_disabled)
			continue;

501 502 503 504
		/*
		 * Disable ASPM for pre-1.1 PCIe device, we follow MS to use
		 * RBER bit to determine if a function is 1.1 version device
		 */
505
		pcie_capability_read_dword(child, PCI_EXP_DEVCAP, &reg32);
S
Sitsofe Wheeler 已提交
506
		if (!(reg32 & PCI_EXP_DEVCAP_RBER) && !aspm_force) {
507
			dev_info(&child->dev, "disabling ASPM on pre-1.1 PCIe device.  You can enable it with 'pcie_aspm=force'\n");
508 509
			return -EINVAL;
		}
510 511 512 513
	}
	return 0;
}

514
static struct pcie_link_state *alloc_pcie_link_state(struct pci_dev *pdev)
515 516 517 518 519 520 521 522 523 524
{
	struct pcie_link_state *link;

	link = kzalloc(sizeof(*link), GFP_KERNEL);
	if (!link)
		return NULL;
	INIT_LIST_HEAD(&link->sibling);
	INIT_LIST_HEAD(&link->children);
	INIT_LIST_HEAD(&link->link);
	link->pdev = pdev;
525
	if (pci_pcie_type(pdev) != PCI_EXP_TYPE_ROOT_PORT) {
526 527 528 529 530 531 532 533 534
		struct pcie_link_state *parent;
		parent = pdev->bus->parent->self->link_state;
		if (!parent) {
			kfree(link);
			return NULL;
		}
		link->parent = parent;
		list_add(&link->link, &parent->children);
	}
535 536 537 538 539 540
	/* Setup a pointer to the root port link */
	if (!link->parent)
		link->root = link;
	else
		link->root = link->parent->root;

541 542 543 544 545
	list_add(&link->sibling, &link_list);
	pdev->link_state = link;
	return link;
}

S
Shaohua Li 已提交
546 547
/*
 * pcie_aspm_init_link_state: Initiate PCI express link state.
548
 * It is called after the pcie and its children devices are scanned.
S
Shaohua Li 已提交
549 550 551 552
 * @pdev: the root port or switch downstream port
 */
void pcie_aspm_init_link_state(struct pci_dev *pdev)
{
553
	struct pcie_link_state *link;
554
	int blacklist = !!pcie_aspm_sanity_check(pdev);
S
Shaohua Li 已提交
555

556 557 558
	if (!aspm_support_enabled)
		return;

559
	if (pdev->link_state)
S
Shaohua Li 已提交
560
		return;
561 562 563 564 565 566 567

	/*
	 * We allocate pcie_link_state for the component on the upstream
	 * end of a Link, so there's nothing to do unless this device has a
	 * Link on its secondary side.
	 */
	if (!pdev->has_secondary_link)
S
Shaohua Li 已提交
568
		return;
569

570
	/* VIA has a strange chipset, root port is under a bridge */
571
	if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT &&
572
	    pdev->bus->self)
573
		return;
574

S
Shaohua Li 已提交
575 576 577 578 579
	down_read(&pci_bus_sem);
	if (list_empty(&pdev->subordinate->devices))
		goto out;

	mutex_lock(&aspm_lock);
580
	link = alloc_pcie_link_state(pdev);
581 582 583
	if (!link)
		goto unlock;
	/*
584 585 586
	 * Setup initial ASPM state. Note that we need to configure
	 * upstream links also because capable state of them can be
	 * update through pcie_aspm_cap_init().
587
	 */
588
	pcie_aspm_cap_init(link, blacklist);
S
Shaohua Li 已提交
589

590
	/* Setup initial Clock PM state */
591
	pcie_clkpm_cap_init(link, blacklist);
592 593 594 595 596 597 598 599 600

	/*
	 * At this stage drivers haven't had an opportunity to change the
	 * link policy setting. Enabling ASPM on broken hardware can cripple
	 * it even before the driver has had a chance to disable ASPM, so
	 * default to a safe level right now. If we're enabling ASPM beyond
	 * the BIOS's expectation, we'll do so once pci_enable_device() is
	 * called.
	 */
M
Matthew Garrett 已提交
601
	if (aspm_policy != POLICY_POWERSAVE) {
602 603 604 605
		pcie_config_aspm_path(link);
		pcie_set_clkpm(link, policy_to_clkpm_state(link));
	}

606
unlock:
S
Shaohua Li 已提交
607 608 609 610 611
	mutex_unlock(&aspm_lock);
out:
	up_read(&pci_bus_sem);
}

612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627
/*
 * Recompute aspm_capable for every link that hangs below @root: first
 * reset it to aspm_support, then re-run the endpoint latency checks.
 */
static void pcie_update_aspm_capable(struct pcie_link_state *root)
{
	struct pcie_link_state *cur;

	BUG_ON(root->parent);

	/* Pass 1: forget the results of earlier latency checks */
	list_for_each_entry(cur, &link_list, sibling) {
		if (cur->root == root)
			cur->aspm_capable = cur->aspm_support;
	}

	/* Pass 2: check every endpoint below each link of this hierarchy */
	list_for_each_entry(cur, &link_list, sibling) {
		struct pci_bus *bus = cur->pdev->subordinate;
		struct pci_dev *dev;

		if (cur->root != root)
			continue;

		list_for_each_entry(dev, &bus->devices, bus_list) {
			if ((pci_pcie_type(dev) == PCI_EXP_TYPE_ENDPOINT) ||
			    (pci_pcie_type(dev) == PCI_EXP_TYPE_LEG_END))
				pcie_aspm_check_latency(dev);
		}
	}
}

S
Shaohua Li 已提交
636 637 638 639
/* @pdev: the endpoint device */
void pcie_aspm_exit_link_state(struct pci_dev *pdev)
{
	struct pci_dev *parent = pdev->bus->self;
640
	struct pcie_link_state *link, *root, *parent_link;
S
Shaohua Li 已提交
641

642
	if (!parent || !parent->link_state)
S
Shaohua Li 已提交
643
		return;
644

S
Shaohua Li 已提交
645 646 647 648
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	/*
	 * All PCIe functions are in one slot, remove one function will remove
649
	 * the whole slot, so just wait until we are the last function left.
S
Shaohua Li 已提交
650
	 */
651
	if (!list_is_last(&pdev->bus_list, &parent->subordinate->devices))
S
Shaohua Li 已提交
652 653
		goto out;

654
	link = parent->link_state;
655
	root = link->root;
656
	parent_link = link->parent;
657

S
Shaohua Li 已提交
658
	/* All functions are removed, so just disable ASPM for the link */
659
	pcie_config_aspm_link(link, 0);
660 661
	list_del(&link->sibling);
	list_del(&link->link);
S
Shaohua Li 已提交
662
	/* Clock PM is for endpoint device */
663
	free_link_state(link);
664 665

	/* Recheck latencies and configure upstream links */
666 667 668 669
	if (parent_link) {
		pcie_update_aspm_capable(root);
		pcie_config_aspm_path(parent_link);
	}
S
Shaohua Li 已提交
670 671 672 673 674 675 676 677
out:
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}

/* @pdev: the root port or switch downstream port */
void pcie_aspm_pm_state_change(struct pci_dev *pdev)
{
678
	struct pcie_link_state *link = pdev->link_state;
S
Shaohua Li 已提交
679

680
	if (aspm_disabled || !link)
S
Shaohua Li 已提交
681 682
		return;
	/*
683 684
	 * Devices changed PM state, we should recheck if latency
	 * meets all functions' requirement
S
Shaohua Li 已提交
685
	 */
686 687 688
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	pcie_update_aspm_capable(link->root);
689
	pcie_config_aspm_path(link);
690 691
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
S
Shaohua Li 已提交
692 693
}

694 695 696 697
void pcie_aspm_powersave_config_link(struct pci_dev *pdev)
{
	struct pcie_link_state *link = pdev->link_state;

698
	if (aspm_disabled || !link)
699 700 701 702 703 704 705 706 707 708 709 710 711
		return;

	if (aspm_policy != POLICY_POWERSAVE)
		return;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	pcie_config_aspm_path(link);
	pcie_set_clkpm(link, policy_to_clkpm_state(link));
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}

712
/*
 * Common implementation of pci_disable_link_state{,_locked}().
 * @pdev:  PCI device
 * @state: mask of PCIE_LINK_STATE_* bits to disable
 * @sem:   true if pci_bus_sem has to be taken here
 */
static void __pci_disable_link_state(struct pci_dev *pdev, int state, bool sem)
{
	struct pci_dev *bridge;
	struct pcie_link_state *link;

	if (!pci_is_pcie(pdev))
		return;

	/* The link state lives in the upstream component of the link */
	bridge = pdev->has_secondary_link ? pdev : pdev->bus->self;
	if (!bridge || !bridge->link_state)
		return;

	/*
	 * A driver requested that ASPM be disabled on this device, but
	 * if we don't have permission to manage ASPM (e.g., on ACPI
	 * systems we have to observe the FADT ACPI_FADT_NO_ASPM bit and
	 * the _OSC method), we can't honor that request.  Windows has
	 * a similar mechanism using "PciASPMOptOut", which is also
	 * ignored in this situation.
	 */
	if (aspm_disabled) {
		dev_warn(&pdev->dev, "can't disable ASPM; OS doesn't have ASPM control\n");
		return;
	}

	if (sem)
		down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);

	link = bridge->link_state;
	if (state & PCIE_LINK_STATE_L0S)
		link->aspm_disable |= ASPM_STATE_L0S;
	if (state & PCIE_LINK_STATE_L1)
		link->aspm_disable |= ASPM_STATE_L1;
	pcie_config_aspm_link(link, policy_to_aspm_state(link));

	if (state & PCIE_LINK_STATE_CLKPM) {
		/* Mark incapable so Clock PM is not re-enabled later */
		link->clkpm_capable = 0;
		pcie_set_clkpm(link, 0);
	}

	mutex_unlock(&aspm_lock);
	if (sem)
		up_read(&pci_bus_sem);
}

void pci_disable_link_state_locked(struct pci_dev *pdev, int state)
{
759
	__pci_disable_link_state(pdev, state, false);
760 761 762
}
EXPORT_SYMBOL(pci_disable_link_state_locked);

763 764 765 766 767 768 769 770 771
/**
 * pci_disable_link_state - Disable device's link state, so the link will
 * never enter specific states.  Note that if the BIOS didn't grant ASPM
 * control to the OS, this does nothing because we can't touch the LNKCTL
 * register.
 *
 * @pdev: PCI device
 * @state: ASPM link state to disable
 */
772 773
void pci_disable_link_state(struct pci_dev *pdev, int state)
{
774
	__pci_disable_link_state(pdev, state, true);
S
Shaohua Li 已提交
775 776 777 778 779 780
}
EXPORT_SYMBOL(pci_disable_link_state);

static int pcie_aspm_set_policy(const char *val, struct kernel_param *kp)
{
	int i;
781
	struct pcie_link_state *link;
S
Shaohua Li 已提交
782

783 784
	if (aspm_disabled)
		return -EPERM;
S
Shaohua Li 已提交
785 786 787 788 789 790 791 792 793 794 795
	for (i = 0; i < ARRAY_SIZE(policy_str); i++)
		if (!strncmp(val, policy_str[i], strlen(policy_str[i])))
			break;
	if (i >= ARRAY_SIZE(policy_str))
		return -EINVAL;
	if (i == aspm_policy)
		return 0;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	aspm_policy = i;
796 797 798
	list_for_each_entry(link, &link_list, sibling) {
		pcie_config_aspm_link(link, policy_to_aspm_state(link));
		pcie_set_clkpm(link, policy_to_clkpm_state(link));
S
Shaohua Li 已提交
799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826
	}
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
	return 0;
}

/*
 * Getter of the "policy" module parameter: writes all policy names into
 * @buffer, each followed by a space, with the active one in brackets.
 * Returns the number of characters written.
 */
static int pcie_aspm_get_policy(char *buffer, struct kernel_param *kp)
{
	int idx, len = 0;

	for (idx = 0; idx < ARRAY_SIZE(policy_str); idx++) {
		if (idx != aspm_policy) {
			len += sprintf(buffer + len, "%s ", policy_str[idx]);
			continue;
		}
		len += sprintf(buffer + len, "[%s] ", policy_str[idx]);
	}

	return len;
}

/* Register the "policy" parameter (mode 0644) with the set/get handlers above */
module_param_call(policy, pcie_aspm_set_policy, pcie_aspm_get_policy,
	NULL, 0644);

#ifdef CONFIG_PCIEASPM_DEBUG
static ssize_t link_state_show(struct device *dev,
		struct device_attribute *attr,
		char *buf)
{
	struct pci_dev *pci_device = to_pci_dev(dev);
	struct pcie_link_state *link_state = pci_device->link_state;

827
	return sprintf(buf, "%d\n", link_state->aspm_enabled);
S
Shaohua Li 已提交
828 829 830 831 832 833 834
}

/*
 * sysfs store handler for "link_state": parses a decimal mask of
 * PCIE_LINK_STATE_L0S / PCIE_LINK_STATE_L1 bits (0..3) and requests that
 * state on every link sharing the root of this device's link.
 *
 * Returns @n on success, -EINVAL on malformed input, -EPERM when ASPM is
 * disabled, -ENODEV when the device has no link state.
 */
static ssize_t link_state_store(struct device *dev,
		struct device_attribute *attr,
		const char *buf,
		size_t n)
{
	struct pci_dev *pdev = to_pci_dev(dev);
	struct pcie_link_state *link, *root;
	u32 val, state = 0;
	ssize_t ret = n;

	if (kstrtouint(buf, 10, &val))
		return -EINVAL;

	if (aspm_disabled)
		return -EPERM;
	if (n < 1 || val > 3)
		return -EINVAL;

	/* Convert requested state to ASPM state */
	if (val & PCIE_LINK_STATE_L0S)
		state |= ASPM_STATE_L0S;
	if (val & PCIE_LINK_STATE_L1)
		state |= ASPM_STATE_L1;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	/* Look the link state up under the lock: it may have been freed */
	if (!pdev->link_state) {
		ret = -ENODEV;
		goto unlock;
	}
	root = pdev->link_state->root;
	list_for_each_entry(link, &link_list, sibling) {
		if (link->root != root)
			continue;
		pcie_config_aspm_link(link, state);
	}
unlock:
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
	return ret;
}

static ssize_t clk_ctl_show(struct device *dev,
		struct device_attribute *attr,
		char *buf)
{
	struct pci_dev *pci_device = to_pci_dev(dev);
	struct pcie_link_state *link_state = pci_device->link_state;

872
	return sprintf(buf, "%d\n", link_state->clkpm_enabled);
S
Shaohua Li 已提交
873 874 875 876 877 878 879
}

/*
 * sysfs store handler for "clk_ctl": parses a boolean and programs Clock
 * PM on the device's link accordingly, without capability checks.
 *
 * Returns @n on success, -EINVAL on malformed input, -ENODEV when the
 * device has no link state.
 */
static ssize_t clk_ctl_store(struct device *dev,
		struct device_attribute *attr,
		const char *buf,
		size_t n)
{
	struct pci_dev *pdev = to_pci_dev(dev);
	bool state;
	ssize_t ret = n;

	if (strtobool(buf, &state))
		return -EINVAL;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	/* The link state may have been freed since the file was created */
	if (pdev->link_state)
		pcie_set_clkpm_nocheck(pdev->link_state, state);
	else
		ret = -ENODEV;
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);

	return ret;
}

/* Debug attributes (mode 0644) wired to the show/store handlers above */
static DEVICE_ATTR(link_state, 0644, link_state_show, link_state_store);
static DEVICE_ATTR(clk_ctl, 0644, clk_ctl_show, clk_ctl_store);

/* Name of the sysfs attribute group the two files are added to */
static char power_group[] = "power";
void pcie_aspm_create_sysfs_dev_files(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

903
	if (!link_state)
S
Shaohua Li 已提交
904 905
		return;

906
	if (link_state->aspm_support)
S
Shaohua Li 已提交
907 908
		sysfs_add_file_to_group(&pdev->dev.kobj,
			&dev_attr_link_state.attr, power_group);
909
	if (link_state->clkpm_capable)
S
Shaohua Li 已提交
910 911 912 913 914 915 916 917
		sysfs_add_file_to_group(&pdev->dev.kobj,
			&dev_attr_clk_ctl.attr, power_group);
}

void pcie_aspm_remove_sysfs_dev_files(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

918
	if (!link_state)
S
Shaohua Li 已提交
919 920
		return;

921
	if (link_state->aspm_support)
S
Shaohua Li 已提交
922 923
		sysfs_remove_file_from_group(&pdev->dev.kobj,
			&dev_attr_link_state.attr, power_group);
924
	if (link_state->clkpm_capable)
S
Shaohua Li 已提交
925 926 927 928 929 930 931
		sysfs_remove_file_from_group(&pdev->dev.kobj,
			&dev_attr_clk_ctl.attr, power_group);
}
#endif

static int __init pcie_aspm_disable(char *str)
{
932
	if (!strcmp(str, "off")) {
M
Matthew Garrett 已提交
933
		aspm_policy = POLICY_DEFAULT;
934
		aspm_disabled = 1;
935
		aspm_support_enabled = false;
936 937 938
		printk(KERN_INFO "PCIe ASPM is disabled\n");
	} else if (!strcmp(str, "force")) {
		aspm_force = 1;
M
Michael Witten 已提交
939
		printk(KERN_INFO "PCIe ASPM is forcibly enabled\n");
940
	}
S
Shaohua Li 已提交
941 942 943
	return 1;
}

944
__setup("pcie_aspm=", pcie_aspm_disable);
S
Shaohua Li 已提交
945

946 947
void pcie_no_aspm(void)
{
M
Matthew Garrett 已提交
948 949 950 951 952 953 954 955
	/*
	 * Disabling ASPM is intended to prevent the kernel from modifying
	 * existing hardware state, not to clear existing state. To that end:
	 * (a) set policy to POLICY_DEFAULT in order to avoid changing state
	 * (b) prevent userspace from changing policy
	 */
	if (!aspm_force) {
		aspm_policy = POLICY_DEFAULT;
956
		aspm_disabled = 1;
M
Matthew Garrett 已提交
957
	}
958 959
}

960 961 962 963 964
/*
 * Report whether ASPM support is enabled. The flag starts out true and
 * is cleared only by the "pcie_aspm=off" command line option.
 */
bool pcie_aspm_support_enabled(void)
{
	return aspm_support_enabled;
}
EXPORT_SYMBOL(pcie_aspm_support_enabled);