aspm.c 25.3 KB
Newer Older
S
Shaohua Li 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
/*
 * File:	drivers/pci/pcie/aspm.c
 * Enabling PCIE link L0s/L1 state and Clock Power Management
 *
 * Copyright (C) 2007 Intel
 * Copyright (C) Zhang Yanmin (yanmin.zhang@intel.com)
 * Copyright (C) Shaohua Li (shaohua.li@intel.com)
 */

#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/moduleparam.h>
#include <linux/pci.h>
#include <linux/pci_regs.h>
#include <linux/errno.h>
#include <linux/pm.h>
#include <linux/init.h>
#include <linux/slab.h>
19
#include <linux/jiffies.h>
20
#include <linux/delay.h>
S
Shaohua Li 已提交
21 22 23 24 25 26 27 28
#include <linux/pci-aspm.h>
#include "../pci.h"

#ifdef MODULE_PARAM_PREFIX
#undef MODULE_PARAM_PREFIX
#endif
#define MODULE_PARAM_PREFIX "pcie_aspm."

29 30 31
struct aspm_latency {
	u32 l0s;			/* L0s latency (nsec) */
	u32 l1;				/* L1 latency (nsec) */
S
Shaohua Li 已提交
32 33 34
};

struct pcie_link_state {
35
	struct pci_dev *pdev;		/* Upstream component of the Link */
36
	struct pcie_link_state *root;	/* pointer to the root port link */
37 38 39 40
	struct pcie_link_state *parent;	/* pointer to the parent Link state */
	struct list_head sibling;	/* node in link_list */
	struct list_head children;	/* list of child link states */
	struct list_head link;		/* node in parent's children list */
S
Shaohua Li 已提交
41 42

	/* ASPM state */
43 44 45
	u32 aspm_support:2;		/* Supported ASPM state */
	u32 aspm_enabled:2;		/* Enabled ASPM state */
	u32 aspm_default:2;		/* Default ASPM state by BIOS */
46
	u32 aspm_disable:2;		/* Disabled ASPM state */
47

48 49 50 51 52
	/* Clock PM state */
	u32 clkpm_capable:1;		/* Clock PM capable? */
	u32 clkpm_enabled:1;		/* Current Clock PM state */
	u32 clkpm_default:1;		/* Default Clock PM state by BIOS */

53 54
	/* Latencies */
	struct aspm_latency latency;	/* Exit latency */
S
Shaohua Li 已提交
55
	/*
56 57
	 * Endpoint acceptable latencies. A pcie downstream port only
	 * has one slot under it, so at most there are 8 functions.
S
Shaohua Li 已提交
58
	 */
59
	struct aspm_latency acceptable[8];
S
Shaohua Li 已提交
60 61
};

62
static int aspm_disabled, aspm_force;
S
Shaohua Li 已提交
63 64 65 66 67 68 69 70 71 72 73 74 75
static DEFINE_MUTEX(aspm_lock);
static LIST_HEAD(link_list);

#define POLICY_DEFAULT 0	/* BIOS default setting */
#define POLICY_PERFORMANCE 1	/* high performance */
#define POLICY_POWERSAVE 2	/* high power saving */
static int aspm_policy;
static const char *policy_str[] = {
	[POLICY_DEFAULT] = "default",
	[POLICY_PERFORMANCE] = "performance",
	[POLICY_POWERSAVE] = "powersave"
};

76 77
#define LINK_RETRAIN_TIMEOUT HZ

78
static int policy_to_aspm_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
79 80 81 82 83 84 85
{
	switch (aspm_policy) {
	case POLICY_PERFORMANCE:
		/* Disable ASPM and Clock PM */
		return 0;
	case POLICY_POWERSAVE:
		/* Enable ASPM L0s/L1 */
86
		return PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1;
S
Shaohua Li 已提交
87
	case POLICY_DEFAULT:
88
		return link->aspm_default;
S
Shaohua Li 已提交
89 90 91 92
	}
	return 0;
}

93
static int policy_to_clkpm_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
94 95 96 97 98 99 100 101 102
{
	switch (aspm_policy) {
	case POLICY_PERFORMANCE:
		/* Disable ASPM and Clock PM */
		return 0;
	case POLICY_POWERSAVE:
		/* Disable Clock PM */
		return 1;
	case POLICY_DEFAULT:
103
		return link->clkpm_default;
S
Shaohua Li 已提交
104 105 106 107
	}
	return 0;
}

K
Kenji Kaneshige 已提交
108
static void pcie_set_clkpm_nocheck(struct pcie_link_state *link, int enable)
S
Shaohua Li 已提交
109 110 111
{
	int pos;
	u16 reg16;
112 113
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
S
Shaohua Li 已提交
114

115 116
	list_for_each_entry(child, &linkbus->devices, bus_list) {
		pos = pci_find_capability(child, PCI_CAP_ID_EXP);
S
Shaohua Li 已提交
117 118
		if (!pos)
			return;
119
		pci_read_config_word(child, pos + PCI_EXP_LNKCTL, &reg16);
S
Shaohua Li 已提交
120 121 122 123
		if (enable)
			reg16 |= PCI_EXP_LNKCTL_CLKREQ_EN;
		else
			reg16 &= ~PCI_EXP_LNKCTL_CLKREQ_EN;
124
		pci_write_config_word(child, pos + PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
125
	}
126
	link->clkpm_enabled = !!enable;
S
Shaohua Li 已提交
127 128
}

K
Kenji Kaneshige 已提交
129 130 131 132 133 134 135 136 137 138 139
static void pcie_set_clkpm(struct pcie_link_state *link, int enable)
{
	/* Don't enable Clock PM if the link is not Clock PM capable */
	if (!link->clkpm_capable && enable)
		return;
	/* Need nothing if the specified equals to current state */
	if (link->clkpm_enabled == enable)
		return;
	pcie_set_clkpm_nocheck(link, enable);
}

140
static void pcie_clkpm_cap_init(struct pcie_link_state *link, int blacklist)
S
Shaohua Li 已提交
141
{
142
	int pos, capable = 1, enabled = 1;
S
Shaohua Li 已提交
143 144
	u32 reg32;
	u16 reg16;
145 146
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
S
Shaohua Li 已提交
147 148

	/* All functions should have the same cap and state, take the worst */
149 150
	list_for_each_entry(child, &linkbus->devices, bus_list) {
		pos = pci_find_capability(child, PCI_CAP_ID_EXP);
S
Shaohua Li 已提交
151 152
		if (!pos)
			return;
153
		pci_read_config_dword(child, pos + PCI_EXP_LNKCAP, &reg32);
S
Shaohua Li 已提交
154 155 156 157 158
		if (!(reg32 & PCI_EXP_LNKCAP_CLKPM)) {
			capable = 0;
			enabled = 0;
			break;
		}
159
		pci_read_config_word(child, pos + PCI_EXP_LNKCTL, &reg16);
S
Shaohua Li 已提交
160 161 162
		if (!(reg16 & PCI_EXP_LNKCTL_CLKREQ_EN))
			enabled = 0;
	}
163 164
	link->clkpm_enabled = enabled;
	link->clkpm_default = enabled;
165
	link->clkpm_capable = (blacklist) ? 0 : capable;
166 167
}

168
static bool pcie_aspm_downstream_has_switch(struct pcie_link_state *link)
169
{
170 171
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
172

173 174
	list_for_each_entry(child, &linkbus->devices, bus_list) {
		if (child->pcie_type == PCI_EXP_TYPE_UPSTREAM)
175 176 177
			return true;
	}
	return false;
S
Shaohua Li 已提交
178 179 180 181 182 183 184
}

/*
 * pcie_aspm_configure_common_clock: check if the 2 ends of a link
 *   could use common clock. If they are, configure them to use the
 *   common clock. That will reduce the ASPM state exit latency.
 */
185
static void pcie_aspm_configure_common_clock(struct pcie_link_state *link)
S
Shaohua Li 已提交
186
{
187 188
	int ppos, cpos, same_clock = 1;
	u16 reg16, parent_reg, child_reg[8];
189
	unsigned long start_jiffies;
190 191
	struct pci_dev *child, *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
S
Shaohua Li 已提交
192
	/*
193
	 * All functions of a slot should have the same Slot Clock
S
Shaohua Li 已提交
194
	 * Configuration, so just check one function
195 196 197
	 */
	child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
	BUG_ON(!child->is_pcie);
S
Shaohua Li 已提交
198 199

	/* Check downstream component if bit Slot Clock Configuration is 1 */
200 201
	cpos = pci_find_capability(child, PCI_CAP_ID_EXP);
	pci_read_config_word(child, cpos + PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
202 203 204 205
	if (!(reg16 & PCI_EXP_LNKSTA_SLC))
		same_clock = 0;

	/* Check upstream component if bit Slot Clock Configuration is 1 */
206 207
	ppos = pci_find_capability(parent, PCI_CAP_ID_EXP);
	pci_read_config_word(parent, ppos + PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
208 209 210 211
	if (!(reg16 & PCI_EXP_LNKSTA_SLC))
		same_clock = 0;

	/* Configure downstream component, all functions */
212 213 214 215
	list_for_each_entry(child, &linkbus->devices, bus_list) {
		cpos = pci_find_capability(child, PCI_CAP_ID_EXP);
		pci_read_config_word(child, cpos + PCI_EXP_LNKCTL, &reg16);
		child_reg[PCI_FUNC(child->devfn)] = reg16;
S
Shaohua Li 已提交
216 217 218 219
		if (same_clock)
			reg16 |= PCI_EXP_LNKCTL_CCC;
		else
			reg16 &= ~PCI_EXP_LNKCTL_CCC;
220
		pci_write_config_word(child, cpos + PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
221 222 223
	}

	/* Configure upstream component */
224
	pci_read_config_word(parent, ppos + PCI_EXP_LNKCTL, &reg16);
225
	parent_reg = reg16;
S
Shaohua Li 已提交
226 227 228 229
	if (same_clock)
		reg16 |= PCI_EXP_LNKCTL_CCC;
	else
		reg16 &= ~PCI_EXP_LNKCTL_CCC;
230
	pci_write_config_word(parent, ppos + PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
231

232
	/* Retrain link */
S
Shaohua Li 已提交
233
	reg16 |= PCI_EXP_LNKCTL_RL;
234
	pci_write_config_word(parent, ppos + PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
235

236
	/* Wait for link training end. Break out after waiting for timeout */
237
	start_jiffies = jiffies;
238
	for (;;) {
239
		pci_read_config_word(parent, ppos + PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
240 241
		if (!(reg16 & PCI_EXP_LNKSTA_LT))
			break;
242 243 244
		if (time_after(jiffies, start_jiffies + LINK_RETRAIN_TIMEOUT))
			break;
		msleep(1);
S
Shaohua Li 已提交
245
	}
246 247 248 249 250 251 252 253 254 255
	if (!(reg16 & PCI_EXP_LNKSTA_LT))
		return;

	/* Training failed. Restore common clock configurations */
	dev_printk(KERN_ERR, &parent->dev,
		   "ASPM: Could not configure common clock\n");
	list_for_each_entry(child, &linkbus->devices, bus_list) {
		cpos = pci_find_capability(child, PCI_CAP_ID_EXP);
		pci_write_config_word(child, cpos + PCI_EXP_LNKCTL,
				      child_reg[PCI_FUNC(child->devfn)]);
256
	}
257
	pci_write_config_word(parent, ppos + PCI_EXP_LNKCTL, parent_reg);
S
Shaohua Li 已提交
258 259
}

260 261
/* Convert L0s latency encoding to ns */
static u32 calc_l0s_latency(u32 encoding)
S
Shaohua Li 已提交
262
{
263 264 265 266
	if (encoding == 0x7)
		return (5 * 1000);	/* > 4us */
	return (64 << encoding);
}
S
Shaohua Li 已提交
267

268 269 270 271 272 273
/* Convert L0s acceptable latency encoding to ns */
static u32 calc_l0s_acceptable(u32 encoding)
{
	if (encoding == 0x7)
		return -1U;
	return (64 << encoding);
S
Shaohua Li 已提交
274 275
}

276 277
/* Convert L1 latency encoding to ns */
static u32 calc_l1_latency(u32 encoding)
S
Shaohua Li 已提交
278
{
279 280 281 282
	if (encoding == 0x7)
		return (65 * 1000);	/* > 64us */
	return (1000 << encoding);
}
S
Shaohua Li 已提交
283

284 285 286 287 288 289
/* Convert L1 acceptable latency encoding to ns */
static u32 calc_l1_acceptable(u32 encoding)
{
	if (encoding == 0x7)
		return -1U;
	return (1000 << encoding);
S
Shaohua Li 已提交
290 291 292
}

static void pcie_aspm_get_cap_device(struct pci_dev *pdev, u32 *state,
293
				     u32 *l0s, u32 *l1, u32 *enabled)
S
Shaohua Li 已提交
294 295 296
{
	int pos;
	u16 reg16;
297
	u32 reg32, encoding;
S
Shaohua Li 已提交
298

299
	*l0s = *l1 = *enabled = 0;
S
Shaohua Li 已提交
300 301 302 303
	pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);
	pci_read_config_dword(pdev, pos + PCI_EXP_LNKCAP, &reg32);
	*state = (reg32 & PCI_EXP_LNKCAP_ASPMS) >> 10;
	if (*state != PCIE_LINK_STATE_L0S &&
304
	    *state != (PCIE_LINK_STATE_L1 | PCIE_LINK_STATE_L0S))
S
Shaohua Li 已提交
305 306 307 308
		*state = 0;
	if (*state == 0)
		return;

309 310
	encoding = (reg32 & PCI_EXP_LNKCAP_L0SEL) >> 12;
	*l0s = calc_l0s_latency(encoding);
S
Shaohua Li 已提交
311
	if (*state & PCIE_LINK_STATE_L1) {
312 313
		encoding = (reg32 & PCI_EXP_LNKCAP_L1EL) >> 15;
		*l1 = calc_l1_latency(encoding);
S
Shaohua Li 已提交
314 315
	}
	pci_read_config_word(pdev, pos + PCI_EXP_LNKCTL, &reg16);
316
	*enabled = reg16 & (PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1);
S
Shaohua Li 已提交
317 318
}

319
static void pcie_aspm_cap_init(struct pcie_link_state *link, int blacklist)
S
Shaohua Li 已提交
320
{
321
	u32 support, l0s, l1, enabled;
322 323
	struct pci_dev *child, *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
S
Shaohua Li 已提交
324

325
	if (blacklist) {
326
		/* Set enabled/disable so that we will disable ASPM later */
327
		link->aspm_enabled = PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1;
328
		link->aspm_disable = PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1;
329 330 331 332 333 334
		return;
	}

	/* Configure common clock before checking latencies */
	pcie_aspm_configure_common_clock(link);

S
Shaohua Li 已提交
335
	/* upstream component states */
336 337 338 339 340
	pcie_aspm_get_cap_device(parent, &support, &l0s, &l1, &enabled);
	link->aspm_support = support;
	link->latency.l0s = l0s;
	link->latency.l1 = l1;
	link->aspm_enabled = enabled;
341

S
Shaohua Li 已提交
342
	/* downstream component states, all functions have the same setting */
343 344 345 346 347 348
	child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
	pcie_aspm_get_cap_device(child, &support, &l0s, &l1, &enabled);
	link->aspm_support &= support;
	link->latency.l0s = max_t(u32, link->latency.l0s, l0s);
	link->latency.l1 = max_t(u32, link->latency.l1, l1);

349 350
	/* Save default state */
	link->aspm_default = link->aspm_enabled;
351 352 353 354 355 356 357 358 359 360 361
	/*
	 * If the downstream component has pci bridge function, don't
	 * do ASPM for now.
	 */
	list_for_each_entry(child, &linkbus->devices, bus_list) {
		if (child->pcie_type == PCI_EXP_TYPE_PCI_BRIDGE) {
			link->aspm_disable =
				PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1;
			break;
		}
	}
362

363
	if (!link->aspm_support)
S
Shaohua Li 已提交
364
		return;
365

S
Shaohua Li 已提交
366
	/* ENDPOINT states*/
367
	list_for_each_entry(child, &linkbus->devices, bus_list) {
S
Shaohua Li 已提交
368
		int pos;
369
		u32 reg32, encoding;
370
		struct aspm_latency *acceptable =
371
			&link->acceptable[PCI_FUNC(child->devfn)];
S
Shaohua Li 已提交
372

373 374
		if (child->pcie_type != PCI_EXP_TYPE_ENDPOINT &&
		    child->pcie_type != PCI_EXP_TYPE_LEG_END)
S
Shaohua Li 已提交
375 376
			continue;

377 378
		pos = pci_find_capability(child, PCI_CAP_ID_EXP);
		pci_read_config_dword(child, pos + PCI_EXP_DEVCAP, &reg32);
379 380
		encoding = (reg32 & PCI_EXP_DEVCAP_L0S) >> 6;
		acceptable->l0s = calc_l0s_acceptable(encoding);
381
		if (link->aspm_support & PCIE_LINK_STATE_L1) {
382 383
			encoding = (reg32 & PCI_EXP_DEVCAP_L1) >> 9;
			acceptable->l1 = calc_l1_acceptable(encoding);
S
Shaohua Li 已提交
384 385 386 387
		}
	}
}

388 389 390 391 392 393 394 395 396 397 398
/**
 * __pcie_aspm_check_state_one - check latency for endpoint device.
 * @endpoint: pointer to the struct pci_dev of endpoint device
 *
 * TBD: The latency from the endpoint to root complex vary per switch's
 * upstream link state above the device. Here we just do a simple check
 * which assumes all links above the device can be in L1 state, that
 * is we just consider the worst case. If switch's upstream link can't
 * be put into L0S/L1, then our check is too strictly.
 */
static u32 __pcie_aspm_check_state_one(struct pci_dev *endpoint, u32 state)
S
Shaohua Li 已提交
399
{
400
	u32 l1_switch_latency = 0;
401
	struct aspm_latency *acceptable;
402
	struct pcie_link_state *link;
S
Shaohua Li 已提交
403

404 405 406
	link = endpoint->bus->self->link_state;
	state &= link->aspm_support;
	acceptable = &link->acceptable[PCI_FUNC(endpoint->devfn)];
S
Shaohua Li 已提交
407

408
	while (link && state) {
409
		if ((state & PCIE_LINK_STATE_L0S) &&
410
		    (link->latency.l0s > acceptable->l0s))
411 412
			state &= ~PCIE_LINK_STATE_L0S;
		if ((state & PCIE_LINK_STATE_L1) &&
413
		    (link->latency.l1 + l1_switch_latency > acceptable->l1))
414
			state &= ~PCIE_LINK_STATE_L1;
415 416 417 418 419 420
		link = link->parent;
		/*
		 * Every switch on the path to root complex need 1
		 * more microsecond for L1. Spec doesn't mention L0s.
		 */
		l1_switch_latency += 1000;
S
Shaohua Li 已提交
421 422 423 424
	}
	return state;
}

425
static u32 pcie_aspm_check_state(struct pcie_link_state *link, u32 state)
S
Shaohua Li 已提交
426
{
427 428 429
	pci_power_t power_state;
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
S
Shaohua Li 已提交
430

431
	/* If no child, ignore the link */
432
	if (list_empty(&linkbus->devices))
433
		return state;
434 435 436 437 438 439 440 441 442 443 444

	list_for_each_entry(child, &linkbus->devices, bus_list) {
		/*
		 * If downstream component of a link is pci bridge, we
		 * disable ASPM for now for the link
		 */
		if (child->pcie_type == PCI_EXP_TYPE_PCI_BRIDGE)
			return 0;

		if ((child->pcie_type != PCI_EXP_TYPE_ENDPOINT &&
		     child->pcie_type != PCI_EXP_TYPE_LEG_END))
S
Shaohua Li 已提交
445 446
			continue;
		/* Device not in D0 doesn't need check latency */
447 448 449
		power_state = child->current_state;
		if (power_state == PCI_D1 || power_state == PCI_D2 ||
		    power_state == PCI_D3hot || power_state == PCI_D3cold)
S
Shaohua Li 已提交
450
			continue;
451
		state = __pcie_aspm_check_state_one(child, state);
S
Shaohua Li 已提交
452 453 454 455 456 457 458 459 460 461 462 463 464 465 466
	}
	return state;
}

static void __pcie_aspm_config_one_dev(struct pci_dev *pdev, unsigned int state)
{
	u16 reg16;
	int pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);

	pci_read_config_word(pdev, pos + PCI_EXP_LNKCTL, &reg16);
	reg16 &= ~0x3;
	reg16 |= state;
	pci_write_config_word(pdev, pos + PCI_EXP_LNKCTL, reg16);
}

467
static void __pcie_aspm_config_link(struct pcie_link_state *link, u32 state)
S
Shaohua Li 已提交
468
{
469 470
	struct pci_dev *child, *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
S
Shaohua Li 已提交
471

472 473 474 475
	state &= ~link->aspm_disable;
	/* Nothing to do if the link is already in the requested state */
	if (link->aspm_enabled == state)
		return;
S
Shaohua Li 已提交
476
	/*
477 478 479 480
	 * Spec 2.0 suggests all functions should be configured the
	 * same setting for ASPM. Enabling ASPM L1 should be done in
	 * upstream component first and then downstream, and vice
	 * versa for disabling ASPM L1. Spec doesn't mention L0S.
S
Shaohua Li 已提交
481 482
	 */
	if (state & PCIE_LINK_STATE_L1)
483
		__pcie_aspm_config_one_dev(parent, state);
S
Shaohua Li 已提交
484

485 486
	list_for_each_entry(child, &linkbus->devices, bus_list)
		__pcie_aspm_config_one_dev(child, state);
S
Shaohua Li 已提交
487 488

	if (!(state & PCIE_LINK_STATE_L1))
489
		__pcie_aspm_config_one_dev(parent, state);
S
Shaohua Li 已提交
490

491
	link->aspm_enabled = state;
S
Shaohua Li 已提交
492 493
}

494 495 496
/* Check the whole hierarchy, and configure each link in the hierarchy */
static void __pcie_aspm_configure_link_state(struct pcie_link_state *link,
					     u32 state)
S
Shaohua Li 已提交
497
{
498
	struct pcie_link_state *leaf, *root = link->root;
S
Shaohua Li 已提交
499

500
	state &= (PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1);
S
Shaohua Li 已提交
501

502
	/* Check all links who have specific root port link */
503
	list_for_each_entry(leaf, &link_list, sibling) {
504
		if (!list_empty(&leaf->children) || (leaf->root != root))
505
			continue;
506
		state = pcie_aspm_check_state(leaf, state);
507
	}
508 509 510
	/* Check root port link too in case it hasn't children */
	state = pcie_aspm_check_state(root, state);
	if (link->aspm_enabled == state)
S
Shaohua Li 已提交
511
		return;
512
	/*
513
	 * We must change the hierarchy. See comments in
514 515 516
	 * __pcie_aspm_config_link for the order
	 **/
	if (state & PCIE_LINK_STATE_L1) {
517
		list_for_each_entry(leaf, &link_list, sibling) {
518
			if (leaf->root == root)
519
				__pcie_aspm_config_link(leaf, state);
520 521
		}
	} else {
522
		list_for_each_entry_reverse(leaf, &link_list, sibling) {
523
			if (leaf->root == root)
524
				__pcie_aspm_config_link(leaf, state);
525 526
		}
	}
S
Shaohua Li 已提交
527 528 529 530 531 532
}

/*
 * pcie_aspm_configure_link_state: enable/disable PCI express link state
 * @pdev: the root port or switch downstream port
 */
533 534
static void pcie_aspm_configure_link_state(struct pcie_link_state *link,
					   u32 state)
S
Shaohua Li 已提交
535 536 537
{
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
538
	__pcie_aspm_configure_link_state(link, state);
S
Shaohua Li 已提交
539 540 541 542
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}

543
static void free_link_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
544
{
545 546
	link->pdev->link_state = NULL;
	kfree(link);
S
Shaohua Li 已提交
547 548
}

549 550
static int pcie_aspm_sanity_check(struct pci_dev *pdev)
{
551 552
	struct pci_dev *child;
	int pos;
553
	u32 reg32;
554
	/*
555 556
	 * Some functions in a slot might not all be PCIE functions,
	 * very strange. Disable ASPM for the whole slot
557
	 */
558 559 560
	list_for_each_entry(child, &pdev->subordinate->devices, bus_list) {
		pos = pci_find_capability(child, PCI_CAP_ID_EXP);
		if (!pos)
561
			return -EINVAL;
562 563 564 565
		/*
		 * Disable ASPM for pre-1.1 PCIe device, we follow MS to use
		 * RBER bit to determine if a function is 1.1 version device
		 */
566
		pci_read_config_dword(child, pos + PCI_EXP_DEVCAP, &reg32);
S
Sitsofe Wheeler 已提交
567
		if (!(reg32 & PCI_EXP_DEVCAP_RBER) && !aspm_force) {
568
			dev_printk(KERN_INFO, &child->dev, "disabling ASPM"
569 570
				" on pre-1.1 PCIe device.  You can enable it"
				" with 'pcie_aspm=force'\n");
571 572
			return -EINVAL;
		}
573 574 575 576
	}
	return 0;
}

577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598
static struct pcie_link_state *pcie_aspm_setup_link_state(struct pci_dev *pdev)
{
	struct pcie_link_state *link;
	int blacklist = !!pcie_aspm_sanity_check(pdev);

	link = kzalloc(sizeof(*link), GFP_KERNEL);
	if (!link)
		return NULL;
	INIT_LIST_HEAD(&link->sibling);
	INIT_LIST_HEAD(&link->children);
	INIT_LIST_HEAD(&link->link);
	link->pdev = pdev;
	if (pdev->pcie_type == PCI_EXP_TYPE_DOWNSTREAM) {
		struct pcie_link_state *parent;
		parent = pdev->bus->parent->self->link_state;
		if (!parent) {
			kfree(link);
			return NULL;
		}
		link->parent = parent;
		list_add(&link->link, &parent->children);
	}
599 600 601 602 603 604
	/* Setup a pointer to the root port link */
	if (!link->parent)
		link->root = link;
	else
		link->root = link->parent->root;

605 606 607 608 609 610 611 612 613 614 615 616 617
	list_add(&link->sibling, &link_list);

	pdev->link_state = link;

	/* Check ASPM capability */
	pcie_aspm_cap_init(link, blacklist);

	/* Check Clock PM capability */
	pcie_clkpm_cap_init(link, blacklist);

	return link;
}

S
Shaohua Li 已提交
618 619 620 621 622 623 624
/*
 * pcie_aspm_init_link_state: Initiate PCI express link state.
 * It is called after the pcie and its children devices are scaned.
 * @pdev: the root port or switch downstream port
 */
void pcie_aspm_init_link_state(struct pci_dev *pdev)
{
625 626
	u32 state;
	struct pcie_link_state *link;
S
Shaohua Li 已提交
627 628 629 630

	if (aspm_disabled || !pdev->is_pcie || pdev->link_state)
		return;
	if (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
631
	    pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM)
S
Shaohua Li 已提交
632
		return;
633

634 635
	/* VIA has a strange chipset, root port is under a bridge */
	if (pdev->pcie_type == PCI_EXP_TYPE_ROOT_PORT &&
636
	    pdev->bus->self)
637
		return;
638

S
Shaohua Li 已提交
639 640 641 642 643
	down_read(&pci_bus_sem);
	if (list_empty(&pdev->subordinate->devices))
		goto out;

	mutex_lock(&aspm_lock);
644 645 646 647 648 649 650 651 652 653
	link = pcie_aspm_setup_link_state(pdev);
	if (!link)
		goto unlock;
	/*
	 * Setup initial ASPM state
	 *
	 * If link has switch, delay the link config. The leaf link
	 * initialization will config the whole hierarchy. But we must
	 * make sure BIOS doesn't set unsupported link state.
	 */
654
	if (pcie_aspm_downstream_has_switch(link)) {
655 656
		state = pcie_aspm_check_state(link, link->aspm_default);
		__pcie_aspm_config_link(link, state);
657
	} else {
658 659
		state = policy_to_aspm_state(link);
		__pcie_aspm_configure_link_state(link, state);
660
	}
S
Shaohua Li 已提交
661

662 663
	/* Setup initial Clock PM state */
	state = (link->clkpm_capable) ? policy_to_clkpm_state(link) : 0;
K
Kenji Kaneshige 已提交
664
	pcie_set_clkpm(link, state);
665
unlock:
S
Shaohua Li 已提交
666 667 668 669 670 671 672 673 674
	mutex_unlock(&aspm_lock);
out:
	up_read(&pci_bus_sem);
}

/* @pdev: the endpoint device */
void pcie_aspm_exit_link_state(struct pci_dev *pdev)
{
	struct pci_dev *parent = pdev->bus->self;
675
	struct pcie_link_state *link;
S
Shaohua Li 已提交
676

677
	if (aspm_disabled || !pdev->is_pcie || !parent || !parent->link_state)
S
Shaohua Li 已提交
678 679
		return;
	if (parent->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
680
	    parent->pcie_type != PCI_EXP_TYPE_DOWNSTREAM)
S
Shaohua Li 已提交
681
		return;
682

S
Shaohua Li 已提交
683 684 685 686
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	/*
	 * All PCIe functions are in one slot, remove one function will remove
687
	 * the whole slot, so just wait until we are the last function left.
S
Shaohua Li 已提交
688
	 */
689
	if (!list_is_last(&pdev->bus_list, &parent->subordinate->devices))
S
Shaohua Li 已提交
690 691
		goto out;

692 693
	link = parent->link_state;

S
Shaohua Li 已提交
694 695
	/* All functions are removed, so just disable ASPM for the link */
	__pcie_aspm_config_one_dev(parent, 0);
696 697
	list_del(&link->sibling);
	list_del(&link->link);
S
Shaohua Li 已提交
698
	/* Clock PM is for endpoint device */
699
	free_link_state(link);
S
Shaohua Li 已提交
700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718
out:
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}

/* @pdev: the root port or switch downstream port */
void pcie_aspm_pm_state_change(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

	if (aspm_disabled || !pdev->is_pcie || !pdev->link_state)
		return;
	if (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
		pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM)
		return;
	/*
	 * devices changed PM state, we should recheck if latency meets all
	 * functions' requirement
	 */
719
	pcie_aspm_configure_link_state(link_state, link_state->aspm_enabled);
S
Shaohua Li 已提交
720 721 722 723 724 725 726 727 728
}

/*
 * pci_disable_link_state - disable pci device's link state, so the link will
 * never enter specific states
 */
void pci_disable_link_state(struct pci_dev *pdev, int state)
{
	struct pci_dev *parent = pdev->bus->self;
729
	struct pcie_link_state *link;
S
Shaohua Li 已提交
730 731 732 733 734 735 736 737 738 739 740

	if (aspm_disabled || !pdev->is_pcie)
		return;
	if (pdev->pcie_type == PCI_EXP_TYPE_ROOT_PORT ||
	    pdev->pcie_type == PCI_EXP_TYPE_DOWNSTREAM)
		parent = pdev;
	if (!parent || !parent->link_state)
		return;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
741 742 743
	link = parent->link_state;
	link->aspm_disable |= state;
	__pcie_aspm_configure_link_state(link, link->aspm_enabled);
K
Kenji Kaneshige 已提交
744
	if (state & PCIE_LINK_STATE_CLKPM) {
745 746
		link->clkpm_capable = 0;
		pcie_set_clkpm(link, 0);
K
Kenji Kaneshige 已提交
747
	}
S
Shaohua Li 已提交
748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}
EXPORT_SYMBOL(pci_disable_link_state);

static int pcie_aspm_set_policy(const char *val, struct kernel_param *kp)
{
	int i;
	struct pcie_link_state *link_state;

	for (i = 0; i < ARRAY_SIZE(policy_str); i++)
		if (!strncmp(val, policy_str[i], strlen(policy_str[i])))
			break;
	if (i >= ARRAY_SIZE(policy_str))
		return -EINVAL;
	if (i == aspm_policy)
		return 0;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	aspm_policy = i;
769
	list_for_each_entry(link_state, &link_list, sibling) {
770 771
		__pcie_aspm_configure_link_state(link_state,
			policy_to_aspm_state(link_state));
K
Kenji Kaneshige 已提交
772
		pcie_set_clkpm(link_state, policy_to_clkpm_state(link_state));
S
Shaohua Li 已提交
773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800
	}
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
	return 0;
}

static int pcie_aspm_get_policy(char *buffer, struct kernel_param *kp)
{
	int i, cnt = 0;
	for (i = 0; i < ARRAY_SIZE(policy_str); i++)
		if (i == aspm_policy)
			cnt += sprintf(buffer + cnt, "[%s] ", policy_str[i]);
		else
			cnt += sprintf(buffer + cnt, "%s ", policy_str[i]);
	return cnt;
}

module_param_call(policy, pcie_aspm_set_policy, pcie_aspm_get_policy,
	NULL, 0644);

#ifdef CONFIG_PCIEASPM_DEBUG
static ssize_t link_state_show(struct device *dev,
		struct device_attribute *attr,
		char *buf)
{
	struct pci_dev *pci_device = to_pci_dev(dev);
	struct pcie_link_state *link_state = pci_device->link_state;

801
	return sprintf(buf, "%d\n", link_state->aspm_enabled);
S
Shaohua Li 已提交
802 803 804 805 806 807 808
}

static ssize_t link_state_store(struct device *dev,
		struct device_attribute *attr,
		const char *buf,
		size_t n)
{
809
	struct pci_dev *pdev = to_pci_dev(dev);
S
Shaohua Li 已提交
810 811 812 813 814 815 816
	int state;

	if (n < 1)
		return -EINVAL;
	state = buf[0]-'0';
	if (state >= 0 && state <= 3) {
		/* setup link aspm state */
817
		pcie_aspm_configure_link_state(pdev->link_state, state);
S
Shaohua Li 已提交
818 819 820 821 822 823 824 825 826 827 828 829 830
		return n;
	}

	return -EINVAL;
}

static ssize_t clk_ctl_show(struct device *dev,
		struct device_attribute *attr,
		char *buf)
{
	struct pci_dev *pci_device = to_pci_dev(dev);
	struct pcie_link_state *link_state = pci_device->link_state;

831
	return sprintf(buf, "%d\n", link_state->clkpm_enabled);
S
Shaohua Li 已提交
832 833 834 835 836 837 838
}

static ssize_t clk_ctl_store(struct device *dev,
		struct device_attribute *attr,
		const char *buf,
		size_t n)
{
K
Kenji Kaneshige 已提交
839
	struct pci_dev *pdev = to_pci_dev(dev);
S
Shaohua Li 已提交
840 841 842 843 844 845 846 847
	int state;

	if (n < 1)
		return -EINVAL;
	state = buf[0]-'0';

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
K
Kenji Kaneshige 已提交
848
	pcie_set_clkpm_nocheck(pdev->link_state, !!state);
S
Shaohua Li 已提交
849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);

	return n;
}

static DEVICE_ATTR(link_state, 0644, link_state_show, link_state_store);
static DEVICE_ATTR(clk_ctl, 0644, clk_ctl_show, clk_ctl_store);

static char power_group[] = "power";
void pcie_aspm_create_sysfs_dev_files(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

	if (!pdev->is_pcie || (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
		pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM) || !link_state)
		return;

867
	if (link_state->aspm_support)
S
Shaohua Li 已提交
868 869
		sysfs_add_file_to_group(&pdev->dev.kobj,
			&dev_attr_link_state.attr, power_group);
870
	if (link_state->clkpm_capable)
S
Shaohua Li 已提交
871 872 873 874 875 876 877 878 879 880 881 882
		sysfs_add_file_to_group(&pdev->dev.kobj,
			&dev_attr_clk_ctl.attr, power_group);
}

void pcie_aspm_remove_sysfs_dev_files(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

	if (!pdev->is_pcie || (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
		pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM) || !link_state)
		return;

883
	if (link_state->aspm_support)
S
Shaohua Li 已提交
884 885
		sysfs_remove_file_from_group(&pdev->dev.kobj,
			&dev_attr_link_state.attr, power_group);
886
	if (link_state->clkpm_capable)
S
Shaohua Li 已提交
887 888 889 890 891 892 893
		sysfs_remove_file_from_group(&pdev->dev.kobj,
			&dev_attr_clk_ctl.attr, power_group);
}
#endif

static int __init pcie_aspm_disable(char *str)
{
894 895 896 897 898 899 900
	if (!strcmp(str, "off")) {
		aspm_disabled = 1;
		printk(KERN_INFO "PCIe ASPM is disabled\n");
	} else if (!strcmp(str, "force")) {
		aspm_force = 1;
		printk(KERN_INFO "PCIe ASPM is forcedly enabled\n");
	}
S
Shaohua Li 已提交
901 902 903
	return 1;
}

904
__setup("pcie_aspm=", pcie_aspm_disable);
S
Shaohua Li 已提交
905

906 907
void pcie_no_aspm(void)
{
908 909
	if (!aspm_force)
		aspm_disabled = 1;
910 911
}

912 913 914 915 916 917 918
/**
 * pcie_aspm_enabled - is PCIe ASPM enabled?
 *
 * Returns true if ASPM has not been disabled by the command-line option
 * pcie_aspm=off.
 **/
int pcie_aspm_enabled(void)
S
Shaohua Li 已提交
919
{
920
       return !aspm_disabled;
S
Shaohua Li 已提交
921
}
922
EXPORT_SYMBOL(pcie_aspm_enabled);
S
Shaohua Li 已提交
923