aspm.c 37.6 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0
S
Shaohua Li 已提交
2
/*
B
Bjorn Helgaas 已提交
3
 * Enable PCIe link L0s/L1 state and Clock Power Management
S
Shaohua Li 已提交
4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
 *
 * Copyright (C) 2007 Intel
 * Copyright (C) Zhang Yanmin (yanmin.zhang@intel.com)
 * Copyright (C) Shaohua Li (shaohua.li@intel.com)
 */

#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/moduleparam.h>
#include <linux/pci.h>
#include <linux/pci_regs.h>
#include <linux/errno.h>
#include <linux/pm.h>
#include <linux/init.h>
#include <linux/slab.h>
19
#include <linux/jiffies.h>
20
#include <linux/delay.h>
S
Shaohua Li 已提交
21 22 23 24 25 26 27 28
#include <linux/pci-aspm.h>
#include "../pci.h"

#ifdef MODULE_PARAM_PREFIX
#undef MODULE_PARAM_PREFIX
#endif
#define MODULE_PARAM_PREFIX "pcie_aspm."

29 30 31 32
/* Note: those are not register definitions */
#define ASPM_STATE_L0S_UP	(1)	/* Upstream direction L0s state */
#define ASPM_STATE_L0S_DW	(2)	/* Downstream direction L0s state */
#define ASPM_STATE_L1		(4)	/* L1 state */
33 34 35 36 37 38 39 40
#define ASPM_STATE_L1_1		(8)	/* ASPM L1.1 state */
#define ASPM_STATE_L1_2		(0x10)	/* ASPM L1.2 state */
#define ASPM_STATE_L1_1_PCIPM	(0x20)	/* PCI PM L1.1 state */
#define ASPM_STATE_L1_2_PCIPM	(0x40)	/* PCI PM L1.2 state */
#define ASPM_STATE_L1_SS_PCIPM	(ASPM_STATE_L1_1_PCIPM | ASPM_STATE_L1_2_PCIPM)
#define ASPM_STATE_L1_2_MASK	(ASPM_STATE_L1_2 | ASPM_STATE_L1_2_PCIPM)
#define ASPM_STATE_L1SS		(ASPM_STATE_L1_1 | ASPM_STATE_L1_1_PCIPM |\
				 ASPM_STATE_L1_2_MASK)
41
#define ASPM_STATE_L0S		(ASPM_STATE_L0S_UP | ASPM_STATE_L0S_DW)
42 43
#define ASPM_STATE_ALL		(ASPM_STATE_L0S | ASPM_STATE_L1 |	\
				 ASPM_STATE_L1SS)
44

45 46 47
struct aspm_latency {
	u32 l0s;			/* L0s latency (nsec) */
	u32 l1;				/* L1 latency (nsec) */
S
Shaohua Li 已提交
48 49 50
};

struct pcie_link_state {
51
	struct pci_dev *pdev;		/* Upstream component of the Link */
52
	struct pci_dev *downstream;	/* Downstream component, function 0 */
53
	struct pcie_link_state *root;	/* pointer to the root port link */
54 55 56 57
	struct pcie_link_state *parent;	/* pointer to the parent Link state */
	struct list_head sibling;	/* node in link_list */
	struct list_head children;	/* list of child link states */
	struct list_head link;		/* node in parent's children list */
S
Shaohua Li 已提交
58 59

	/* ASPM state */
60 61 62 63 64
	u32 aspm_support:7;		/* Supported ASPM state */
	u32 aspm_enabled:7;		/* Enabled ASPM state */
	u32 aspm_capable:7;		/* Capable ASPM state with latency */
	u32 aspm_default:7;		/* Default ASPM state by BIOS */
	u32 aspm_disable:7;		/* Disabled ASPM state */
65

66 67 68 69 70
	/* Clock PM state */
	u32 clkpm_capable:1;		/* Clock PM capable? */
	u32 clkpm_enabled:1;		/* Current Clock PM state */
	u32 clkpm_default:1;		/* Default Clock PM state by BIOS */

71 72 73
	/* Exit latencies */
	struct aspm_latency latency_up;	/* Upstream direction exit latency */
	struct aspm_latency latency_dw;	/* Downstream direction exit latency */
S
Shaohua Li 已提交
74
	/*
75 76
	 * Endpoint acceptable latencies. A pcie downstream port only
	 * has one slot under it, so at most there are 8 functions.
S
Shaohua Li 已提交
77
	 */
78
	struct aspm_latency acceptable[8];
79 80 81 82 83 84 85 86

	/* L1 PM Substate info */
	struct {
		u32 up_cap_ptr;		/* L1SS cap ptr in upstream dev */
		u32 dw_cap_ptr;		/* L1SS cap ptr in downstream dev */
		u32 ctl1;		/* value to be programmed in ctl1 */
		u32 ctl2;		/* value to be programmed in ctl2 */
	} l1ss;
S
Shaohua Li 已提交
87 88
};

M
Matthew Garrett 已提交
89
static int aspm_disabled, aspm_force;
90
static bool aspm_support_enabled = true;
S
Shaohua Li 已提交
91 92 93 94 95 96
static DEFINE_MUTEX(aspm_lock);
static LIST_HEAD(link_list);

#define POLICY_DEFAULT 0	/* BIOS default setting */
#define POLICY_PERFORMANCE 1	/* high performance */
#define POLICY_POWERSAVE 2	/* high power saving */
97
#define POLICY_POWER_SUPERSAVE 3 /* possibly even more power saving */
98 99 100 101 102

#ifdef CONFIG_PCIEASPM_PERFORMANCE
static int aspm_policy = POLICY_PERFORMANCE;
#elif defined CONFIG_PCIEASPM_POWERSAVE
static int aspm_policy = POLICY_POWERSAVE;
103 104
#elif defined CONFIG_PCIEASPM_POWER_SUPERSAVE
static int aspm_policy = POLICY_POWER_SUPERSAVE;
105
#else
S
Shaohua Li 已提交
106
static int aspm_policy;
107 108
#endif

S
Shaohua Li 已提交
109 110 111
static const char *policy_str[] = {
	[POLICY_DEFAULT] = "default",
	[POLICY_PERFORMANCE] = "performance",
112 113
	[POLICY_POWERSAVE] = "powersave",
	[POLICY_POWER_SUPERSAVE] = "powersupersave"
S
Shaohua Li 已提交
114 115
};

116 117
#define LINK_RETRAIN_TIMEOUT HZ

118
static int policy_to_aspm_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
119 120 121 122 123 124 125
{
	switch (aspm_policy) {
	case POLICY_PERFORMANCE:
		/* Disable ASPM and Clock PM */
		return 0;
	case POLICY_POWERSAVE:
		/* Enable ASPM L0s/L1 */
126 127 128
		return (ASPM_STATE_L0S | ASPM_STATE_L1);
	case POLICY_POWER_SUPERSAVE:
		/* Enable Everything */
129
		return ASPM_STATE_ALL;
S
Shaohua Li 已提交
130
	case POLICY_DEFAULT:
131
		return link->aspm_default;
S
Shaohua Li 已提交
132 133 134 135
	}
	return 0;
}

136
static int policy_to_clkpm_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
137 138 139 140 141 142
{
	switch (aspm_policy) {
	case POLICY_PERFORMANCE:
		/* Disable ASPM and Clock PM */
		return 0;
	case POLICY_POWERSAVE:
143 144
	case POLICY_POWER_SUPERSAVE:
		/* Enable Clock PM */
S
Shaohua Li 已提交
145 146
		return 1;
	case POLICY_DEFAULT:
147
		return link->clkpm_default;
S
Shaohua Li 已提交
148 149 150 151
	}
	return 0;
}

K
Kenji Kaneshige 已提交
152
static void pcie_set_clkpm_nocheck(struct pcie_link_state *link, int enable)
S
Shaohua Li 已提交
153
{
154 155
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
156
	u32 val = enable ? PCI_EXP_LNKCTL_CLKREQ_EN : 0;
S
Shaohua Li 已提交
157

158 159 160 161
	list_for_each_entry(child, &linkbus->devices, bus_list)
		pcie_capability_clear_and_set_word(child, PCI_EXP_LNKCTL,
						   PCI_EXP_LNKCTL_CLKREQ_EN,
						   val);
162
	link->clkpm_enabled = !!enable;
S
Shaohua Li 已提交
163 164
}

K
Kenji Kaneshige 已提交
165 166 167
static void pcie_set_clkpm(struct pcie_link_state *link, int enable)
{
	/* Don't enable Clock PM if the link is not Clock PM capable */
168
	if (!link->clkpm_capable)
169
		enable = 0;
K
Kenji Kaneshige 已提交
170 171 172 173 174 175
	/* Need nothing if the specified equals to current state */
	if (link->clkpm_enabled == enable)
		return;
	pcie_set_clkpm_nocheck(link, enable);
}

176
static void pcie_clkpm_cap_init(struct pcie_link_state *link, int blacklist)
S
Shaohua Li 已提交
177
{
178
	int capable = 1, enabled = 1;
S
Shaohua Li 已提交
179 180
	u32 reg32;
	u16 reg16;
181 182
	struct pci_dev *child;
	struct pci_bus *linkbus = link->pdev->subordinate;
S
Shaohua Li 已提交
183 184

	/* All functions should have the same cap and state, take the worst */
185
	list_for_each_entry(child, &linkbus->devices, bus_list) {
186
		pcie_capability_read_dword(child, PCI_EXP_LNKCAP, &reg32);
S
Shaohua Li 已提交
187 188 189 190 191
		if (!(reg32 & PCI_EXP_LNKCAP_CLKPM)) {
			capable = 0;
			enabled = 0;
			break;
		}
192
		pcie_capability_read_word(child, PCI_EXP_LNKCTL, &reg16);
S
Shaohua Li 已提交
193 194 195
		if (!(reg16 & PCI_EXP_LNKCTL_CLKREQ_EN))
			enabled = 0;
	}
196 197
	link->clkpm_enabled = enabled;
	link->clkpm_default = enabled;
198
	link->clkpm_capable = (blacklist) ? 0 : capable;
199 200
}

201 202 203 204 205 206 207 208 209
static bool pcie_retrain_link(struct pcie_link_state *link)
{
	struct pci_dev *parent = link->pdev;
	unsigned long start_jiffies;
	u16 reg16;

	pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &reg16);
	reg16 |= PCI_EXP_LNKCTL_RL;
	pcie_capability_write_word(parent, PCI_EXP_LNKCTL, reg16);
210 211 212 213 214 215 216 217 218
	if (parent->clear_retrain_link) {
		/*
		 * Due to an erratum in some devices the Retrain Link bit
		 * needs to be cleared again manually to allow the link
		 * training to succeed.
		 */
		reg16 &= ~PCI_EXP_LNKCTL_RL;
		pcie_capability_write_word(parent, PCI_EXP_LNKCTL, reg16);
	}
219 220 221 222 223 224 225 226 227 228 229 230 231 232

	/* Wait for link training end. Break out after waiting for timeout */
	start_jiffies = jiffies;
	for (;;) {
		pcie_capability_read_word(parent, PCI_EXP_LNKSTA, &reg16);
		if (!(reg16 & PCI_EXP_LNKSTA_LT))
			break;
		if (time_after(jiffies, start_jiffies + LINK_RETRAIN_TIMEOUT))
			break;
		msleep(1);
	}
	return !(reg16 & PCI_EXP_LNKSTA_LT);
}

S
Shaohua Li 已提交
233 234 235 236 237
/*
 * pcie_aspm_configure_common_clock: check if the 2 ends of a link
 *   could use common clock. If they are, configure them to use the
 *   common clock. That will reduce the ASPM state exit latency.
 */
238
static void pcie_aspm_configure_common_clock(struct pcie_link_state *link)
S
Shaohua Li 已提交
239
{
240
	int same_clock = 1;
241 242 243
	u16 reg16, parent_reg, child_reg[8];
	struct pci_dev *child, *parent = link->pdev;
	struct pci_bus *linkbus = parent->subordinate;
S
Shaohua Li 已提交
244
	/*
245
	 * All functions of a slot should have the same Slot Clock
S
Shaohua Li 已提交
246
	 * Configuration, so just check one function
247 248
	 */
	child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
K
Kenji Kaneshige 已提交
249
	BUG_ON(!pci_is_pcie(child));
S
Shaohua Li 已提交
250 251

	/* Check downstream component if bit Slot Clock Configuration is 1 */
252
	pcie_capability_read_word(child, PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
253 254 255 256
	if (!(reg16 & PCI_EXP_LNKSTA_SLC))
		same_clock = 0;

	/* Check upstream component if bit Slot Clock Configuration is 1 */
257
	pcie_capability_read_word(parent, PCI_EXP_LNKSTA, &reg16);
S
Shaohua Li 已提交
258 259 260
	if (!(reg16 & PCI_EXP_LNKSTA_SLC))
		same_clock = 0;

261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278
	/* Port might be already in common clock mode */
	pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &reg16);
	if (same_clock && (reg16 & PCI_EXP_LNKCTL_CCC)) {
		bool consistent = true;

		list_for_each_entry(child, &linkbus->devices, bus_list) {
			pcie_capability_read_word(child, PCI_EXP_LNKCTL,
						  &reg16);
			if (!(reg16 & PCI_EXP_LNKCTL_CCC)) {
				consistent = false;
				break;
			}
		}
		if (consistent)
			return;
		pci_warn(parent, "ASPM: current common clock configuration is broken, reconfiguring\n");
	}

S
Shaohua Li 已提交
279
	/* Configure downstream component, all functions */
280
	list_for_each_entry(child, &linkbus->devices, bus_list) {
281
		pcie_capability_read_word(child, PCI_EXP_LNKCTL, &reg16);
282
		child_reg[PCI_FUNC(child->devfn)] = reg16;
S
Shaohua Li 已提交
283 284 285 286
		if (same_clock)
			reg16 |= PCI_EXP_LNKCTL_CCC;
		else
			reg16 &= ~PCI_EXP_LNKCTL_CCC;
287
		pcie_capability_write_word(child, PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
288 289 290
	}

	/* Configure upstream component */
291
	pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &reg16);
292
	parent_reg = reg16;
S
Shaohua Li 已提交
293 294 295 296
	if (same_clock)
		reg16 |= PCI_EXP_LNKCTL_CCC;
	else
		reg16 &= ~PCI_EXP_LNKCTL_CCC;
297
	pcie_capability_write_word(parent, PCI_EXP_LNKCTL, reg16);
S
Shaohua Li 已提交
298

299
	if (pcie_retrain_link(link))
300 301 302
		return;

	/* Training failed. Restore common clock configurations */
303
	pci_err(parent, "ASPM: Could not configure common clock\n");
304 305 306 307
	list_for_each_entry(child, &linkbus->devices, bus_list)
		pcie_capability_write_word(child, PCI_EXP_LNKCTL,
					   child_reg[PCI_FUNC(child->devfn)]);
	pcie_capability_write_word(parent, PCI_EXP_LNKCTL, parent_reg);
S
Shaohua Li 已提交
308 309
}

310 311
/* Convert L0s latency encoding to ns */
static u32 calc_l0s_latency(u32 encoding)
S
Shaohua Li 已提交
312
{
313 314 315 316
	if (encoding == 0x7)
		return (5 * 1000);	/* > 4us */
	return (64 << encoding);
}
S
Shaohua Li 已提交
317

318 319 320 321 322 323
/* Convert L0s acceptable latency encoding to ns */
static u32 calc_l0s_acceptable(u32 encoding)
{
	if (encoding == 0x7)
		return -1U;
	return (64 << encoding);
S
Shaohua Li 已提交
324 325
}

326 327
/* Convert L1 latency encoding to ns */
static u32 calc_l1_latency(u32 encoding)
S
Shaohua Li 已提交
328
{
329 330 331 332
	if (encoding == 0x7)
		return (65 * 1000);	/* > 64us */
	return (1000 << encoding);
}
S
Shaohua Li 已提交
333

334 335 336 337 338 339
/* Convert L1 acceptable latency encoding to ns */
static u32 calc_l1_acceptable(u32 encoding)
{
	if (encoding == 0x7)
		return -1U;
	return (1000 << encoding);
S
Shaohua Li 已提交
340 341
}

342 343 344 345 346 347 348 349 350 351 352
/* Convert L1SS T_pwr encoding to usec */
static u32 calc_l1ss_pwron(struct pci_dev *pdev, u32 scale, u32 val)
{
	switch (scale) {
	case 0:
		return val * 2;
	case 1:
		return val * 10;
	case 2:
		return val * 100;
	}
353
	pci_err(pdev, "%s: Invalid T_PwrOn scale: %u\n", __func__, scale);
354 355 356
	return 0;
}

357 358
static void encode_l12_threshold(u32 threshold_us, u32 *scale, u32 *value)
{
359
	u32 threshold_ns = threshold_us * 1000;
360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382

	/* See PCIe r3.1, sec 7.33.3 and sec 6.18 */
	if (threshold_ns < 32) {
		*scale = 0;
		*value = threshold_ns;
	} else if (threshold_ns < 1024) {
		*scale = 1;
		*value = threshold_ns >> 5;
	} else if (threshold_ns < 32768) {
		*scale = 2;
		*value = threshold_ns >> 10;
	} else if (threshold_ns < 1048576) {
		*scale = 3;
		*value = threshold_ns >> 15;
	} else if (threshold_ns < 33554432) {
		*scale = 4;
		*value = threshold_ns >> 20;
	} else {
		*scale = 5;
		*value = threshold_ns >> 25;
	}
}

383 384 385 386 387
struct aspm_register_info {
	u32 support:2;
	u32 enabled:2;
	u32 latency_encoding_l0s;
	u32 latency_encoding_l1;
388 389 390 391 392 393

	/* L1 substates */
	u32 l1ss_cap_ptr;
	u32 l1ss_cap;
	u32 l1ss_ctl1;
	u32 l1ss_ctl2;
394 395 396 397
};

static void pcie_get_aspm_reg(struct pci_dev *pdev,
			      struct aspm_register_info *info)
S
Shaohua Li 已提交
398 399
{
	u16 reg16;
400
	u32 reg32;
S
Shaohua Li 已提交
401

402
	pcie_capability_read_dword(pdev, PCI_EXP_LNKCAP, &reg32);
403 404 405
	info->support = (reg32 & PCI_EXP_LNKCAP_ASPMS) >> 10;
	info->latency_encoding_l0s = (reg32 & PCI_EXP_LNKCAP_L0SEL) >> 12;
	info->latency_encoding_l1  = (reg32 & PCI_EXP_LNKCAP_L1EL) >> 15;
406
	pcie_capability_read_word(pdev, PCI_EXP_LNKCTL, &reg16);
407
	info->enabled = reg16 & PCI_EXP_LNKCTL_ASPMC;
408 409 410 411 412 413 414 415 416 417 418 419

	/* Read L1 PM substate capabilities */
	info->l1ss_cap = info->l1ss_ctl1 = info->l1ss_ctl2 = 0;
	info->l1ss_cap_ptr = pci_find_ext_capability(pdev, PCI_EXT_CAP_ID_L1SS);
	if (!info->l1ss_cap_ptr)
		return;
	pci_read_config_dword(pdev, info->l1ss_cap_ptr + PCI_L1SS_CAP,
			      &info->l1ss_cap);
	if (!(info->l1ss_cap & PCI_L1SS_CAP_L1_PM_SS)) {
		info->l1ss_cap = 0;
		return;
	}
420 421 422 423 424 425 426 427 428

	/*
	 * If we don't have LTR for the entire path from the Root Complex
	 * to this device, we can't use ASPM L1.2 because it relies on the
	 * LTR_L1.2_THRESHOLD.  See PCIe r4.0, secs 5.5.4, 6.18.
	 */
	if (!pdev->ltr_path)
		info->l1ss_cap &= ~PCI_L1SS_CAP_ASPM_L1_2;

429 430 431 432
	pci_read_config_dword(pdev, info->l1ss_cap_ptr + PCI_L1SS_CTL1,
			      &info->l1ss_ctl1);
	pci_read_config_dword(pdev, info->l1ss_cap_ptr + PCI_L1SS_CTL2,
			      &info->l1ss_ctl2);
S
Shaohua Li 已提交
433 434
}

435 436
static void pcie_aspm_check_latency(struct pci_dev *endpoint)
{
437
	u32 latency, l1_switch_latency = 0;
438 439 440 441 442 443 444 445 446 447 448 449
	struct aspm_latency *acceptable;
	struct pcie_link_state *link;

	/* Device not in D0 doesn't need latency check */
	if ((endpoint->current_state != PCI_D0) &&
	    (endpoint->current_state != PCI_UNKNOWN))
		return;

	link = endpoint->bus->self->link_state;
	acceptable = &link->acceptable[PCI_FUNC(endpoint->devfn)];

	while (link) {
450 451 452 453 454 455 456 457 458
		/* Check upstream direction L0s latency */
		if ((link->aspm_capable & ASPM_STATE_L0S_UP) &&
		    (link->latency_up.l0s > acceptable->l0s))
			link->aspm_capable &= ~ASPM_STATE_L0S_UP;

		/* Check downstream direction L0s latency */
		if ((link->aspm_capable & ASPM_STATE_L0S_DW) &&
		    (link->latency_dw.l0s > acceptable->l0s))
			link->aspm_capable &= ~ASPM_STATE_L0S_DW;
459 460 461 462
		/*
		 * Check L1 latency.
		 * Every switch on the path to root complex need 1
		 * more microsecond for L1. Spec doesn't mention L0s.
463 464 465 466 467 468 469 470
		 *
		 * The exit latencies for L1 substates are not advertised
		 * by a device.  Since the spec also doesn't mention a way
		 * to determine max latencies introduced by enabling L1
		 * substates on the components, it is not clear how to do
		 * a L1 substate exit latency check.  We assume that the
		 * L1 exit latencies advertised by a device include L1
		 * substate latencies (and hence do not do any check).
471
		 */
472 473 474 475
		latency = max_t(u32, link->latency_up.l1, link->latency_dw.l1);
		if ((link->aspm_capable & ASPM_STATE_L1) &&
		    (latency + l1_switch_latency > acceptable->l1))
			link->aspm_capable &= ~ASPM_STATE_L1;
476 477 478 479 480 481
		l1_switch_latency += 1000;

		link = link->parent;
	}
}

482 483 484 485 486 487 488 489 490 491 492 493 494 495
/*
 * The L1 PM substate capability is only implemented in function 0 in a
 * multi function device.
 */
static struct pci_dev *pci_function_0(struct pci_bus *linkbus)
{
	struct pci_dev *child;

	list_for_each_entry(child, &linkbus->devices, bus_list)
		if (PCI_FUNC(child->devfn) == 0)
			return child;
	return NULL;
}

496 497 498 499 500 501
/* Calculate L1.2 PM substate timing parameters */
static void aspm_calc_l1ss_info(struct pcie_link_state *link,
				struct aspm_register_info *upreg,
				struct aspm_register_info *dwreg)
{
	u32 val1, val2, scale1, scale2;
502
	u32 t_common_mode, t_power_on, l1_2_threshold, scale, value;
503 504 505 506 507 508 509 510

	link->l1ss.up_cap_ptr = upreg->l1ss_cap_ptr;
	link->l1ss.dw_cap_ptr = dwreg->l1ss_cap_ptr;
	link->l1ss.ctl1 = link->l1ss.ctl2 = 0;

	if (!(link->aspm_support & ASPM_STATE_L1_2_MASK))
		return;

511 512 513
	/* Choose the greater of the two Port Common_Mode_Restore_Times */
	val1 = (upreg->l1ss_cap & PCI_L1SS_CAP_CM_RESTORE_TIME) >> 8;
	val2 = (dwreg->l1ss_cap & PCI_L1SS_CAP_CM_RESTORE_TIME) >> 8;
514
	t_common_mode = max(val1, val2);
515

516 517 518 519 520
	/* Choose the greater of the two Port T_POWER_ON times */
	val1   = (upreg->l1ss_cap & PCI_L1SS_CAP_P_PWR_ON_VALUE) >> 19;
	scale1 = (upreg->l1ss_cap & PCI_L1SS_CAP_P_PWR_ON_SCALE) >> 16;
	val2   = (dwreg->l1ss_cap & PCI_L1SS_CAP_P_PWR_ON_VALUE) >> 19;
	scale2 = (dwreg->l1ss_cap & PCI_L1SS_CAP_P_PWR_ON_SCALE) >> 16;
521 522

	if (calc_l1ss_pwron(link->pdev, scale1, val1) >
523
	    calc_l1ss_pwron(link->downstream, scale2, val2)) {
524
		link->l1ss.ctl2 |= scale1 | (val1 << 3);
525 526
		t_power_on = calc_l1ss_pwron(link->pdev, scale1, val1);
	} else {
527
		link->l1ss.ctl2 |= scale2 | (val2 << 3);
528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543
		t_power_on = calc_l1ss_pwron(link->downstream, scale2, val2);
	}

	/*
	 * Set LTR_L1.2_THRESHOLD to the time required to transition the
	 * Link from L0 to L1.2 and back to L0 so we enter L1.2 only if
	 * downstream devices report (via LTR) that they can tolerate at
	 * least that much latency.
	 *
	 * Based on PCIe r3.1, sec 5.5.3.3.1, Figures 5-16 and 5-17, and
	 * Table 5-11.  T(POWER_OFF) is at most 2us and T(L1.2) is at
	 * least 4us.
	 */
	l1_2_threshold = 2 + 4 + t_common_mode + t_power_on;
	encode_l12_threshold(l1_2_threshold, &scale, &value);
	link->l1ss.ctl1 |= t_common_mode << 8 | scale << 29 | value << 16;
544 545
}

546
static void pcie_aspm_cap_init(struct pcie_link_state *link, int blacklist)
S
Shaohua Li 已提交
547
{
548
	struct pci_dev *child = link->downstream, *parent = link->pdev;
549
	struct pci_bus *linkbus = parent->subordinate;
550
	struct aspm_register_info upreg, dwreg;
S
Shaohua Li 已提交
551

552
	if (blacklist) {
553
		/* Set enabled/disable so that we will disable ASPM later */
554 555
		link->aspm_enabled = ASPM_STATE_ALL;
		link->aspm_disable = ASPM_STATE_ALL;
556 557 558
		return;
	}

559 560 561 562 563 564 565 566 567 568 569
	/* Get upstream/downstream components' register state */
	pcie_get_aspm_reg(parent, &upreg);
	pcie_get_aspm_reg(child, &dwreg);

	/*
	 * If ASPM not supported, don't mess with the clocks and link,
	 * bail out now.
	 */
	if (!(upreg.support & dwreg.support))
		return;

570 571 572
	/* Configure common clock before checking latencies */
	pcie_aspm_configure_common_clock(link);

573 574 575 576
	/*
	 * Re-read upstream/downstream components' register state
	 * after clock configuration
	 */
577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602
	pcie_get_aspm_reg(parent, &upreg);
	pcie_get_aspm_reg(child, &dwreg);

	/*
	 * Setup L0s state
	 *
	 * Note that we must not enable L0s in either direction on a
	 * given link unless components on both sides of the link each
	 * support L0s.
	 */
	if (dwreg.support & upreg.support & PCIE_LINK_STATE_L0S)
		link->aspm_support |= ASPM_STATE_L0S;
	if (dwreg.enabled & PCIE_LINK_STATE_L0S)
		link->aspm_enabled |= ASPM_STATE_L0S_UP;
	if (upreg.enabled & PCIE_LINK_STATE_L0S)
		link->aspm_enabled |= ASPM_STATE_L0S_DW;
	link->latency_up.l0s = calc_l0s_latency(upreg.latency_encoding_l0s);
	link->latency_dw.l0s = calc_l0s_latency(dwreg.latency_encoding_l0s);

	/* Setup L1 state */
	if (upreg.support & dwreg.support & PCIE_LINK_STATE_L1)
		link->aspm_support |= ASPM_STATE_L1;
	if (upreg.enabled & dwreg.enabled & PCIE_LINK_STATE_L1)
		link->aspm_enabled |= ASPM_STATE_L1;
	link->latency_up.l1 = calc_l1_latency(upreg.latency_encoding_l1);
	link->latency_dw.l1 = calc_l1_latency(dwreg.latency_encoding_l1);
603

604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622
	/* Setup L1 substate */
	if (upreg.l1ss_cap & dwreg.l1ss_cap & PCI_L1SS_CAP_ASPM_L1_1)
		link->aspm_support |= ASPM_STATE_L1_1;
	if (upreg.l1ss_cap & dwreg.l1ss_cap & PCI_L1SS_CAP_ASPM_L1_2)
		link->aspm_support |= ASPM_STATE_L1_2;
	if (upreg.l1ss_cap & dwreg.l1ss_cap & PCI_L1SS_CAP_PCIPM_L1_1)
		link->aspm_support |= ASPM_STATE_L1_1_PCIPM;
	if (upreg.l1ss_cap & dwreg.l1ss_cap & PCI_L1SS_CAP_PCIPM_L1_2)
		link->aspm_support |= ASPM_STATE_L1_2_PCIPM;

	if (upreg.l1ss_ctl1 & dwreg.l1ss_ctl1 & PCI_L1SS_CTL1_ASPM_L1_1)
		link->aspm_enabled |= ASPM_STATE_L1_1;
	if (upreg.l1ss_ctl1 & dwreg.l1ss_ctl1 & PCI_L1SS_CTL1_ASPM_L1_2)
		link->aspm_enabled |= ASPM_STATE_L1_2;
	if (upreg.l1ss_ctl1 & dwreg.l1ss_ctl1 & PCI_L1SS_CTL1_PCIPM_L1_1)
		link->aspm_enabled |= ASPM_STATE_L1_1_PCIPM;
	if (upreg.l1ss_ctl1 & dwreg.l1ss_ctl1 & PCI_L1SS_CTL1_PCIPM_L1_2)
		link->aspm_enabled |= ASPM_STATE_L1_2_PCIPM;

623 624 625
	if (link->aspm_support & ASPM_STATE_L1SS)
		aspm_calc_l1ss_info(link, &upreg, &dwreg);

626 627
	/* Save default state */
	link->aspm_default = link->aspm_enabled;
628 629 630

	/* Setup initial capable state. Will be updated later */
	link->aspm_capable = link->aspm_support;
631 632 633 634 635
	/*
	 * If the downstream component has pci bridge function, don't
	 * do ASPM for now.
	 */
	list_for_each_entry(child, &linkbus->devices, bus_list) {
636
		if (pci_pcie_type(child) == PCI_EXP_TYPE_PCI_BRIDGE) {
637
			link->aspm_disable = ASPM_STATE_ALL;
638 639 640
			break;
		}
	}
641

642
	/* Get and check endpoint acceptable latencies */
643
	list_for_each_entry(child, &linkbus->devices, bus_list) {
644
		u32 reg32, encoding;
645
		struct aspm_latency *acceptable =
646
			&link->acceptable[PCI_FUNC(child->devfn)];
S
Shaohua Li 已提交
647

648 649
		if (pci_pcie_type(child) != PCI_EXP_TYPE_ENDPOINT &&
		    pci_pcie_type(child) != PCI_EXP_TYPE_LEG_END)
S
Shaohua Li 已提交
650 651
			continue;

652
		pcie_capability_read_dword(child, PCI_EXP_DEVCAP, &reg32);
653
		/* Calculate endpoint L0s acceptable latency */
654 655
		encoding = (reg32 & PCI_EXP_DEVCAP_L0S) >> 6;
		acceptable->l0s = calc_l0s_acceptable(encoding);
656 657 658 659 660
		/* Calculate endpoint L1 acceptable latency */
		encoding = (reg32 & PCI_EXP_DEVCAP_L1) >> 9;
		acceptable->l1 = calc_l1_acceptable(encoding);

		pcie_aspm_check_latency(child);
S
Shaohua Li 已提交
661 662 663
	}
}

664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715
static void pci_clear_and_set_dword(struct pci_dev *pdev, int pos,
				    u32 clear, u32 set)
{
	u32 val;

	pci_read_config_dword(pdev, pos, &val);
	val &= ~clear;
	val |= set;
	pci_write_config_dword(pdev, pos, val);
}

/* Configure the ASPM L1 substates */
static void pcie_config_aspm_l1ss(struct pcie_link_state *link, u32 state)
{
	u32 val, enable_req;
	struct pci_dev *child = link->downstream, *parent = link->pdev;
	u32 up_cap_ptr = link->l1ss.up_cap_ptr;
	u32 dw_cap_ptr = link->l1ss.dw_cap_ptr;

	enable_req = (link->aspm_enabled ^ state) & state;

	/*
	 * Here are the rules specified in the PCIe spec for enabling L1SS:
	 * - When enabling L1.x, enable bit at parent first, then at child
	 * - When disabling L1.x, disable bit at child first, then at parent
	 * - When enabling ASPM L1.x, need to disable L1
	 *   (at child followed by parent).
	 * - The ASPM/PCIPM L1.2 must be disabled while programming timing
	 *   parameters
	 *
	 * To keep it simple, disable all L1SS bits first, and later enable
	 * what is needed.
	 */

	/* Disable all L1 substates */
	pci_clear_and_set_dword(child, dw_cap_ptr + PCI_L1SS_CTL1,
				PCI_L1SS_CTL1_L1SS_MASK, 0);
	pci_clear_and_set_dword(parent, up_cap_ptr + PCI_L1SS_CTL1,
				PCI_L1SS_CTL1_L1SS_MASK, 0);
	/*
	 * If needed, disable L1, and it gets enabled later
	 * in pcie_config_aspm_link().
	 */
	if (enable_req & (ASPM_STATE_L1_1 | ASPM_STATE_L1_2)) {
		pcie_capability_clear_and_set_word(child, PCI_EXP_LNKCTL,
						   PCI_EXP_LNKCTL_ASPM_L1, 0);
		pcie_capability_clear_and_set_word(parent, PCI_EXP_LNKCTL,
						   PCI_EXP_LNKCTL_ASPM_L1, 0);
	}

	if (enable_req & ASPM_STATE_L1_2_MASK) {

716
		/* Program T_POWER_ON times in both ports */
717 718 719 720 721
		pci_write_config_dword(parent, up_cap_ptr + PCI_L1SS_CTL2,
				       link->l1ss.ctl2);
		pci_write_config_dword(child, dw_cap_ptr + PCI_L1SS_CTL2,
				       link->l1ss.ctl2);

722
		/* Program Common_Mode_Restore_Time in upstream device */
723
		pci_clear_and_set_dword(parent, up_cap_ptr + PCI_L1SS_CTL1,
724 725
					PCI_L1SS_CTL1_CM_RESTORE_TIME,
					link->l1ss.ctl1);
726

727
		/* Program LTR_L1.2_THRESHOLD time in both ports */
728
		pci_clear_and_set_dword(parent,	up_cap_ptr + PCI_L1SS_CTL1,
729 730 731
					PCI_L1SS_CTL1_LTR_L12_TH_VALUE |
					PCI_L1SS_CTL1_LTR_L12_TH_SCALE,
					link->l1ss.ctl1);
732
		pci_clear_and_set_dword(child, dw_cap_ptr + PCI_L1SS_CTL1,
733 734 735
					PCI_L1SS_CTL1_LTR_L12_TH_VALUE |
					PCI_L1SS_CTL1_LTR_L12_TH_SCALE,
					link->l1ss.ctl1);
736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754
	}

	val = 0;
	if (state & ASPM_STATE_L1_1)
		val |= PCI_L1SS_CTL1_ASPM_L1_1;
	if (state & ASPM_STATE_L1_2)
		val |= PCI_L1SS_CTL1_ASPM_L1_2;
	if (state & ASPM_STATE_L1_1_PCIPM)
		val |= PCI_L1SS_CTL1_PCIPM_L1_1;
	if (state & ASPM_STATE_L1_2_PCIPM)
		val |= PCI_L1SS_CTL1_PCIPM_L1_2;

	/* Enable what we need to enable */
	pci_clear_and_set_dword(parent, up_cap_ptr + PCI_L1SS_CTL1,
				PCI_L1SS_CAP_L1_PM_SS, val);
	pci_clear_and_set_dword(child, dw_cap_ptr + PCI_L1SS_CTL1,
				PCI_L1SS_CAP_L1_PM_SS, val);
}

755
static void pcie_config_aspm_dev(struct pci_dev *pdev, u32 val)
S
Shaohua Li 已提交
756
{
757 758
	pcie_capability_clear_and_set_word(pdev, PCI_EXP_LNKCTL,
					   PCI_EXP_LNKCTL_ASPMC, val);
S
Shaohua Li 已提交
759 760
}

761
static void pcie_config_aspm_link(struct pcie_link_state *link, u32 state)
S
Shaohua Li 已提交
762
{
763
	u32 upstream = 0, dwstream = 0;
764
	struct pci_dev *child = link->downstream, *parent = link->pdev;
765
	struct pci_bus *linkbus = parent->subordinate;
S
Shaohua Li 已提交
766

767
	/* Enable only the states that were not explicitly disabled */
768
	state &= (link->aspm_capable & ~link->aspm_disable);
769 770 771 772 773 774 775 776 777 778 779 780

	/* Can't enable any substates if L1 is not enabled */
	if (!(state & ASPM_STATE_L1))
		state &= ~ASPM_STATE_L1SS;

	/* Spec says both ports must be in D0 before enabling PCI PM substates*/
	if (parent->current_state != PCI_D0 || child->current_state != PCI_D0) {
		state &= ~ASPM_STATE_L1_SS_PCIPM;
		state |= (link->aspm_enabled & ASPM_STATE_L1_SS_PCIPM);
	}

	/* Nothing to do if the link is already in the requested state */
781 782
	if (link->aspm_enabled == state)
		return;
783 784
	/* Convert ASPM state to upstream/downstream ASPM register state */
	if (state & ASPM_STATE_L0S_UP)
785
		dwstream |= PCI_EXP_LNKCTL_ASPM_L0S;
786
	if (state & ASPM_STATE_L0S_DW)
787
		upstream |= PCI_EXP_LNKCTL_ASPM_L0S;
788
	if (state & ASPM_STATE_L1) {
789 790
		upstream |= PCI_EXP_LNKCTL_ASPM_L1;
		dwstream |= PCI_EXP_LNKCTL_ASPM_L1;
791
	}
792 793 794 795

	if (link->aspm_capable & ASPM_STATE_L1SS)
		pcie_config_aspm_l1ss(link, state);

S
Shaohua Li 已提交
796
	/*
797 798 799 800
	 * Spec 2.0 suggests all functions should be configured the
	 * same setting for ASPM. Enabling ASPM L1 should be done in
	 * upstream component first and then downstream, and vice
	 * versa for disabling ASPM L1. Spec doesn't mention L0S.
S
Shaohua Li 已提交
801
	 */
802 803
	if (state & ASPM_STATE_L1)
		pcie_config_aspm_dev(parent, upstream);
804
	list_for_each_entry(child, &linkbus->devices, bus_list)
805 806 807
		pcie_config_aspm_dev(child, dwstream);
	if (!(state & ASPM_STATE_L1))
		pcie_config_aspm_dev(parent, upstream);
S
Shaohua Li 已提交
808

809
	link->aspm_enabled = state;
S
Shaohua Li 已提交
810 811
}

812
static void pcie_config_aspm_path(struct pcie_link_state *link)
S
Shaohua Li 已提交
813
{
814 815 816
	while (link) {
		pcie_config_aspm_link(link, policy_to_aspm_state(link));
		link = link->parent;
817
	}
S
Shaohua Li 已提交
818 819
}

820
static void free_link_state(struct pcie_link_state *link)
S
Shaohua Li 已提交
821
{
822 823
	link->pdev->link_state = NULL;
	kfree(link);
S
Shaohua Li 已提交
824 825
}

826 827
static int pcie_aspm_sanity_check(struct pci_dev *pdev)
{
828
	struct pci_dev *child;
829
	u32 reg32;
830

831
	/*
832
	 * Some functions in a slot might not all be PCIe functions,
833
	 * very strange. Disable ASPM for the whole slot
834
	 */
835
	list_for_each_entry(child, &pdev->subordinate->devices, bus_list) {
836
		if (!pci_is_pcie(child))
837
			return -EINVAL;
838 839 840 841 842 843 844 845 846 847

		/*
		 * If ASPM is disabled then we're not going to change
		 * the BIOS state. It's safe to continue even if it's a
		 * pre-1.1 device
		 */

		if (aspm_disabled)
			continue;

848 849 850 851
		/*
		 * Disable ASPM for pre-1.1 PCIe device, we follow MS to use
		 * RBER bit to determine if a function is 1.1 version device
		 */
852
		pcie_capability_read_dword(child, PCI_EXP_DEVCAP, &reg32);
S
Sitsofe Wheeler 已提交
853
		if (!(reg32 & PCI_EXP_DEVCAP_RBER) && !aspm_force) {
854
			pci_info(child, "disabling ASPM on pre-1.1 PCIe device.  You can enable it with 'pcie_aspm=force'\n");
855 856
			return -EINVAL;
		}
857 858 859 860
	}
	return 0;
}

861
static struct pcie_link_state *alloc_pcie_link_state(struct pci_dev *pdev)
862 863 864 865 866 867
{
	struct pcie_link_state *link;

	link = kzalloc(sizeof(*link), GFP_KERNEL);
	if (!link)
		return NULL;
868

869 870 871 872
	INIT_LIST_HEAD(&link->sibling);
	INIT_LIST_HEAD(&link->children);
	INIT_LIST_HEAD(&link->link);
	link->pdev = pdev;
873
	link->downstream = pci_function_0(pdev->subordinate);
874 875 876

	/*
	 * Root Ports and PCI/PCI-X to PCIe Bridges are roots of PCIe
877 878 879 880
	 * hierarchies.  Note that some PCIe host implementations omit
	 * the root ports entirely, in which case a downstream port on
	 * a switch may become the root of the link state chain for all
	 * its subordinate endpoints.
881 882
	 */
	if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT ||
883 884
	    pci_pcie_type(pdev) == PCI_EXP_TYPE_PCIE_BRIDGE ||
	    !pdev->bus->parent->self) {
885 886
		link->root = link;
	} else {
887
		struct pcie_link_state *parent;
888

889 890 891 892 893
		parent = pdev->bus->parent->self->link_state;
		if (!parent) {
			kfree(link);
			return NULL;
		}
894

895
		link->parent = parent;
896
		link->root = link->parent->root;
897 898
		list_add(&link->link, &parent->children);
	}
899

900 901 902 903 904
	list_add(&link->sibling, &link_list);
	pdev->link_state = link;
	return link;
}

S
Shaohua Li 已提交
905 906
/*
 * pcie_aspm_init_link_state: Initiate PCI express link state.
907
 * It is called after the pcie and its children devices are scanned.
S
Shaohua Li 已提交
908 909 910 911
 * @pdev: the root port or switch downstream port
 */
void pcie_aspm_init_link_state(struct pci_dev *pdev)
{
912
	struct pcie_link_state *link;
913
	int blacklist = !!pcie_aspm_sanity_check(pdev);
S
Shaohua Li 已提交
914

915 916 917
	if (!aspm_support_enabled)
		return;

918
	if (pdev->link_state)
S
Shaohua Li 已提交
919
		return;
920 921 922 923 924 925 926

	/*
	 * We allocate pcie_link_state for the component on the upstream
	 * end of a Link, so there's nothing to do unless this device has a
	 * Link on its secondary side.
	 */
	if (!pdev->has_secondary_link)
S
Shaohua Li 已提交
927
		return;
928

929
	/* VIA has a strange chipset, root port is under a bridge */
930
	if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT &&
931
	    pdev->bus->self)
932
		return;
933

S
Shaohua Li 已提交
934 935 936 937 938
	down_read(&pci_bus_sem);
	if (list_empty(&pdev->subordinate->devices))
		goto out;

	mutex_lock(&aspm_lock);
939
	link = alloc_pcie_link_state(pdev);
940 941 942
	if (!link)
		goto unlock;
	/*
943 944 945
	 * Setup initial ASPM state. Note that we need to configure
	 * upstream links also because capable state of them can be
	 * update through pcie_aspm_cap_init().
946
	 */
947
	pcie_aspm_cap_init(link, blacklist);
S
Shaohua Li 已提交
948

949
	/* Setup initial Clock PM state */
950
	pcie_clkpm_cap_init(link, blacklist);
951 952 953 954 955 956 957 958 959

	/*
	 * At this stage drivers haven't had an opportunity to change the
	 * link policy setting. Enabling ASPM on broken hardware can cripple
	 * it even before the driver has had a chance to disable ASPM, so
	 * default to a safe level right now. If we're enabling ASPM beyond
	 * the BIOS's expectation, we'll do so once pci_enable_device() is
	 * called.
	 */
960 961
	if (aspm_policy != POLICY_POWERSAVE &&
	    aspm_policy != POLICY_POWER_SUPERSAVE) {
962 963 964 965
		pcie_config_aspm_path(link);
		pcie_set_clkpm(link, policy_to_clkpm_state(link));
	}

966
unlock:
S
Shaohua Li 已提交
967 968 969 970 971
	mutex_unlock(&aspm_lock);
out:
	up_read(&pci_bus_sem);
}

972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987
/* Recheck latencies and update aspm_capable for links under the root */
static void pcie_update_aspm_capable(struct pcie_link_state *root)
{
	struct pcie_link_state *link;
	BUG_ON(root->parent);
	list_for_each_entry(link, &link_list, sibling) {
		if (link->root != root)
			continue;
		link->aspm_capable = link->aspm_support;
	}
	list_for_each_entry(link, &link_list, sibling) {
		struct pci_dev *child;
		struct pci_bus *linkbus = link->pdev->subordinate;
		if (link->root != root)
			continue;
		list_for_each_entry(child, &linkbus->devices, bus_list) {
988 989
			if ((pci_pcie_type(child) != PCI_EXP_TYPE_ENDPOINT) &&
			    (pci_pcie_type(child) != PCI_EXP_TYPE_LEG_END))
990 991 992 993 994 995
				continue;
			pcie_aspm_check_latency(child);
		}
	}
}

S
Shaohua Li 已提交
996 997 998 999
/* @pdev: the endpoint device */
void pcie_aspm_exit_link_state(struct pci_dev *pdev)
{
	struct pci_dev *parent = pdev->bus->self;
1000
	struct pcie_link_state *link, *root, *parent_link;
S
Shaohua Li 已提交
1001

1002
	if (!parent || !parent->link_state)
S
Shaohua Li 已提交
1003
		return;
1004

S
Shaohua Li 已提交
1005 1006 1007 1008
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	/*
	 * All PCIe functions are in one slot, remove one function will remove
1009
	 * the whole slot, so just wait until we are the last function left.
S
Shaohua Li 已提交
1010
	 */
1011
	if (!list_empty(&parent->subordinate->devices))
S
Shaohua Li 已提交
1012 1013
		goto out;

1014
	link = parent->link_state;
1015
	root = link->root;
1016
	parent_link = link->parent;
1017

S
Shaohua Li 已提交
1018
	/* All functions are removed, so just disable ASPM for the link */
1019
	pcie_config_aspm_link(link, 0);
1020 1021
	list_del(&link->sibling);
	list_del(&link->link);
S
Shaohua Li 已提交
1022
	/* Clock PM is for endpoint device */
1023
	free_link_state(link);
1024 1025

	/* Recheck latencies and configure upstream links */
1026 1027 1028 1029
	if (parent_link) {
		pcie_update_aspm_capable(root);
		pcie_config_aspm_path(parent_link);
	}
S
Shaohua Li 已提交
1030 1031 1032 1033 1034 1035 1036 1037
out:
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}

/* @pdev: the root port or switch downstream port */
void pcie_aspm_pm_state_change(struct pci_dev *pdev)
{
1038
	struct pcie_link_state *link = pdev->link_state;
S
Shaohua Li 已提交
1039

1040
	if (aspm_disabled || !link)
S
Shaohua Li 已提交
1041 1042
		return;
	/*
1043 1044
	 * Devices changed PM state, we should recheck if latency
	 * meets all functions' requirement
S
Shaohua Li 已提交
1045
	 */
1046 1047 1048
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	pcie_update_aspm_capable(link->root);
1049
	pcie_config_aspm_path(link);
1050 1051
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
S
Shaohua Li 已提交
1052 1053
}

1054 1055 1056 1057
void pcie_aspm_powersave_config_link(struct pci_dev *pdev)
{
	struct pcie_link_state *link = pdev->link_state;

1058
	if (aspm_disabled || !link)
1059 1060
		return;

1061 1062
	if (aspm_policy != POLICY_POWERSAVE &&
	    aspm_policy != POLICY_POWER_SUPERSAVE)
1063 1064 1065 1066 1067 1068 1069 1070 1071 1072
		return;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	pcie_config_aspm_path(link);
	pcie_set_clkpm(link, policy_to_clkpm_state(link));
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
}

1073
static void __pci_disable_link_state(struct pci_dev *pdev, int state, bool sem)
S
Shaohua Li 已提交
1074 1075
{
	struct pci_dev *parent = pdev->bus->self;
1076
	struct pcie_link_state *link;
S
Shaohua Li 已提交
1077

M
Matthew Garrett 已提交
1078
	if (!pci_is_pcie(pdev))
S
Shaohua Li 已提交
1079
		return;
M
Matthew Garrett 已提交
1080

1081
	if (pdev->has_secondary_link)
S
Shaohua Li 已提交
1082 1083 1084 1085
		parent = pdev;
	if (!parent || !parent->link_state)
		return;

1086 1087 1088 1089 1090 1091 1092 1093
	/*
	 * A driver requested that ASPM be disabled on this device, but
	 * if we don't have permission to manage ASPM (e.g., on ACPI
	 * systems we have to observe the FADT ACPI_FADT_NO_ASPM bit and
	 * the _OSC method), we can't honor that request.  Windows has
	 * a similar mechanism using "PciASPMOptOut", which is also
	 * ignored in this situation.
	 */
1094
	if (aspm_disabled) {
1095
		pci_warn(pdev, "can't disable ASPM; OS doesn't have ASPM control\n");
1096 1097 1098
		return;
	}

1099 1100
	if (sem)
		down_read(&pci_bus_sem);
S
Shaohua Li 已提交
1101
	mutex_lock(&aspm_lock);
1102
	link = parent->link_state;
1103 1104 1105 1106
	if (state & PCIE_LINK_STATE_L0S)
		link->aspm_disable |= ASPM_STATE_L0S;
	if (state & PCIE_LINK_STATE_L1)
		link->aspm_disable |= ASPM_STATE_L1;
1107 1108
	pcie_config_aspm_link(link, policy_to_aspm_state(link));

K
Kenji Kaneshige 已提交
1109
	if (state & PCIE_LINK_STATE_CLKPM) {
1110 1111
		link->clkpm_capable = 0;
		pcie_set_clkpm(link, 0);
K
Kenji Kaneshige 已提交
1112
	}
S
Shaohua Li 已提交
1113
	mutex_unlock(&aspm_lock);
1114 1115 1116 1117 1118 1119
	if (sem)
		up_read(&pci_bus_sem);
}

void pci_disable_link_state_locked(struct pci_dev *pdev, int state)
{
1120
	__pci_disable_link_state(pdev, state, false);
1121 1122 1123
}
EXPORT_SYMBOL(pci_disable_link_state_locked);

1124 1125 1126 1127 1128 1129 1130 1131 1132
/**
 * pci_disable_link_state - Disable device's link state, so the link will
 * never enter specific states.  Note that if the BIOS didn't grant ASPM
 * control to the OS, this does nothing because we can't touch the LNKCTL
 * register.
 *
 * @pdev: PCI device
 * @state: ASPM link state to disable
 */
1133 1134
void pci_disable_link_state(struct pci_dev *pdev, int state)
{
1135
	__pci_disable_link_state(pdev, state, true);
S
Shaohua Li 已提交
1136 1137 1138
}
EXPORT_SYMBOL(pci_disable_link_state);

1139 1140
static int pcie_aspm_set_policy(const char *val,
				const struct kernel_param *kp)
S
Shaohua Li 已提交
1141 1142
{
	int i;
1143
	struct pcie_link_state *link;
S
Shaohua Li 已提交
1144

1145 1146
	if (aspm_disabled)
		return -EPERM;
1147 1148 1149
	i = sysfs_match_string(policy_str, val);
	if (i < 0)
		return i;
S
Shaohua Li 已提交
1150 1151 1152 1153 1154 1155
	if (i == aspm_policy)
		return 0;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	aspm_policy = i;
1156 1157 1158
	list_for_each_entry(link, &link_list, sibling) {
		pcie_config_aspm_link(link, policy_to_aspm_state(link));
		pcie_set_clkpm(link, policy_to_clkpm_state(link));
S
Shaohua Li 已提交
1159 1160 1161 1162 1163 1164
	}
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
	return 0;
}

1165
static int pcie_aspm_get_policy(char *buffer, const struct kernel_param *kp)
S
Shaohua Li 已提交
1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186
{
	int i, cnt = 0;
	for (i = 0; i < ARRAY_SIZE(policy_str); i++)
		if (i == aspm_policy)
			cnt += sprintf(buffer + cnt, "[%s] ", policy_str[i]);
		else
			cnt += sprintf(buffer + cnt, "%s ", policy_str[i]);
	return cnt;
}

module_param_call(policy, pcie_aspm_set_policy, pcie_aspm_get_policy,
	NULL, 0644);

#ifdef CONFIG_PCIEASPM_DEBUG
static ssize_t link_state_show(struct device *dev,
		struct device_attribute *attr,
		char *buf)
{
	struct pci_dev *pci_device = to_pci_dev(dev);
	struct pcie_link_state *link_state = pci_device->link_state;

1187
	return sprintf(buf, "%d\n", link_state->aspm_enabled);
S
Shaohua Li 已提交
1188 1189 1190 1191 1192 1193 1194
}

static ssize_t link_state_store(struct device *dev,
		struct device_attribute *attr,
		const char *buf,
		size_t n)
{
1195
	struct pci_dev *pdev = to_pci_dev(dev);
1196
	struct pcie_link_state *link, *root = pdev->link_state->root;
1197
	u32 state;
S
Shaohua Li 已提交
1198

1199 1200
	if (aspm_disabled)
		return -EPERM;
S
Shaohua Li 已提交
1201

1202 1203 1204 1205
	if (kstrtouint(buf, 10, &state))
		return -EINVAL;
	if ((state & ~ASPM_STATE_ALL) != 0)
		return -EINVAL;
1206

1207 1208 1209 1210 1211 1212 1213 1214 1215 1216
	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
	list_for_each_entry(link, &link_list, sibling) {
		if (link->root != root)
			continue;
		pcie_config_aspm_link(link, state);
	}
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);
	return n;
S
Shaohua Li 已提交
1217 1218 1219 1220 1221 1222 1223 1224 1225
}

static ssize_t clk_ctl_show(struct device *dev,
		struct device_attribute *attr,
		char *buf)
{
	struct pci_dev *pci_device = to_pci_dev(dev);
	struct pcie_link_state *link_state = pci_device->link_state;

1226
	return sprintf(buf, "%d\n", link_state->clkpm_enabled);
S
Shaohua Li 已提交
1227 1228 1229 1230 1231 1232 1233
}

static ssize_t clk_ctl_store(struct device *dev,
		struct device_attribute *attr,
		const char *buf,
		size_t n)
{
K
Kenji Kaneshige 已提交
1234
	struct pci_dev *pdev = to_pci_dev(dev);
1235
	bool state;
S
Shaohua Li 已提交
1236

1237
	if (strtobool(buf, &state))
S
Shaohua Li 已提交
1238 1239 1240 1241
		return -EINVAL;

	down_read(&pci_bus_sem);
	mutex_lock(&aspm_lock);
1242
	pcie_set_clkpm_nocheck(pdev->link_state, state);
S
Shaohua Li 已提交
1243 1244 1245 1246 1247 1248
	mutex_unlock(&aspm_lock);
	up_read(&pci_bus_sem);

	return n;
}

1249 1250
static DEVICE_ATTR_RW(link_state);
static DEVICE_ATTR_RW(clk_ctl);
S
Shaohua Li 已提交
1251 1252 1253 1254 1255 1256

static char power_group[] = "power";
void pcie_aspm_create_sysfs_dev_files(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

1257
	if (!link_state)
S
Shaohua Li 已提交
1258 1259
		return;

1260
	if (link_state->aspm_support)
S
Shaohua Li 已提交
1261 1262
		sysfs_add_file_to_group(&pdev->dev.kobj,
			&dev_attr_link_state.attr, power_group);
1263
	if (link_state->clkpm_capable)
S
Shaohua Li 已提交
1264 1265 1266 1267 1268 1269 1270 1271
		sysfs_add_file_to_group(&pdev->dev.kobj,
			&dev_attr_clk_ctl.attr, power_group);
}

void pcie_aspm_remove_sysfs_dev_files(struct pci_dev *pdev)
{
	struct pcie_link_state *link_state = pdev->link_state;

1272
	if (!link_state)
S
Shaohua Li 已提交
1273 1274
		return;

1275
	if (link_state->aspm_support)
S
Shaohua Li 已提交
1276 1277
		sysfs_remove_file_from_group(&pdev->dev.kobj,
			&dev_attr_link_state.attr, power_group);
1278
	if (link_state->clkpm_capable)
S
Shaohua Li 已提交
1279 1280 1281 1282 1283 1284 1285
		sysfs_remove_file_from_group(&pdev->dev.kobj,
			&dev_attr_clk_ctl.attr, power_group);
}
#endif

static int __init pcie_aspm_disable(char *str)
{
1286
	if (!strcmp(str, "off")) {
M
Matthew Garrett 已提交
1287
		aspm_policy = POLICY_DEFAULT;
1288
		aspm_disabled = 1;
1289
		aspm_support_enabled = false;
1290 1291 1292
		printk(KERN_INFO "PCIe ASPM is disabled\n");
	} else if (!strcmp(str, "force")) {
		aspm_force = 1;
M
Michael Witten 已提交
1293
		printk(KERN_INFO "PCIe ASPM is forcibly enabled\n");
1294
	}
S
Shaohua Li 已提交
1295 1296 1297
	return 1;
}

1298
__setup("pcie_aspm=", pcie_aspm_disable);
S
Shaohua Li 已提交
1299

1300 1301
void pcie_no_aspm(void)
{
M
Matthew Garrett 已提交
1302 1303 1304 1305 1306 1307 1308 1309
	/*
	 * Disabling ASPM is intended to prevent the kernel from modifying
	 * existing hardware state, not to clear existing state. To that end:
	 * (a) set policy to POLICY_DEFAULT in order to avoid changing state
	 * (b) prevent userspace from changing policy
	 */
	if (!aspm_force) {
		aspm_policy = POLICY_DEFAULT;
1310
		aspm_disabled = 1;
M
Matthew Garrett 已提交
1311
	}
1312 1313
}

1314 1315 1316 1317 1318
bool pcie_aspm_support_enabled(void)
{
	return aspm_support_enabled;
}
EXPORT_SYMBOL(pcie_aspm_support_enabled);