printf: Remove unused 'bprintf'
[drm/drm-misc.git] / drivers / pci / pcie / aspm.c
blob28567d457613bf4e40c892ded718861ce1546fa7
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3 * Enable PCIe link L0s/L1 state and Clock Power Management
5 * Copyright (C) 2007 Intel
6 * Copyright (C) Zhang Yanmin (yanmin.zhang@intel.com)
7 * Copyright (C) Shaohua Li (shaohua.li@intel.com)
8 */
10 #include <linux/bitfield.h>
11 #include <linux/bits.h>
12 #include <linux/build_bug.h>
13 #include <linux/kernel.h>
14 #include <linux/limits.h>
15 #include <linux/math.h>
16 #include <linux/module.h>
17 #include <linux/moduleparam.h>
18 #include <linux/pci.h>
19 #include <linux/pci_regs.h>
20 #include <linux/errno.h>
21 #include <linux/pm.h>
22 #include <linux/init.h>
23 #include <linux/printk.h>
24 #include <linux/slab.h>
25 #include <linux/time.h>
27 #include "../pci.h"
29 void pci_save_ltr_state(struct pci_dev *dev)
31 int ltr;
32 struct pci_cap_saved_state *save_state;
33 u32 *cap;
35 if (!pci_is_pcie(dev))
36 return;
38 ltr = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_LTR);
39 if (!ltr)
40 return;
42 save_state = pci_find_saved_ext_cap(dev, PCI_EXT_CAP_ID_LTR);
43 if (!save_state) {
44 pci_err(dev, "no suspend buffer for LTR; ASPM issues possible after resume\n");
45 return;
48 /* Some broken devices only support dword access to LTR */
49 cap = &save_state->cap.data[0];
50 pci_read_config_dword(dev, ltr + PCI_LTR_MAX_SNOOP_LAT, cap);
53 void pci_restore_ltr_state(struct pci_dev *dev)
55 struct pci_cap_saved_state *save_state;
56 int ltr;
57 u32 *cap;
59 save_state = pci_find_saved_ext_cap(dev, PCI_EXT_CAP_ID_LTR);
60 ltr = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_LTR);
61 if (!save_state || !ltr)
62 return;
64 /* Some broken devices only support dword access to LTR */
65 cap = &save_state->cap.data[0];
66 pci_write_config_dword(dev, ltr + PCI_LTR_MAX_SNOOP_LAT, *cap);
69 void pci_configure_aspm_l1ss(struct pci_dev *pdev)
71 int rc;
73 pdev->l1ss = pci_find_ext_capability(pdev, PCI_EXT_CAP_ID_L1SS);
75 rc = pci_add_ext_cap_save_buffer(pdev, PCI_EXT_CAP_ID_L1SS,
76 2 * sizeof(u32));
77 if (rc)
78 pci_err(pdev, "unable to allocate ASPM L1SS save buffer (%pe)\n",
79 ERR_PTR(rc));
82 void pci_save_aspm_l1ss_state(struct pci_dev *pdev)
84 struct pci_cap_saved_state *save_state;
85 u16 l1ss = pdev->l1ss;
86 u32 *cap;
89 * Save L1 substate configuration. The ASPM L0s/L1 configuration
90 * in PCI_EXP_LNKCTL_ASPMC is saved by pci_save_pcie_state().
92 if (!l1ss)
93 return;
95 save_state = pci_find_saved_ext_cap(pdev, PCI_EXT_CAP_ID_L1SS);
96 if (!save_state)
97 return;
99 cap = &save_state->cap.data[0];
100 pci_read_config_dword(pdev, l1ss + PCI_L1SS_CTL2, cap++);
101 pci_read_config_dword(pdev, l1ss + PCI_L1SS_CTL1, cap++);
104 void pci_restore_aspm_l1ss_state(struct pci_dev *pdev)
106 struct pci_cap_saved_state *pl_save_state, *cl_save_state;
107 struct pci_dev *parent = pdev->bus->self;
108 u32 *cap, pl_ctl1, pl_ctl2, pl_l1_2_enable;
109 u32 cl_ctl1, cl_ctl2, cl_l1_2_enable;
110 u16 clnkctl, plnkctl;
113 * In case BIOS enabled L1.2 when resuming, we need to disable it first
114 * on the downstream component before the upstream. So, don't attempt to
115 * restore either until we are at the downstream component.
117 if (pcie_downstream_port(pdev) || !parent)
118 return;
120 if (!pdev->l1ss || !parent->l1ss)
121 return;
123 cl_save_state = pci_find_saved_ext_cap(pdev, PCI_EXT_CAP_ID_L1SS);
124 pl_save_state = pci_find_saved_ext_cap(parent, PCI_EXT_CAP_ID_L1SS);
125 if (!cl_save_state || !pl_save_state)
126 return;
128 cap = &cl_save_state->cap.data[0];
129 cl_ctl2 = *cap++;
130 cl_ctl1 = *cap;
131 cap = &pl_save_state->cap.data[0];
132 pl_ctl2 = *cap++;
133 pl_ctl1 = *cap;
135 /* Make sure L0s/L1 are disabled before updating L1SS config */
136 pcie_capability_read_word(pdev, PCI_EXP_LNKCTL, &clnkctl);
137 pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &plnkctl);
138 if (FIELD_GET(PCI_EXP_LNKCTL_ASPMC, clnkctl) ||
139 FIELD_GET(PCI_EXP_LNKCTL_ASPMC, plnkctl)) {
140 pcie_capability_write_word(pdev, PCI_EXP_LNKCTL,
141 clnkctl & ~PCI_EXP_LNKCTL_ASPMC);
142 pcie_capability_write_word(parent, PCI_EXP_LNKCTL,
143 plnkctl & ~PCI_EXP_LNKCTL_ASPMC);
147 * Disable L1.2 on this downstream endpoint device first, followed
148 * by the upstream
150 pci_clear_and_set_config_dword(pdev, pdev->l1ss + PCI_L1SS_CTL1,
151 PCI_L1SS_CTL1_L1_2_MASK, 0);
152 pci_clear_and_set_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
153 PCI_L1SS_CTL1_L1_2_MASK, 0);
156 * In addition, Common_Mode_Restore_Time and LTR_L1.2_THRESHOLD
157 * in PCI_L1SS_CTL1 must be programmed *before* setting the L1.2
158 * enable bits, even though they're all in PCI_L1SS_CTL1.
160 pl_l1_2_enable = pl_ctl1 & PCI_L1SS_CTL1_L1_2_MASK;
161 pl_ctl1 &= ~PCI_L1SS_CTL1_L1_2_MASK;
162 cl_l1_2_enable = cl_ctl1 & PCI_L1SS_CTL1_L1_2_MASK;
163 cl_ctl1 &= ~PCI_L1SS_CTL1_L1_2_MASK;
165 /* Write back without enables first (above we cleared them in ctl1) */
166 pci_write_config_dword(parent, parent->l1ss + PCI_L1SS_CTL2, pl_ctl2);
167 pci_write_config_dword(pdev, pdev->l1ss + PCI_L1SS_CTL2, cl_ctl2);
168 pci_write_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1, pl_ctl1);
169 pci_write_config_dword(pdev, pdev->l1ss + PCI_L1SS_CTL1, cl_ctl1);
171 /* Then write back the enables */
172 if (pl_l1_2_enable || cl_l1_2_enable) {
173 pci_write_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
174 pl_ctl1 | pl_l1_2_enable);
175 pci_write_config_dword(pdev, pdev->l1ss + PCI_L1SS_CTL1,
176 cl_ctl1 | cl_l1_2_enable);
179 /* Restore L0s/L1 if they were enabled */
180 if (FIELD_GET(PCI_EXP_LNKCTL_ASPMC, clnkctl) ||
181 FIELD_GET(PCI_EXP_LNKCTL_ASPMC, plnkctl)) {
182 pcie_capability_write_word(parent, PCI_EXP_LNKCTL, plnkctl);
183 pcie_capability_write_word(pdev, PCI_EXP_LNKCTL, clnkctl);
187 #ifdef CONFIG_PCIEASPM
189 #ifdef MODULE_PARAM_PREFIX
190 #undef MODULE_PARAM_PREFIX
191 #endif
192 #define MODULE_PARAM_PREFIX "pcie_aspm."
194 /* Note: these are not register definitions */
195 #define PCIE_LINK_STATE_L0S_UP BIT(0) /* Upstream direction L0s state */
196 #define PCIE_LINK_STATE_L0S_DW BIT(1) /* Downstream direction L0s state */
197 static_assert(PCIE_LINK_STATE_L0S == (PCIE_LINK_STATE_L0S_UP | PCIE_LINK_STATE_L0S_DW));
199 #define PCIE_LINK_STATE_L1_SS_PCIPM (PCIE_LINK_STATE_L1_1_PCIPM |\
200 PCIE_LINK_STATE_L1_2_PCIPM)
201 #define PCIE_LINK_STATE_L1_2_MASK (PCIE_LINK_STATE_L1_2 |\
202 PCIE_LINK_STATE_L1_2_PCIPM)
203 #define PCIE_LINK_STATE_L1SS (PCIE_LINK_STATE_L1_1 |\
204 PCIE_LINK_STATE_L1_1_PCIPM |\
205 PCIE_LINK_STATE_L1_2_MASK)
207 struct pcie_link_state {
208 struct pci_dev *pdev; /* Upstream component of the Link */
209 struct pci_dev *downstream; /* Downstream component, function 0 */
210 struct pcie_link_state *root; /* pointer to the root port link */
211 struct pcie_link_state *parent; /* pointer to the parent Link state */
212 struct list_head sibling; /* node in link_list */
214 /* ASPM state */
215 u32 aspm_support:7; /* Supported ASPM state */
216 u32 aspm_enabled:7; /* Enabled ASPM state */
217 u32 aspm_capable:7; /* Capable ASPM state with latency */
218 u32 aspm_default:7; /* Default ASPM state by BIOS */
219 u32 aspm_disable:7; /* Disabled ASPM state */
221 /* Clock PM state */
222 u32 clkpm_capable:1; /* Clock PM capable? */
223 u32 clkpm_enabled:1; /* Current Clock PM state */
224 u32 clkpm_default:1; /* Default Clock PM state by BIOS */
225 u32 clkpm_disable:1; /* Clock PM disabled */
228 static int aspm_disabled, aspm_force;
229 static bool aspm_support_enabled = true;
230 static DEFINE_MUTEX(aspm_lock);
231 static LIST_HEAD(link_list);
233 #define POLICY_DEFAULT 0 /* BIOS default setting */
234 #define POLICY_PERFORMANCE 1 /* high performance */
235 #define POLICY_POWERSAVE 2 /* high power saving */
236 #define POLICY_POWER_SUPERSAVE 3 /* possibly even more power saving */
238 #ifdef CONFIG_PCIEASPM_PERFORMANCE
239 static int aspm_policy = POLICY_PERFORMANCE;
240 #elif defined CONFIG_PCIEASPM_POWERSAVE
241 static int aspm_policy = POLICY_POWERSAVE;
242 #elif defined CONFIG_PCIEASPM_POWER_SUPERSAVE
243 static int aspm_policy = POLICY_POWER_SUPERSAVE;
244 #else
245 static int aspm_policy;
246 #endif
248 static const char *policy_str[] = {
249 [POLICY_DEFAULT] = "default",
250 [POLICY_PERFORMANCE] = "performance",
251 [POLICY_POWERSAVE] = "powersave",
252 [POLICY_POWER_SUPERSAVE] = "powersupersave"
256 * The L1 PM substate capability is only implemented in function 0 in a
257 * multi function device.
259 static struct pci_dev *pci_function_0(struct pci_bus *linkbus)
261 struct pci_dev *child;
263 list_for_each_entry(child, &linkbus->devices, bus_list)
264 if (PCI_FUNC(child->devfn) == 0)
265 return child;
266 return NULL;
269 static int policy_to_aspm_state(struct pcie_link_state *link)
271 switch (aspm_policy) {
272 case POLICY_PERFORMANCE:
273 /* Disable ASPM and Clock PM */
274 return 0;
275 case POLICY_POWERSAVE:
276 /* Enable ASPM L0s/L1 */
277 return PCIE_LINK_STATE_L0S | PCIE_LINK_STATE_L1;
278 case POLICY_POWER_SUPERSAVE:
279 /* Enable Everything */
280 return PCIE_LINK_STATE_ASPM_ALL;
281 case POLICY_DEFAULT:
282 return link->aspm_default;
284 return 0;
287 static int policy_to_clkpm_state(struct pcie_link_state *link)
289 switch (aspm_policy) {
290 case POLICY_PERFORMANCE:
291 /* Disable ASPM and Clock PM */
292 return 0;
293 case POLICY_POWERSAVE:
294 case POLICY_POWER_SUPERSAVE:
295 /* Enable Clock PM */
296 return 1;
297 case POLICY_DEFAULT:
298 return link->clkpm_default;
300 return 0;
303 static void pci_update_aspm_saved_state(struct pci_dev *dev)
305 struct pci_cap_saved_state *save_state;
306 u16 *cap, lnkctl, aspm_ctl;
308 save_state = pci_find_saved_cap(dev, PCI_CAP_ID_EXP);
309 if (!save_state)
310 return;
312 pcie_capability_read_word(dev, PCI_EXP_LNKCTL, &lnkctl);
315 * Update ASPM and CLKREQ bits of LNKCTL in save_state. We only
316 * write PCI_EXP_LNKCTL_CCC during enumeration, so it shouldn't
317 * change after being captured in save_state.
319 aspm_ctl = lnkctl & (PCI_EXP_LNKCTL_ASPMC | PCI_EXP_LNKCTL_CLKREQ_EN);
320 lnkctl &= ~(PCI_EXP_LNKCTL_ASPMC | PCI_EXP_LNKCTL_CLKREQ_EN);
322 /* Depends on pci_save_pcie_state(): cap[1] is LNKCTL */
323 cap = (u16 *)&save_state->cap.data[0];
324 cap[1] = lnkctl | aspm_ctl;
327 static void pcie_set_clkpm_nocheck(struct pcie_link_state *link, int enable)
329 struct pci_dev *child;
330 struct pci_bus *linkbus = link->pdev->subordinate;
331 u32 val = enable ? PCI_EXP_LNKCTL_CLKREQ_EN : 0;
333 list_for_each_entry(child, &linkbus->devices, bus_list) {
334 pcie_capability_clear_and_set_word(child, PCI_EXP_LNKCTL,
335 PCI_EXP_LNKCTL_CLKREQ_EN,
336 val);
337 pci_update_aspm_saved_state(child);
339 link->clkpm_enabled = !!enable;
342 static void pcie_set_clkpm(struct pcie_link_state *link, int enable)
345 * Don't enable Clock PM if the link is not Clock PM capable
346 * or Clock PM is disabled
348 if (!link->clkpm_capable || link->clkpm_disable)
349 enable = 0;
350 /* Need nothing if the specified equals to current state */
351 if (link->clkpm_enabled == enable)
352 return;
353 pcie_set_clkpm_nocheck(link, enable);
356 static void pcie_clkpm_cap_init(struct pcie_link_state *link, int blacklist)
358 int capable = 1, enabled = 1;
359 u32 reg32;
360 u16 reg16;
361 struct pci_dev *child;
362 struct pci_bus *linkbus = link->pdev->subordinate;
364 /* All functions should have the same cap and state, take the worst */
365 list_for_each_entry(child, &linkbus->devices, bus_list) {
366 pcie_capability_read_dword(child, PCI_EXP_LNKCAP, &reg32);
367 if (!(reg32 & PCI_EXP_LNKCAP_CLKPM)) {
368 capable = 0;
369 enabled = 0;
370 break;
372 pcie_capability_read_word(child, PCI_EXP_LNKCTL, &reg16);
373 if (!(reg16 & PCI_EXP_LNKCTL_CLKREQ_EN))
374 enabled = 0;
376 link->clkpm_enabled = enabled;
377 link->clkpm_default = enabled;
378 link->clkpm_capable = capable;
379 link->clkpm_disable = blacklist ? 1 : 0;
383 * pcie_aspm_configure_common_clock: check if the 2 ends of a link
384 * could use common clock. If they are, configure them to use the
385 * common clock. That will reduce the ASPM state exit latency.
387 static void pcie_aspm_configure_common_clock(struct pcie_link_state *link)
389 int same_clock = 1;
390 u16 reg16, ccc, parent_old_ccc, child_old_ccc[8];
391 struct pci_dev *child, *parent = link->pdev;
392 struct pci_bus *linkbus = parent->subordinate;
394 * All functions of a slot should have the same Slot Clock
395 * Configuration, so just check one function
397 child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
398 BUG_ON(!pci_is_pcie(child));
400 /* Check downstream component if bit Slot Clock Configuration is 1 */
401 pcie_capability_read_word(child, PCI_EXP_LNKSTA, &reg16);
402 if (!(reg16 & PCI_EXP_LNKSTA_SLC))
403 same_clock = 0;
405 /* Check upstream component if bit Slot Clock Configuration is 1 */
406 pcie_capability_read_word(parent, PCI_EXP_LNKSTA, &reg16);
407 if (!(reg16 & PCI_EXP_LNKSTA_SLC))
408 same_clock = 0;
410 /* Port might be already in common clock mode */
411 pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &reg16);
412 parent_old_ccc = reg16 & PCI_EXP_LNKCTL_CCC;
413 if (same_clock && (reg16 & PCI_EXP_LNKCTL_CCC)) {
414 bool consistent = true;
416 list_for_each_entry(child, &linkbus->devices, bus_list) {
417 pcie_capability_read_word(child, PCI_EXP_LNKCTL,
418 &reg16);
419 if (!(reg16 & PCI_EXP_LNKCTL_CCC)) {
420 consistent = false;
421 break;
424 if (consistent)
425 return;
426 pci_info(parent, "ASPM: current common clock configuration is inconsistent, reconfiguring\n");
429 ccc = same_clock ? PCI_EXP_LNKCTL_CCC : 0;
430 /* Configure downstream component, all functions */
431 list_for_each_entry(child, &linkbus->devices, bus_list) {
432 pcie_capability_read_word(child, PCI_EXP_LNKCTL, &reg16);
433 child_old_ccc[PCI_FUNC(child->devfn)] = reg16 & PCI_EXP_LNKCTL_CCC;
434 pcie_capability_clear_and_set_word(child, PCI_EXP_LNKCTL,
435 PCI_EXP_LNKCTL_CCC, ccc);
438 /* Configure upstream component */
439 pcie_capability_clear_and_set_word(parent, PCI_EXP_LNKCTL,
440 PCI_EXP_LNKCTL_CCC, ccc);
442 if (pcie_retrain_link(link->pdev, true)) {
444 /* Training failed. Restore common clock configurations */
445 pci_err(parent, "ASPM: Could not configure common clock\n");
446 list_for_each_entry(child, &linkbus->devices, bus_list)
447 pcie_capability_clear_and_set_word(child, PCI_EXP_LNKCTL,
448 PCI_EXP_LNKCTL_CCC,
449 child_old_ccc[PCI_FUNC(child->devfn)]);
450 pcie_capability_clear_and_set_word(parent, PCI_EXP_LNKCTL,
451 PCI_EXP_LNKCTL_CCC, parent_old_ccc);
455 /* Convert L0s latency encoding to ns */
456 static u32 calc_l0s_latency(u32 lnkcap)
458 u32 encoding = FIELD_GET(PCI_EXP_LNKCAP_L0SEL, lnkcap);
460 if (encoding == 0x7)
461 return 5 * NSEC_PER_USEC; /* > 4us */
462 return (64 << encoding);
465 /* Convert L0s acceptable latency encoding to ns */
466 static u32 calc_l0s_acceptable(u32 encoding)
468 if (encoding == 0x7)
469 return U32_MAX;
470 return (64 << encoding);
473 /* Convert L1 latency encoding to ns */
474 static u32 calc_l1_latency(u32 lnkcap)
476 u32 encoding = FIELD_GET(PCI_EXP_LNKCAP_L1EL, lnkcap);
478 if (encoding == 0x7)
479 return 65 * NSEC_PER_USEC; /* > 64us */
480 return NSEC_PER_USEC << encoding;
483 /* Convert L1 acceptable latency encoding to ns */
484 static u32 calc_l1_acceptable(u32 encoding)
486 if (encoding == 0x7)
487 return U32_MAX;
488 return NSEC_PER_USEC << encoding;
491 /* Convert L1SS T_pwr encoding to usec */
492 static u32 calc_l12_pwron(struct pci_dev *pdev, u32 scale, u32 val)
494 switch (scale) {
495 case 0:
496 return val * 2;
497 case 1:
498 return val * 10;
499 case 2:
500 return val * 100;
502 pci_err(pdev, "%s: Invalid T_PwrOn scale: %u\n", __func__, scale);
503 return 0;
507 * Encode an LTR_L1.2_THRESHOLD value for the L1 PM Substates Control 1
508 * register. Ports enter L1.2 when the most recent LTR value is greater
509 * than or equal to LTR_L1.2_THRESHOLD, so we round up to make sure we
510 * don't enter L1.2 too aggressively.
512 * See PCIe r6.0, sec 5.5.1, 6.18, 7.8.3.3.
514 static void encode_l12_threshold(u32 threshold_us, u32 *scale, u32 *value)
516 u64 threshold_ns = (u64)threshold_us * NSEC_PER_USEC;
519 * LTR_L1.2_THRESHOLD_Value ("value") is a 10-bit field with max
520 * value of 0x3ff.
522 if (threshold_ns <= 1 * FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE)) {
523 *scale = 0; /* Value times 1ns */
524 *value = threshold_ns;
525 } else if (threshold_ns <= 32 * FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE)) {
526 *scale = 1; /* Value times 32ns */
527 *value = roundup(threshold_ns, 32) / 32;
528 } else if (threshold_ns <= 1024 * FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE)) {
529 *scale = 2; /* Value times 1024ns */
530 *value = roundup(threshold_ns, 1024) / 1024;
531 } else if (threshold_ns <= 32768 * FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE)) {
532 *scale = 3; /* Value times 32768ns */
533 *value = roundup(threshold_ns, 32768) / 32768;
534 } else if (threshold_ns <= 1048576 * FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE)) {
535 *scale = 4; /* Value times 1048576ns */
536 *value = roundup(threshold_ns, 1048576) / 1048576;
537 } else if (threshold_ns <= (u64)33554432 * FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE)) {
538 *scale = 5; /* Value times 33554432ns */
539 *value = roundup(threshold_ns, 33554432) / 33554432;
540 } else {
541 *scale = 5;
542 *value = FIELD_MAX(PCI_L1SS_CTL1_LTR_L12_TH_VALUE);
546 static void pcie_aspm_check_latency(struct pci_dev *endpoint)
548 u32 latency, encoding, lnkcap_up, lnkcap_dw;
549 u32 l1_switch_latency = 0, latency_up_l0s;
550 u32 latency_up_l1, latency_dw_l0s, latency_dw_l1;
551 u32 acceptable_l0s, acceptable_l1;
552 struct pcie_link_state *link;
554 /* Device not in D0 doesn't need latency check */
555 if ((endpoint->current_state != PCI_D0) &&
556 (endpoint->current_state != PCI_UNKNOWN))
557 return;
559 link = endpoint->bus->self->link_state;
561 /* Calculate endpoint L0s acceptable latency */
562 encoding = FIELD_GET(PCI_EXP_DEVCAP_L0S, endpoint->devcap);
563 acceptable_l0s = calc_l0s_acceptable(encoding);
565 /* Calculate endpoint L1 acceptable latency */
566 encoding = FIELD_GET(PCI_EXP_DEVCAP_L1, endpoint->devcap);
567 acceptable_l1 = calc_l1_acceptable(encoding);
569 while (link) {
570 struct pci_dev *dev = pci_function_0(link->pdev->subordinate);
572 /* Read direction exit latencies */
573 pcie_capability_read_dword(link->pdev, PCI_EXP_LNKCAP,
574 &lnkcap_up);
575 pcie_capability_read_dword(dev, PCI_EXP_LNKCAP,
576 &lnkcap_dw);
577 latency_up_l0s = calc_l0s_latency(lnkcap_up);
578 latency_up_l1 = calc_l1_latency(lnkcap_up);
579 latency_dw_l0s = calc_l0s_latency(lnkcap_dw);
580 latency_dw_l1 = calc_l1_latency(lnkcap_dw);
582 /* Check upstream direction L0s latency */
583 if ((link->aspm_capable & PCIE_LINK_STATE_L0S_UP) &&
584 (latency_up_l0s > acceptable_l0s))
585 link->aspm_capable &= ~PCIE_LINK_STATE_L0S_UP;
587 /* Check downstream direction L0s latency */
588 if ((link->aspm_capable & PCIE_LINK_STATE_L0S_DW) &&
589 (latency_dw_l0s > acceptable_l0s))
590 link->aspm_capable &= ~PCIE_LINK_STATE_L0S_DW;
592 * Check L1 latency.
593 * Every switch on the path to root complex need 1
594 * more microsecond for L1. Spec doesn't mention L0s.
596 * The exit latencies for L1 substates are not advertised
597 * by a device. Since the spec also doesn't mention a way
598 * to determine max latencies introduced by enabling L1
599 * substates on the components, it is not clear how to do
600 * a L1 substate exit latency check. We assume that the
601 * L1 exit latencies advertised by a device include L1
602 * substate latencies (and hence do not do any check).
604 latency = max_t(u32, latency_up_l1, latency_dw_l1);
605 if ((link->aspm_capable & PCIE_LINK_STATE_L1) &&
606 (latency + l1_switch_latency > acceptable_l1))
607 link->aspm_capable &= ~PCIE_LINK_STATE_L1;
608 l1_switch_latency += NSEC_PER_USEC;
610 link = link->parent;
614 /* Calculate L1.2 PM substate timing parameters */
615 static void aspm_calc_l12_info(struct pcie_link_state *link,
616 u32 parent_l1ss_cap, u32 child_l1ss_cap)
618 struct pci_dev *child = link->downstream, *parent = link->pdev;
619 u32 val1, val2, scale1, scale2;
620 u32 t_common_mode, t_power_on, l1_2_threshold, scale, value;
621 u32 ctl1 = 0, ctl2 = 0;
622 u32 pctl1, pctl2, cctl1, cctl2;
623 u32 pl1_2_enables, cl1_2_enables;
625 /* Choose the greater of the two Port Common_Mode_Restore_Times */
626 val1 = FIELD_GET(PCI_L1SS_CAP_CM_RESTORE_TIME, parent_l1ss_cap);
627 val2 = FIELD_GET(PCI_L1SS_CAP_CM_RESTORE_TIME, child_l1ss_cap);
628 t_common_mode = max(val1, val2);
630 /* Choose the greater of the two Port T_POWER_ON times */
631 val1 = FIELD_GET(PCI_L1SS_CAP_P_PWR_ON_VALUE, parent_l1ss_cap);
632 scale1 = FIELD_GET(PCI_L1SS_CAP_P_PWR_ON_SCALE, parent_l1ss_cap);
633 val2 = FIELD_GET(PCI_L1SS_CAP_P_PWR_ON_VALUE, child_l1ss_cap);
634 scale2 = FIELD_GET(PCI_L1SS_CAP_P_PWR_ON_SCALE, child_l1ss_cap);
636 if (calc_l12_pwron(parent, scale1, val1) >
637 calc_l12_pwron(child, scale2, val2)) {
638 ctl2 |= FIELD_PREP(PCI_L1SS_CTL2_T_PWR_ON_SCALE, scale1) |
639 FIELD_PREP(PCI_L1SS_CTL2_T_PWR_ON_VALUE, val1);
640 t_power_on = calc_l12_pwron(parent, scale1, val1);
641 } else {
642 ctl2 |= FIELD_PREP(PCI_L1SS_CTL2_T_PWR_ON_SCALE, scale2) |
643 FIELD_PREP(PCI_L1SS_CTL2_T_PWR_ON_VALUE, val2);
644 t_power_on = calc_l12_pwron(child, scale2, val2);
648 * Set LTR_L1.2_THRESHOLD to the time required to transition the
649 * Link from L0 to L1.2 and back to L0 so we enter L1.2 only if
650 * downstream devices report (via LTR) that they can tolerate at
651 * least that much latency.
653 * Based on PCIe r3.1, sec 5.5.3.3.1, Figures 5-16 and 5-17, and
654 * Table 5-11. T(POWER_OFF) is at most 2us and T(L1.2) is at
655 * least 4us.
657 l1_2_threshold = 2 + 4 + t_common_mode + t_power_on;
658 encode_l12_threshold(l1_2_threshold, &scale, &value);
659 ctl1 |= FIELD_PREP(PCI_L1SS_CTL1_CM_RESTORE_TIME, t_common_mode) |
660 FIELD_PREP(PCI_L1SS_CTL1_LTR_L12_TH_VALUE, value) |
661 FIELD_PREP(PCI_L1SS_CTL1_LTR_L12_TH_SCALE, scale);
663 /* Some broken devices only support dword access to L1 SS */
664 pci_read_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1, &pctl1);
665 pci_read_config_dword(parent, parent->l1ss + PCI_L1SS_CTL2, &pctl2);
666 pci_read_config_dword(child, child->l1ss + PCI_L1SS_CTL1, &cctl1);
667 pci_read_config_dword(child, child->l1ss + PCI_L1SS_CTL2, &cctl2);
669 if (ctl1 == pctl1 && ctl1 == cctl1 &&
670 ctl2 == pctl2 && ctl2 == cctl2)
671 return;
673 /* Disable L1.2 while updating. See PCIe r5.0, sec 5.5.4, 7.8.3.3 */
674 pl1_2_enables = pctl1 & PCI_L1SS_CTL1_L1_2_MASK;
675 cl1_2_enables = cctl1 & PCI_L1SS_CTL1_L1_2_MASK;
677 if (pl1_2_enables || cl1_2_enables) {
678 pci_clear_and_set_config_dword(child,
679 child->l1ss + PCI_L1SS_CTL1,
680 PCI_L1SS_CTL1_L1_2_MASK, 0);
681 pci_clear_and_set_config_dword(parent,
682 parent->l1ss + PCI_L1SS_CTL1,
683 PCI_L1SS_CTL1_L1_2_MASK, 0);
686 /* Program T_POWER_ON times in both ports */
687 pci_write_config_dword(parent, parent->l1ss + PCI_L1SS_CTL2, ctl2);
688 pci_write_config_dword(child, child->l1ss + PCI_L1SS_CTL2, ctl2);
690 /* Program Common_Mode_Restore_Time in upstream device */
691 pci_clear_and_set_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
692 PCI_L1SS_CTL1_CM_RESTORE_TIME, ctl1);
694 /* Program LTR_L1.2_THRESHOLD time in both ports */
695 pci_clear_and_set_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
696 PCI_L1SS_CTL1_LTR_L12_TH_VALUE |
697 PCI_L1SS_CTL1_LTR_L12_TH_SCALE,
698 ctl1);
699 pci_clear_and_set_config_dword(child, child->l1ss + PCI_L1SS_CTL1,
700 PCI_L1SS_CTL1_LTR_L12_TH_VALUE |
701 PCI_L1SS_CTL1_LTR_L12_TH_SCALE,
702 ctl1);
704 if (pl1_2_enables || cl1_2_enables) {
705 pci_clear_and_set_config_dword(parent,
706 parent->l1ss + PCI_L1SS_CTL1, 0,
707 pl1_2_enables);
708 pci_clear_and_set_config_dword(child,
709 child->l1ss + PCI_L1SS_CTL1, 0,
710 cl1_2_enables);
714 static void aspm_l1ss_init(struct pcie_link_state *link)
716 struct pci_dev *child = link->downstream, *parent = link->pdev;
717 u32 parent_l1ss_cap, child_l1ss_cap;
718 u32 parent_l1ss_ctl1 = 0, child_l1ss_ctl1 = 0;
720 if (!parent->l1ss || !child->l1ss)
721 return;
723 /* Setup L1 substate */
724 pci_read_config_dword(parent, parent->l1ss + PCI_L1SS_CAP,
725 &parent_l1ss_cap);
726 pci_read_config_dword(child, child->l1ss + PCI_L1SS_CAP,
727 &child_l1ss_cap);
729 if (!(parent_l1ss_cap & PCI_L1SS_CAP_L1_PM_SS))
730 parent_l1ss_cap = 0;
731 if (!(child_l1ss_cap & PCI_L1SS_CAP_L1_PM_SS))
732 child_l1ss_cap = 0;
735 * If we don't have LTR for the entire path from the Root Complex
736 * to this device, we can't use ASPM L1.2 because it relies on the
737 * LTR_L1.2_THRESHOLD. See PCIe r4.0, secs 5.5.4, 6.18.
739 if (!child->ltr_path)
740 child_l1ss_cap &= ~PCI_L1SS_CAP_ASPM_L1_2;
742 if (parent_l1ss_cap & child_l1ss_cap & PCI_L1SS_CAP_ASPM_L1_1)
743 link->aspm_support |= PCIE_LINK_STATE_L1_1;
744 if (parent_l1ss_cap & child_l1ss_cap & PCI_L1SS_CAP_ASPM_L1_2)
745 link->aspm_support |= PCIE_LINK_STATE_L1_2;
746 if (parent_l1ss_cap & child_l1ss_cap & PCI_L1SS_CAP_PCIPM_L1_1)
747 link->aspm_support |= PCIE_LINK_STATE_L1_1_PCIPM;
748 if (parent_l1ss_cap & child_l1ss_cap & PCI_L1SS_CAP_PCIPM_L1_2)
749 link->aspm_support |= PCIE_LINK_STATE_L1_2_PCIPM;
751 if (parent_l1ss_cap)
752 pci_read_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
753 &parent_l1ss_ctl1);
754 if (child_l1ss_cap)
755 pci_read_config_dword(child, child->l1ss + PCI_L1SS_CTL1,
756 &child_l1ss_ctl1);
758 if (parent_l1ss_ctl1 & child_l1ss_ctl1 & PCI_L1SS_CTL1_ASPM_L1_1)
759 link->aspm_enabled |= PCIE_LINK_STATE_L1_1;
760 if (parent_l1ss_ctl1 & child_l1ss_ctl1 & PCI_L1SS_CTL1_ASPM_L1_2)
761 link->aspm_enabled |= PCIE_LINK_STATE_L1_2;
762 if (parent_l1ss_ctl1 & child_l1ss_ctl1 & PCI_L1SS_CTL1_PCIPM_L1_1)
763 link->aspm_enabled |= PCIE_LINK_STATE_L1_1_PCIPM;
764 if (parent_l1ss_ctl1 & child_l1ss_ctl1 & PCI_L1SS_CTL1_PCIPM_L1_2)
765 link->aspm_enabled |= PCIE_LINK_STATE_L1_2_PCIPM;
767 if (link->aspm_support & PCIE_LINK_STATE_L1_2_MASK)
768 aspm_calc_l12_info(link, parent_l1ss_cap, child_l1ss_cap);
771 static void pcie_aspm_cap_init(struct pcie_link_state *link, int blacklist)
773 struct pci_dev *child = link->downstream, *parent = link->pdev;
774 u32 parent_lnkcap, child_lnkcap;
775 u16 parent_lnkctl, child_lnkctl;
776 struct pci_bus *linkbus = parent->subordinate;
778 if (blacklist) {
779 /* Set enabled/disable so that we will disable ASPM later */
780 link->aspm_enabled = PCIE_LINK_STATE_ASPM_ALL;
781 link->aspm_disable = PCIE_LINK_STATE_ASPM_ALL;
782 return;
786 * If ASPM not supported, don't mess with the clocks and link,
787 * bail out now.
789 pcie_capability_read_dword(parent, PCI_EXP_LNKCAP, &parent_lnkcap);
790 pcie_capability_read_dword(child, PCI_EXP_LNKCAP, &child_lnkcap);
791 if (!(parent_lnkcap & child_lnkcap & PCI_EXP_LNKCAP_ASPMS))
792 return;
794 /* Configure common clock before checking latencies */
795 pcie_aspm_configure_common_clock(link);
798 * Re-read upstream/downstream components' register state after
799 * clock configuration. L0s & L1 exit latencies in the otherwise
800 * read-only Link Capabilities may change depending on common clock
801 * configuration (PCIe r5.0, sec 7.5.3.6).
803 pcie_capability_read_dword(parent, PCI_EXP_LNKCAP, &parent_lnkcap);
804 pcie_capability_read_dword(child, PCI_EXP_LNKCAP, &child_lnkcap);
805 pcie_capability_read_word(parent, PCI_EXP_LNKCTL, &parent_lnkctl);
806 pcie_capability_read_word(child, PCI_EXP_LNKCTL, &child_lnkctl);
808 /* Disable L0s/L1 before updating L1SS config */
809 if (FIELD_GET(PCI_EXP_LNKCTL_ASPMC, child_lnkctl) ||
810 FIELD_GET(PCI_EXP_LNKCTL_ASPMC, parent_lnkctl)) {
811 pcie_capability_write_word(child, PCI_EXP_LNKCTL,
812 child_lnkctl & ~PCI_EXP_LNKCTL_ASPMC);
813 pcie_capability_write_word(parent, PCI_EXP_LNKCTL,
814 parent_lnkctl & ~PCI_EXP_LNKCTL_ASPMC);
818 * Setup L0s state
820 * Note that we must not enable L0s in either direction on a
821 * given link unless components on both sides of the link each
822 * support L0s.
824 if (parent_lnkcap & child_lnkcap & PCI_EXP_LNKCAP_ASPM_L0S)
825 link->aspm_support |= PCIE_LINK_STATE_L0S;
827 if (child_lnkctl & PCI_EXP_LNKCTL_ASPM_L0S)
828 link->aspm_enabled |= PCIE_LINK_STATE_L0S_UP;
829 if (parent_lnkctl & PCI_EXP_LNKCTL_ASPM_L0S)
830 link->aspm_enabled |= PCIE_LINK_STATE_L0S_DW;
832 /* Setup L1 state */
833 if (parent_lnkcap & child_lnkcap & PCI_EXP_LNKCAP_ASPM_L1)
834 link->aspm_support |= PCIE_LINK_STATE_L1;
836 if (parent_lnkctl & child_lnkctl & PCI_EXP_LNKCTL_ASPM_L1)
837 link->aspm_enabled |= PCIE_LINK_STATE_L1;
839 aspm_l1ss_init(link);
841 /* Restore L0s/L1 if they were enabled */
842 if (FIELD_GET(PCI_EXP_LNKCTL_ASPMC, child_lnkctl) ||
843 FIELD_GET(PCI_EXP_LNKCTL_ASPMC, parent_lnkctl)) {
844 pcie_capability_write_word(parent, PCI_EXP_LNKCTL, parent_lnkctl);
845 pcie_capability_write_word(child, PCI_EXP_LNKCTL, child_lnkctl);
848 /* Save default state */
849 link->aspm_default = link->aspm_enabled;
851 /* Setup initial capable state. Will be updated later */
852 link->aspm_capable = link->aspm_support;
854 /* Get and check endpoint acceptable latencies */
855 list_for_each_entry(child, &linkbus->devices, bus_list) {
856 if (pci_pcie_type(child) != PCI_EXP_TYPE_ENDPOINT &&
857 pci_pcie_type(child) != PCI_EXP_TYPE_LEG_END)
858 continue;
860 pcie_aspm_check_latency(child);
864 /* Configure the ASPM L1 substates. Caller must disable L1 first. */
865 static void pcie_config_aspm_l1ss(struct pcie_link_state *link, u32 state)
867 u32 val;
868 struct pci_dev *child = link->downstream, *parent = link->pdev;
870 val = 0;
871 if (state & PCIE_LINK_STATE_L1_1)
872 val |= PCI_L1SS_CTL1_ASPM_L1_1;
873 if (state & PCIE_LINK_STATE_L1_2)
874 val |= PCI_L1SS_CTL1_ASPM_L1_2;
875 if (state & PCIE_LINK_STATE_L1_1_PCIPM)
876 val |= PCI_L1SS_CTL1_PCIPM_L1_1;
877 if (state & PCIE_LINK_STATE_L1_2_PCIPM)
878 val |= PCI_L1SS_CTL1_PCIPM_L1_2;
881 * PCIe r6.2, sec 5.5.4, rules for enabling L1 PM Substates:
882 * - Clear L1.x enable bits at child first, then at parent
883 * - Set L1.x enable bits at parent first, then at child
884 * - ASPM/PCIPM L1.2 must be disabled while programming timing
885 * parameters
888 /* Disable all L1 substates */
889 pci_clear_and_set_config_dword(child, child->l1ss + PCI_L1SS_CTL1,
890 PCI_L1SS_CTL1_L1SS_MASK, 0);
891 pci_clear_and_set_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
892 PCI_L1SS_CTL1_L1SS_MASK, 0);
894 /* Enable what we need to enable */
895 pci_clear_and_set_config_dword(parent, parent->l1ss + PCI_L1SS_CTL1,
896 PCI_L1SS_CTL1_L1SS_MASK, val);
897 pci_clear_and_set_config_dword(child, child->l1ss + PCI_L1SS_CTL1,
898 PCI_L1SS_CTL1_L1SS_MASK, val);
901 static void pcie_config_aspm_dev(struct pci_dev *pdev, u32 val)
903 pcie_capability_clear_and_set_word(pdev, PCI_EXP_LNKCTL,
904 PCI_EXP_LNKCTL_ASPMC, val);
907 static void pcie_config_aspm_link(struct pcie_link_state *link, u32 state)
909 u32 upstream = 0, dwstream = 0;
910 struct pci_dev *child = link->downstream, *parent = link->pdev;
911 struct pci_bus *linkbus = parent->subordinate;
913 /* Enable only the states that were not explicitly disabled */
914 state &= (link->aspm_capable & ~link->aspm_disable);
916 /* Can't enable any substates if L1 is not enabled */
917 if (!(state & PCIE_LINK_STATE_L1))
918 state &= ~PCIE_LINK_STATE_L1SS;
920 /* Spec says both ports must be in D0 before enabling PCI PM substates*/
921 if (parent->current_state != PCI_D0 || child->current_state != PCI_D0) {
922 state &= ~PCIE_LINK_STATE_L1_SS_PCIPM;
923 state |= (link->aspm_enabled & PCIE_LINK_STATE_L1_SS_PCIPM);
926 /* Nothing to do if the link is already in the requested state */
927 if (link->aspm_enabled == state)
928 return;
929 /* Convert ASPM state to upstream/downstream ASPM register state */
930 if (state & PCIE_LINK_STATE_L0S_UP)
931 dwstream |= PCI_EXP_LNKCTL_ASPM_L0S;
932 if (state & PCIE_LINK_STATE_L0S_DW)
933 upstream |= PCI_EXP_LNKCTL_ASPM_L0S;
934 if (state & PCIE_LINK_STATE_L1) {
935 upstream |= PCI_EXP_LNKCTL_ASPM_L1;
936 dwstream |= PCI_EXP_LNKCTL_ASPM_L1;
940 * Per PCIe r6.2, sec 5.5.4, setting either or both of the enable
941 * bits for ASPM L1 PM Substates must be done while ASPM L1 is
942 * disabled. Disable L1 here and apply new configuration after L1SS
943 * configuration has been completed.
945 * Per sec 7.5.3.7, when disabling ASPM L1, software must disable
946 * it in the Downstream component prior to disabling it in the
947 * Upstream component, and ASPM L1 must be enabled in the Upstream
948 * component prior to enabling it in the Downstream component.
950 * Sec 7.5.3.7 also recommends programming the same ASPM Control
951 * value for all functions of a multi-function device.
953 list_for_each_entry(child, &linkbus->devices, bus_list)
954 pcie_config_aspm_dev(child, 0);
955 pcie_config_aspm_dev(parent, 0);
957 if (link->aspm_capable & PCIE_LINK_STATE_L1SS)
958 pcie_config_aspm_l1ss(link, state);
960 pcie_config_aspm_dev(parent, upstream);
961 list_for_each_entry(child, &linkbus->devices, bus_list)
962 pcie_config_aspm_dev(child, dwstream);
964 link->aspm_enabled = state;
966 /* Update latest ASPM configuration in saved context */
967 pci_save_aspm_l1ss_state(link->downstream);
968 pci_update_aspm_saved_state(link->downstream);
969 pci_save_aspm_l1ss_state(parent);
970 pci_update_aspm_saved_state(parent);
973 static void pcie_config_aspm_path(struct pcie_link_state *link)
975 while (link) {
976 pcie_config_aspm_link(link, policy_to_aspm_state(link));
977 link = link->parent;
981 static void free_link_state(struct pcie_link_state *link)
983 link->pdev->link_state = NULL;
984 kfree(link);
987 static int pcie_aspm_sanity_check(struct pci_dev *pdev)
989 struct pci_dev *child;
990 u32 reg32;
993 * Some functions in a slot might not all be PCIe functions,
994 * very strange. Disable ASPM for the whole slot
996 list_for_each_entry(child, &pdev->subordinate->devices, bus_list) {
997 if (!pci_is_pcie(child))
998 return -EINVAL;
1001 * If ASPM is disabled then we're not going to change
1002 * the BIOS state. It's safe to continue even if it's a
1003 * pre-1.1 device
1006 if (aspm_disabled)
1007 continue;
1010 * Disable ASPM for pre-1.1 PCIe device, we follow MS to use
1011 * RBER bit to determine if a function is 1.1 version device
1013 pcie_capability_read_dword(child, PCI_EXP_DEVCAP, &reg32);
1014 if (!(reg32 & PCI_EXP_DEVCAP_RBER) && !aspm_force) {
1015 pci_info(child, "disabling ASPM on pre-1.1 PCIe device. You can enable it with 'pcie_aspm=force'\n");
1016 return -EINVAL;
1019 return 0;
1022 static struct pcie_link_state *alloc_pcie_link_state(struct pci_dev *pdev)
1024 struct pcie_link_state *link;
1026 link = kzalloc(sizeof(*link), GFP_KERNEL);
1027 if (!link)
1028 return NULL;
1030 INIT_LIST_HEAD(&link->sibling);
1031 link->pdev = pdev;
1032 link->downstream = pci_function_0(pdev->subordinate);
1035 * Root Ports and PCI/PCI-X to PCIe Bridges are roots of PCIe
1036 * hierarchies. Note that some PCIe host implementations omit
1037 * the root ports entirely, in which case a downstream port on
1038 * a switch may become the root of the link state chain for all
1039 * its subordinate endpoints.
1041 if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT ||
1042 pci_pcie_type(pdev) == PCI_EXP_TYPE_PCIE_BRIDGE ||
1043 !pdev->bus->parent->self) {
1044 link->root = link;
1045 } else {
1046 struct pcie_link_state *parent;
1048 parent = pdev->bus->parent->self->link_state;
1049 if (!parent) {
1050 kfree(link);
1051 return NULL;
1054 link->parent = parent;
1055 link->root = link->parent->root;
1058 list_add(&link->sibling, &link_list);
1059 pdev->link_state = link;
1060 return link;
1063 static void pcie_aspm_update_sysfs_visibility(struct pci_dev *pdev)
1065 struct pci_dev *child;
1067 list_for_each_entry(child, &pdev->subordinate->devices, bus_list)
1068 sysfs_update_group(&child->dev.kobj, &aspm_ctrl_attr_group);
1072 * pcie_aspm_init_link_state: Initiate PCI express link state.
1073 * It is called after the pcie and its children devices are scanned.
1074 * @pdev: the root port or switch downstream port
1076 void pcie_aspm_init_link_state(struct pci_dev *pdev)
1078 struct pcie_link_state *link;
1079 int blacklist = !!pcie_aspm_sanity_check(pdev);
1081 if (!aspm_support_enabled)
1082 return;
1084 if (pdev->link_state)
1085 return;
1088 * We allocate pcie_link_state for the component on the upstream
1089 * end of a Link, so there's nothing to do unless this device is
1090 * downstream port.
1092 if (!pcie_downstream_port(pdev))
1093 return;
1095 /* VIA has a strange chipset, root port is under a bridge */
1096 if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT &&
1097 pdev->bus->self)
1098 return;
1100 down_read(&pci_bus_sem);
1101 if (list_empty(&pdev->subordinate->devices))
1102 goto out;
1104 mutex_lock(&aspm_lock);
1105 link = alloc_pcie_link_state(pdev);
1106 if (!link)
1107 goto unlock;
1109 * Setup initial ASPM state. Note that we need to configure
1110 * upstream links also because capable state of them can be
1111 * update through pcie_aspm_cap_init().
1113 pcie_aspm_cap_init(link, blacklist);
1115 /* Setup initial Clock PM state */
1116 pcie_clkpm_cap_init(link, blacklist);
1119 * At this stage drivers haven't had an opportunity to change the
1120 * link policy setting. Enabling ASPM on broken hardware can cripple
1121 * it even before the driver has had a chance to disable ASPM, so
1122 * default to a safe level right now. If we're enabling ASPM beyond
1123 * the BIOS's expectation, we'll do so once pci_enable_device() is
1124 * called.
1126 if (aspm_policy != POLICY_POWERSAVE &&
1127 aspm_policy != POLICY_POWER_SUPERSAVE) {
1128 pcie_config_aspm_path(link);
1129 pcie_set_clkpm(link, policy_to_clkpm_state(link));
1132 pcie_aspm_update_sysfs_visibility(pdev);
1134 unlock:
1135 mutex_unlock(&aspm_lock);
1136 out:
1137 up_read(&pci_bus_sem);
1140 void pci_bridge_reconfigure_ltr(struct pci_dev *pdev)
1142 struct pci_dev *bridge;
1143 u32 ctl;
1145 bridge = pci_upstream_bridge(pdev);
1146 if (bridge && bridge->ltr_path) {
1147 pcie_capability_read_dword(bridge, PCI_EXP_DEVCTL2, &ctl);
1148 if (!(ctl & PCI_EXP_DEVCTL2_LTR_EN)) {
1149 pci_dbg(bridge, "re-enabling LTR\n");
1150 pcie_capability_set_word(bridge, PCI_EXP_DEVCTL2,
1151 PCI_EXP_DEVCTL2_LTR_EN);
1156 void pci_configure_ltr(struct pci_dev *pdev)
1158 struct pci_host_bridge *host = pci_find_host_bridge(pdev->bus);
1159 struct pci_dev *bridge;
1160 u32 cap, ctl;
1162 if (!pci_is_pcie(pdev))
1163 return;
1165 pcie_capability_read_dword(pdev, PCI_EXP_DEVCAP2, &cap);
1166 if (!(cap & PCI_EXP_DEVCAP2_LTR))
1167 return;
1169 pcie_capability_read_dword(pdev, PCI_EXP_DEVCTL2, &ctl);
1170 if (ctl & PCI_EXP_DEVCTL2_LTR_EN) {
1171 if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT) {
1172 pdev->ltr_path = 1;
1173 return;
1176 bridge = pci_upstream_bridge(pdev);
1177 if (bridge && bridge->ltr_path)
1178 pdev->ltr_path = 1;
1180 return;
1183 if (!host->native_ltr)
1184 return;
1187 * Software must not enable LTR in an Endpoint unless the Root
1188 * Complex and all intermediate Switches indicate support for LTR.
1189 * PCIe r4.0, sec 6.18.
1191 if (pci_pcie_type(pdev) == PCI_EXP_TYPE_ROOT_PORT) {
1192 pcie_capability_set_word(pdev, PCI_EXP_DEVCTL2,
1193 PCI_EXP_DEVCTL2_LTR_EN);
1194 pdev->ltr_path = 1;
1195 return;
1199 * If we're configuring a hot-added device, LTR was likely
1200 * disabled in the upstream bridge, so re-enable it before enabling
1201 * it in the new device.
1203 bridge = pci_upstream_bridge(pdev);
1204 if (bridge && bridge->ltr_path) {
1205 pci_bridge_reconfigure_ltr(pdev);
1206 pcie_capability_set_word(pdev, PCI_EXP_DEVCTL2,
1207 PCI_EXP_DEVCTL2_LTR_EN);
1208 pdev->ltr_path = 1;
1212 /* Recheck latencies and update aspm_capable for links under the root */
1213 static void pcie_update_aspm_capable(struct pcie_link_state *root)
1215 struct pcie_link_state *link;
1216 BUG_ON(root->parent);
1217 list_for_each_entry(link, &link_list, sibling) {
1218 if (link->root != root)
1219 continue;
1220 link->aspm_capable = link->aspm_support;
1222 list_for_each_entry(link, &link_list, sibling) {
1223 struct pci_dev *child;
1224 struct pci_bus *linkbus = link->pdev->subordinate;
1225 if (link->root != root)
1226 continue;
1227 list_for_each_entry(child, &linkbus->devices, bus_list) {
1228 if ((pci_pcie_type(child) != PCI_EXP_TYPE_ENDPOINT) &&
1229 (pci_pcie_type(child) != PCI_EXP_TYPE_LEG_END))
1230 continue;
1231 pcie_aspm_check_latency(child);
1236 /* @pdev: the endpoint device */
1237 void pcie_aspm_exit_link_state(struct pci_dev *pdev)
1239 struct pci_dev *parent = pdev->bus->self;
1240 struct pcie_link_state *link, *root, *parent_link;
1242 if (!parent || !parent->link_state)
1243 return;
1245 down_read(&pci_bus_sem);
1246 mutex_lock(&aspm_lock);
1248 link = parent->link_state;
1249 root = link->root;
1250 parent_link = link->parent;
1253 * link->downstream is a pointer to the pci_dev of function 0. If
1254 * we remove that function, the pci_dev is about to be deallocated,
1255 * so we can't use link->downstream again. Free the link state to
1256 * avoid this.
1258 * If we're removing a non-0 function, it's possible we could
1259 * retain the link state, but PCIe r6.0, sec 7.5.3.7, recommends
1260 * programming the same ASPM Control value for all functions of
1261 * multi-function devices, so disable ASPM for all of them.
1263 pcie_config_aspm_link(link, 0);
1264 list_del(&link->sibling);
1265 free_link_state(link);
1267 /* Recheck latencies and configure upstream links */
1268 if (parent_link) {
1269 pcie_update_aspm_capable(root);
1270 pcie_config_aspm_path(parent_link);
1273 mutex_unlock(&aspm_lock);
1274 up_read(&pci_bus_sem);
1278 * @pdev: the root port or switch downstream port
1279 * @locked: whether pci_bus_sem is held
1281 void pcie_aspm_pm_state_change(struct pci_dev *pdev, bool locked)
1283 struct pcie_link_state *link = pdev->link_state;
1285 if (aspm_disabled || !link)
1286 return;
1288 * Devices changed PM state, we should recheck if latency
1289 * meets all functions' requirement
1291 if (!locked)
1292 down_read(&pci_bus_sem);
1293 mutex_lock(&aspm_lock);
1294 pcie_update_aspm_capable(link->root);
1295 pcie_config_aspm_path(link);
1296 mutex_unlock(&aspm_lock);
1297 if (!locked)
1298 up_read(&pci_bus_sem);
1301 void pcie_aspm_powersave_config_link(struct pci_dev *pdev)
1303 struct pcie_link_state *link = pdev->link_state;
1305 if (aspm_disabled || !link)
1306 return;
1308 if (aspm_policy != POLICY_POWERSAVE &&
1309 aspm_policy != POLICY_POWER_SUPERSAVE)
1310 return;
1312 down_read(&pci_bus_sem);
1313 mutex_lock(&aspm_lock);
1314 pcie_config_aspm_path(link);
1315 pcie_set_clkpm(link, policy_to_clkpm_state(link));
1316 mutex_unlock(&aspm_lock);
1317 up_read(&pci_bus_sem);
1320 static struct pcie_link_state *pcie_aspm_get_link(struct pci_dev *pdev)
1322 struct pci_dev *bridge;
1324 if (!pci_is_pcie(pdev))
1325 return NULL;
1327 bridge = pci_upstream_bridge(pdev);
1328 if (!bridge || !pci_is_pcie(bridge))
1329 return NULL;
1331 return bridge->link_state;
1334 static u8 pci_calc_aspm_disable_mask(int state)
1336 state &= ~PCIE_LINK_STATE_CLKPM;
1338 /* L1 PM substates require L1 */
1339 if (state & PCIE_LINK_STATE_L1)
1340 state |= PCIE_LINK_STATE_L1SS;
1342 return state;
1345 static u8 pci_calc_aspm_enable_mask(int state)
1347 state &= ~PCIE_LINK_STATE_CLKPM;
1349 /* L1 PM substates require L1 */
1350 if (state & PCIE_LINK_STATE_L1SS)
1351 state |= PCIE_LINK_STATE_L1;
1353 return state;
1356 static int __pci_disable_link_state(struct pci_dev *pdev, int state, bool locked)
1358 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1360 if (!link)
1361 return -EINVAL;
1363 * A driver requested that ASPM be disabled on this device, but
1364 * if we don't have permission to manage ASPM (e.g., on ACPI
1365 * systems we have to observe the FADT ACPI_FADT_NO_ASPM bit and
1366 * the _OSC method), we can't honor that request. Windows has
1367 * a similar mechanism using "PciASPMOptOut", which is also
1368 * ignored in this situation.
1370 if (aspm_disabled) {
1371 pci_warn(pdev, "can't disable ASPM; OS doesn't have ASPM control\n");
1372 return -EPERM;
1375 if (!locked)
1376 down_read(&pci_bus_sem);
1377 mutex_lock(&aspm_lock);
1378 link->aspm_disable |= pci_calc_aspm_disable_mask(state);
1379 pcie_config_aspm_link(link, policy_to_aspm_state(link));
1381 if (state & PCIE_LINK_STATE_CLKPM)
1382 link->clkpm_disable = 1;
1383 pcie_set_clkpm(link, policy_to_clkpm_state(link));
1384 mutex_unlock(&aspm_lock);
1385 if (!locked)
1386 up_read(&pci_bus_sem);
1388 return 0;
1391 int pci_disable_link_state_locked(struct pci_dev *pdev, int state)
1393 lockdep_assert_held_read(&pci_bus_sem);
1395 return __pci_disable_link_state(pdev, state, true);
1397 EXPORT_SYMBOL(pci_disable_link_state_locked);
1400 * pci_disable_link_state - Disable device's link state, so the link will
1401 * never enter specific states. Note that if the BIOS didn't grant ASPM
1402 * control to the OS, this does nothing because we can't touch the LNKCTL
1403 * register. Returns 0 or a negative errno.
1405 * @pdev: PCI device
1406 * @state: ASPM link state to disable
1408 int pci_disable_link_state(struct pci_dev *pdev, int state)
1410 return __pci_disable_link_state(pdev, state, false);
1412 EXPORT_SYMBOL(pci_disable_link_state);
1414 static int __pci_enable_link_state(struct pci_dev *pdev, int state, bool locked)
1416 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1418 if (!link)
1419 return -EINVAL;
1421 * A driver requested that ASPM be enabled on this device, but
1422 * if we don't have permission to manage ASPM (e.g., on ACPI
1423 * systems we have to observe the FADT ACPI_FADT_NO_ASPM bit and
1424 * the _OSC method), we can't honor that request.
1426 if (aspm_disabled) {
1427 pci_warn(pdev, "can't override BIOS ASPM; OS doesn't have ASPM control\n");
1428 return -EPERM;
1431 if (!locked)
1432 down_read(&pci_bus_sem);
1433 mutex_lock(&aspm_lock);
1434 link->aspm_default = pci_calc_aspm_enable_mask(state);
1435 pcie_config_aspm_link(link, policy_to_aspm_state(link));
1437 link->clkpm_default = (state & PCIE_LINK_STATE_CLKPM) ? 1 : 0;
1438 pcie_set_clkpm(link, policy_to_clkpm_state(link));
1439 mutex_unlock(&aspm_lock);
1440 if (!locked)
1441 up_read(&pci_bus_sem);
1443 return 0;
1447 * pci_enable_link_state - Clear and set the default device link state so that
1448 * the link may be allowed to enter the specified states. Note that if the
1449 * BIOS didn't grant ASPM control to the OS, this does nothing because we can't
1450 * touch the LNKCTL register. Also note that this does not enable states
1451 * disabled by pci_disable_link_state(). Return 0 or a negative errno.
1453 * Note: Ensure devices are in D0 before enabling PCI-PM L1 PM Substates, per
1454 * PCIe r6.0, sec 5.5.4.
1456 * @pdev: PCI device
1457 * @state: Mask of ASPM link states to enable
1459 int pci_enable_link_state(struct pci_dev *pdev, int state)
1461 return __pci_enable_link_state(pdev, state, false);
1463 EXPORT_SYMBOL(pci_enable_link_state);
1466 * pci_enable_link_state_locked - Clear and set the default device link state
1467 * so that the link may be allowed to enter the specified states. Note that if
1468 * the BIOS didn't grant ASPM control to the OS, this does nothing because we
1469 * can't touch the LNKCTL register. Also note that this does not enable states
1470 * disabled by pci_disable_link_state(). Return 0 or a negative errno.
1472 * Note: Ensure devices are in D0 before enabling PCI-PM L1 PM Substates, per
1473 * PCIe r6.0, sec 5.5.4.
1475 * @pdev: PCI device
1476 * @state: Mask of ASPM link states to enable
1478 * Context: Caller holds pci_bus_sem read lock.
1480 int pci_enable_link_state_locked(struct pci_dev *pdev, int state)
1482 lockdep_assert_held_read(&pci_bus_sem);
1484 return __pci_enable_link_state(pdev, state, true);
1486 EXPORT_SYMBOL(pci_enable_link_state_locked);
1488 static int pcie_aspm_set_policy(const char *val,
1489 const struct kernel_param *kp)
1491 int i;
1492 struct pcie_link_state *link;
1494 if (aspm_disabled)
1495 return -EPERM;
1496 i = sysfs_match_string(policy_str, val);
1497 if (i < 0)
1498 return i;
1499 if (i == aspm_policy)
1500 return 0;
1502 down_read(&pci_bus_sem);
1503 mutex_lock(&aspm_lock);
1504 aspm_policy = i;
1505 list_for_each_entry(link, &link_list, sibling) {
1506 pcie_config_aspm_link(link, policy_to_aspm_state(link));
1507 pcie_set_clkpm(link, policy_to_clkpm_state(link));
1509 mutex_unlock(&aspm_lock);
1510 up_read(&pci_bus_sem);
1511 return 0;
1514 static int pcie_aspm_get_policy(char *buffer, const struct kernel_param *kp)
1516 int i, cnt = 0;
1517 for (i = 0; i < ARRAY_SIZE(policy_str); i++)
1518 if (i == aspm_policy)
1519 cnt += sprintf(buffer + cnt, "[%s] ", policy_str[i]);
1520 else
1521 cnt += sprintf(buffer + cnt, "%s ", policy_str[i]);
1522 cnt += sprintf(buffer + cnt, "\n");
1523 return cnt;
1526 module_param_call(policy, pcie_aspm_set_policy, pcie_aspm_get_policy,
1527 NULL, 0644);
1530 * pcie_aspm_enabled - Check if PCIe ASPM has been enabled for a device.
1531 * @pdev: Target device.
1533 * Relies on the upstream bridge's link_state being valid. The link_state
1534 * is deallocated only when the last child of the bridge (i.e., @pdev or a
1535 * sibling) is removed, and the caller should be holding a reference to
1536 * @pdev, so this should be safe.
1538 bool pcie_aspm_enabled(struct pci_dev *pdev)
1540 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1542 if (!link)
1543 return false;
1545 return link->aspm_enabled;
1547 EXPORT_SYMBOL_GPL(pcie_aspm_enabled);
1549 static ssize_t aspm_attr_show_common(struct device *dev,
1550 struct device_attribute *attr,
1551 char *buf, u8 state)
1553 struct pci_dev *pdev = to_pci_dev(dev);
1554 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1556 return sysfs_emit(buf, "%d\n", (link->aspm_enabled & state) ? 1 : 0);
1559 static ssize_t aspm_attr_store_common(struct device *dev,
1560 struct device_attribute *attr,
1561 const char *buf, size_t len, u8 state)
1563 struct pci_dev *pdev = to_pci_dev(dev);
1564 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1565 bool state_enable;
1567 if (kstrtobool(buf, &state_enable) < 0)
1568 return -EINVAL;
1570 down_read(&pci_bus_sem);
1571 mutex_lock(&aspm_lock);
1573 if (state_enable) {
1574 link->aspm_disable &= ~state;
1575 /* need to enable L1 for substates */
1576 if (state & PCIE_LINK_STATE_L1SS)
1577 link->aspm_disable &= ~PCIE_LINK_STATE_L1;
1578 } else {
1579 link->aspm_disable |= state;
1580 if (state & PCIE_LINK_STATE_L1)
1581 link->aspm_disable |= PCIE_LINK_STATE_L1SS;
1584 pcie_config_aspm_link(link, policy_to_aspm_state(link));
1586 mutex_unlock(&aspm_lock);
1587 up_read(&pci_bus_sem);
1589 return len;
1592 #define ASPM_ATTR(_f, _s) \
1593 static ssize_t _f##_show(struct device *dev, \
1594 struct device_attribute *attr, char *buf) \
1595 { return aspm_attr_show_common(dev, attr, buf, PCIE_LINK_STATE_##_s); } \
1597 static ssize_t _f##_store(struct device *dev, \
1598 struct device_attribute *attr, \
1599 const char *buf, size_t len) \
1600 { return aspm_attr_store_common(dev, attr, buf, len, PCIE_LINK_STATE_##_s); }
1602 ASPM_ATTR(l0s_aspm, L0S)
1603 ASPM_ATTR(l1_aspm, L1)
1604 ASPM_ATTR(l1_1_aspm, L1_1)
1605 ASPM_ATTR(l1_2_aspm, L1_2)
1606 ASPM_ATTR(l1_1_pcipm, L1_1_PCIPM)
1607 ASPM_ATTR(l1_2_pcipm, L1_2_PCIPM)
1609 static ssize_t clkpm_show(struct device *dev,
1610 struct device_attribute *attr, char *buf)
1612 struct pci_dev *pdev = to_pci_dev(dev);
1613 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1615 return sysfs_emit(buf, "%d\n", link->clkpm_enabled);
1618 static ssize_t clkpm_store(struct device *dev,
1619 struct device_attribute *attr,
1620 const char *buf, size_t len)
1622 struct pci_dev *pdev = to_pci_dev(dev);
1623 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1624 bool state_enable;
1626 if (kstrtobool(buf, &state_enable) < 0)
1627 return -EINVAL;
1629 down_read(&pci_bus_sem);
1630 mutex_lock(&aspm_lock);
1632 link->clkpm_disable = !state_enable;
1633 pcie_set_clkpm(link, policy_to_clkpm_state(link));
1635 mutex_unlock(&aspm_lock);
1636 up_read(&pci_bus_sem);
1638 return len;
1641 static DEVICE_ATTR_RW(clkpm);
1642 static DEVICE_ATTR_RW(l0s_aspm);
1643 static DEVICE_ATTR_RW(l1_aspm);
1644 static DEVICE_ATTR_RW(l1_1_aspm);
1645 static DEVICE_ATTR_RW(l1_2_aspm);
1646 static DEVICE_ATTR_RW(l1_1_pcipm);
1647 static DEVICE_ATTR_RW(l1_2_pcipm);
1649 static struct attribute *aspm_ctrl_attrs[] = {
1650 &dev_attr_clkpm.attr,
1651 &dev_attr_l0s_aspm.attr,
1652 &dev_attr_l1_aspm.attr,
1653 &dev_attr_l1_1_aspm.attr,
1654 &dev_attr_l1_2_aspm.attr,
1655 &dev_attr_l1_1_pcipm.attr,
1656 &dev_attr_l1_2_pcipm.attr,
1657 NULL
1660 static umode_t aspm_ctrl_attrs_are_visible(struct kobject *kobj,
1661 struct attribute *a, int n)
1663 struct device *dev = kobj_to_dev(kobj);
1664 struct pci_dev *pdev = to_pci_dev(dev);
1665 struct pcie_link_state *link = pcie_aspm_get_link(pdev);
1666 static const u8 aspm_state_map[] = {
1667 PCIE_LINK_STATE_L0S,
1668 PCIE_LINK_STATE_L1,
1669 PCIE_LINK_STATE_L1_1,
1670 PCIE_LINK_STATE_L1_2,
1671 PCIE_LINK_STATE_L1_1_PCIPM,
1672 PCIE_LINK_STATE_L1_2_PCIPM,
1675 if (aspm_disabled || !link)
1676 return 0;
1678 if (n == 0)
1679 return link->clkpm_capable ? a->mode : 0;
1681 return link->aspm_capable & aspm_state_map[n - 1] ? a->mode : 0;
1684 const struct attribute_group aspm_ctrl_attr_group = {
1685 .name = "link",
1686 .attrs = aspm_ctrl_attrs,
1687 .is_visible = aspm_ctrl_attrs_are_visible,
1690 static int __init pcie_aspm_disable(char *str)
1692 if (!strcmp(str, "off")) {
1693 aspm_policy = POLICY_DEFAULT;
1694 aspm_disabled = 1;
1695 aspm_support_enabled = false;
1696 pr_info("PCIe ASPM is disabled\n");
1697 } else if (!strcmp(str, "force")) {
1698 aspm_force = 1;
1699 pr_info("PCIe ASPM is forcibly enabled\n");
1701 return 1;
1704 __setup("pcie_aspm=", pcie_aspm_disable);
1706 void pcie_no_aspm(void)
1709 * Disabling ASPM is intended to prevent the kernel from modifying
1710 * existing hardware state, not to clear existing state. To that end:
1711 * (a) set policy to POLICY_DEFAULT in order to avoid changing state
1712 * (b) prevent userspace from changing policy
1714 if (!aspm_force) {
1715 aspm_policy = POLICY_DEFAULT;
1716 aspm_disabled = 1;
1720 bool pcie_aspm_support_enabled(void)
1722 return aspm_support_enabled;
1725 #endif /* CONFIG_PCIEASPM */