summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorRafael J. Wysocki <rafael.j.wysocki@intel.com>2022-05-05 21:09:12 +0300
committerBjorn Helgaas <bhelgaas@google.com>2022-05-05 22:19:49 +0300
commit0b59193548e63957101aae5e4fc47151fce4a629 (patch)
tree635e04ecde026ce2023d8412c7905388425bc06f
parent6d8c016a55aca612802fc325eb0e659d1c5f255d (diff)
downloadlinux-0b59193548e63957101aae5e4fc47151fce4a629.tar.xz
PCI/PM: Do not call pci_update_current_state() from pci_power_up()
Notice that calling pci_update_current_state() from pci_power_up() is redundant and may be harmful in some cases. First, if the device is in a low-power state before pci_power_up() gets called for it and platform_pci_set_power_state() successfully changes its power state to D0, pci_update_current_state() will update current_state to reflect that and pci_power_up() will return success right away without restoring the device's BARs or reconfiguring ASPM which may be necessary. This is arguably incorrect and definitely inconsistent with the case when platform_pci_set_power_state() returns an error (for example, because the device is not power-manageable by the platform firmware). Second, current_state should not be overwritten until the decision whether or not to restore the device's BARs is made, because that decision generally depends on its value. Again, calling pci_update_current_state() in pci_power_up() is not consistent with this observation. Next, pci_power_up() attempts to read from the device's PCI_PM_CTRL register regardless of the current_state value unless it is PCI_D0, including the case when pci_update_current_state() sets current_state to PCI_D3cold to indicate that the device is not accessible. If the register read is not successful, current_state will be set to PCI_D3cold anyway, so that pci_update_current_state() action is redundant. Further, if pci_update_current_state() reads the device's PCI_PM_CTRL register, pci_power_up() will repeat that read going forward and it is not necessary to update current_state in the meantime. Finally, if pm_cap is not set (in which case the PCI_PM_CTRL register is not present), the power state of the device should be determined with the help of the platform firmware or set to D0 if that's not possible and pci_update_current_state() does not do that. Accordingly, rearrange pci_power_up() so as to address the above shortcomings. Link: https://lore.kernel.org/r/3695055.kQq0lBPeGt@kreacher Signed-off-by: Rafael J. Wysocki <rafael.j.wysocki@intel.com> Signed-off-by: Bjorn Helgaas <bhelgaas@google.com>
-rw-r--r--drivers/pci/pci.c49
1 files changed, 28 insertions, 21 deletions
diff --git a/drivers/pci/pci.c b/drivers/pci/pci.c
index bc4af86da3f9..a5b93f85377a 100644
--- a/drivers/pci/pci.c
+++ b/drivers/pci/pci.c
@@ -1192,23 +1192,24 @@ static int pci_dev_wait(struct pci_dev *dev, char *reset_type, int timeout)
*/
int pci_power_up(struct pci_dev *dev)
{
- bool need_restore = false;
+ bool need_restore;
+ pci_power_t state;
u16 pmcsr;
- int ret;
- ret = platform_pci_set_power_state(dev, PCI_D0);
- if (!ret) {
- pci_update_current_state(dev, PCI_D0);
- } else if (!dev->pm_cap) { /* Fall back to PCI_D0 */
- dev->current_state = PCI_D0;
- return 0;
- }
+ platform_pci_set_power_state(dev, PCI_D0);
- if (dev->current_state == PCI_D0)
- return 0;
+ if (!dev->pm_cap) {
+ state = platform_pci_get_power_state(dev);
+ if (state == PCI_UNKNOWN)
+ dev->current_state = PCI_D0;
+ else
+ dev->current_state = state;
+
+ if (state == PCI_D0)
+ return 0;
- if (!dev->pm_cap)
return -EIO;
+ }
pci_read_config_word(dev, dev->pm_cap + PCI_PM_CTRL, &pmcsr);
if (PCI_POSSIBLE_ERROR(pmcsr)) {
@@ -1218,26 +1219,31 @@ int pci_power_up(struct pci_dev *dev)
return -EIO;
}
+ state = pmcsr & PCI_PM_CTRL_STATE_MASK;
+
+ need_restore = (state == PCI_D3hot || dev->current_state >= PCI_D3hot) &&
+ !(pmcsr & PCI_PM_CTRL_NO_SOFT_RESET);
+
+ if (state == PCI_D0) {
+ dev->current_state = PCI_D0;
+ goto end;
+ }
+
/*
* If we're (effectively) in D3, force entire word to 0. This doesn't
* affect PME_Status, disables PME_En, and sets PowerState to 0.
*/
- if (dev->current_state >= PCI_D3hot) {
- if ((pmcsr & PCI_PM_CTRL_STATE_MASK) == PCI_D3hot &&
- !(pmcsr & PCI_PM_CTRL_NO_SOFT_RESET))
- need_restore = true;
-
+ if (state == PCI_D3hot)
pmcsr = 0;
- } else {
+ else
pmcsr &= ~PCI_PM_CTRL_STATE_MASK;
- }
pci_write_config_word(dev, dev->pm_cap + PCI_PM_CTRL, pmcsr);
/* Mandatory transition delays; see PCI PM 1.2. */
- if (dev->current_state == PCI_D3hot)
+ if (state == PCI_D3hot)
pci_dev_d3_sleep(dev);
- else if (dev->current_state == PCI_D2)
+ else if (state == PCI_D2)
udelay(PCI_PM_D2_DELAY);
pci_read_config_word(dev, dev->pm_cap + PCI_PM_CTRL, &pmcsr);
@@ -1246,6 +1252,7 @@ int pci_power_up(struct pci_dev *dev)
pci_info_ratelimited(dev, "Refused to change power state from %s to D0\n",
pci_power_name(dev->current_state));
+end:
/*
* According to section 5.4.1 of the "PCI BUS POWER MANAGEMENT
* INTERFACE SPECIFICATION, REV. 1.2", a device transitioning