1 // SPDX-License-Identifier: GPL-2.0
3 * (C) Copyright 2002-2004, 2007 Greg Kroah-Hartman <greg@kroah.com>
4 * (C) Copyright 2007 Novell Inc.
8 #include <linux/module.h>
9 #include <linux/init.h>
10 #include <linux/device.h>
11 #include <linux/mempolicy.h>
12 #include <linux/string.h>
13 #include <linux/slab.h>
14 #include <linux/sched.h>
15 #include <linux/sched/isolation.h>
16 #include <linux/cpu.h>
17 #include <linux/pm_runtime.h>
18 #include <linux/suspend.h>
19 #include <linux/kexec.h>
20 #include <linux/of_device.h>
21 #include <linux/acpi.h>
22 #include <linux/dma-map-ops.h>
23 #include <linux/iommu.h>
25 #include "pcie/portdrv.h"
28 struct list_head node;
29 struct pci_device_id id;
33 * pci_add_dynid - add a new PCI device ID to this driver and re-probe devices
34 * @drv: target pci driver
35 * @vendor: PCI vendor ID
36 * @device: PCI device ID
37 * @subvendor: PCI subvendor ID
38 * @subdevice: PCI subdevice ID
40 * @class_mask: PCI class mask
41 * @driver_data: private driver data
43 * Adds a new dynamic PCI device ID to this driver and causes the
44 * driver to probe for all devices again. @drv must have been
45 * registered prior to calling this function.
48 * Does GFP_KERNEL allocation.
51 * 0 on success, -errno on failure.
53 int pci_add_dynid(struct pci_driver *drv,
54 unsigned int vendor, unsigned int device,
55 unsigned int subvendor, unsigned int subdevice,
56 unsigned int class, unsigned int class_mask,
57 unsigned long driver_data)
59 struct pci_dynid *dynid;
61 dynid = kzalloc(sizeof(*dynid), GFP_KERNEL);
65 dynid->id.vendor = vendor;
66 dynid->id.device = device;
67 dynid->id.subvendor = subvendor;
68 dynid->id.subdevice = subdevice;
69 dynid->id.class = class;
70 dynid->id.class_mask = class_mask;
71 dynid->id.driver_data = driver_data;
73 spin_lock(&drv->dynids.lock);
74 list_add_tail(&dynid->node, &drv->dynids.list);
75 spin_unlock(&drv->dynids.lock);
77 return driver_attach(&drv->driver);
79 EXPORT_SYMBOL_GPL(pci_add_dynid);
81 static void pci_free_dynids(struct pci_driver *drv)
83 struct pci_dynid *dynid, *n;
85 spin_lock(&drv->dynids.lock);
86 list_for_each_entry_safe(dynid, n, &drv->dynids.list, node) {
87 list_del(&dynid->node);
90 spin_unlock(&drv->dynids.lock);
94 * pci_match_id - See if a PCI device matches a given pci_id table
95 * @ids: array of PCI device ID structures to search in
96 * @dev: the PCI device structure to match against.
98 * Used by a driver to check whether a PCI device is in its list of
99 * supported devices. Returns the matching pci_device_id structure or
100 * %NULL if there is no match.
102 * Deprecated; don't use this as it will not catch any dynamic IDs
103 * that a driver might want to check for.
105 const struct pci_device_id *pci_match_id(const struct pci_device_id *ids,
109 while (ids->vendor || ids->subvendor || ids->class_mask) {
110 if (pci_match_one_device(ids, dev))
117 EXPORT_SYMBOL(pci_match_id);
119 static const struct pci_device_id pci_device_id_any = {
120 .vendor = PCI_ANY_ID,
121 .device = PCI_ANY_ID,
122 .subvendor = PCI_ANY_ID,
123 .subdevice = PCI_ANY_ID,
127 * pci_match_device - See if a device matches a driver's list of IDs
128 * @drv: the PCI driver to match against
129 * @dev: the PCI device structure to match against
131 * Used by a driver to check whether a PCI device is in its list of
132 * supported devices or in the dynids list, which may have been augmented
133 * via the sysfs "new_id" file. Returns the matching pci_device_id
134 * structure or %NULL if there is no match.
136 static const struct pci_device_id *pci_match_device(struct pci_driver *drv,
139 struct pci_dynid *dynid;
140 const struct pci_device_id *found_id = NULL, *ids;
142 /* When driver_override is set, only bind to the matching driver */
143 if (dev->driver_override && strcmp(dev->driver_override, drv->name))
146 /* Look at the dynamic ids first, before the static ones */
147 spin_lock(&drv->dynids.lock);
148 list_for_each_entry(dynid, &drv->dynids.list, node) {
149 if (pci_match_one_device(&dynid->id, dev)) {
150 found_id = &dynid->id;
154 spin_unlock(&drv->dynids.lock);
159 for (ids = drv->id_table; (found_id = pci_match_id(ids, dev));
160 ids = found_id + 1) {
162 * The match table is split based on driver_override.
163 * In case override_only was set, enforce driver_override
166 if (found_id->override_only) {
167 if (dev->driver_override)
174 /* driver_override will always match, send a dummy id */
175 if (dev->driver_override)
176 return &pci_device_id_any;
181 * new_id_store - sysfs frontend to pci_add_dynid()
182 * @driver: target device driver
183 * @buf: buffer for scanning device ID data
186 * Allow PCI IDs to be added to an existing driver via sysfs.
188 static ssize_t new_id_store(struct device_driver *driver, const char *buf,
191 struct pci_driver *pdrv = to_pci_driver(driver);
192 const struct pci_device_id *ids = pdrv->id_table;
193 u32 vendor, device, subvendor = PCI_ANY_ID,
194 subdevice = PCI_ANY_ID, class = 0, class_mask = 0;
195 unsigned long driver_data = 0;
199 fields = sscanf(buf, "%x %x %x %x %x %x %lx",
200 &vendor, &device, &subvendor, &subdevice,
201 &class, &class_mask, &driver_data);
206 struct pci_dev *pdev = kzalloc(sizeof(*pdev), GFP_KERNEL);
210 pdev->vendor = vendor;
211 pdev->device = device;
212 pdev->subsystem_vendor = subvendor;
213 pdev->subsystem_device = subdevice;
216 if (pci_match_device(pdrv, pdev))
225 /* Only accept driver_data values that match an existing id_table
229 while (ids->vendor || ids->subvendor || ids->class_mask) {
230 if (driver_data == ids->driver_data) {
236 if (retval) /* No match */
240 retval = pci_add_dynid(pdrv, vendor, device, subvendor, subdevice,
241 class, class_mask, driver_data);
246 static DRIVER_ATTR_WO(new_id);
249 * remove_id_store - remove a PCI device ID from this driver
250 * @driver: target device driver
251 * @buf: buffer for scanning device ID data
254 * Removes a dynamic PCI device ID from this driver.
256 static ssize_t remove_id_store(struct device_driver *driver, const char *buf,
259 struct pci_dynid *dynid, *n;
260 struct pci_driver *pdrv = to_pci_driver(driver);
261 u32 vendor, device, subvendor = PCI_ANY_ID,
262 subdevice = PCI_ANY_ID, class = 0, class_mask = 0;
264 size_t retval = -ENODEV;
266 fields = sscanf(buf, "%x %x %x %x %x %x",
267 &vendor, &device, &subvendor, &subdevice,
268 &class, &class_mask);
272 spin_lock(&pdrv->dynids.lock);
273 list_for_each_entry_safe(dynid, n, &pdrv->dynids.list, node) {
274 struct pci_device_id *id = &dynid->id;
275 if ((id->vendor == vendor) &&
276 (id->device == device) &&
277 (subvendor == PCI_ANY_ID || id->subvendor == subvendor) &&
278 (subdevice == PCI_ANY_ID || id->subdevice == subdevice) &&
279 !((id->class ^ class) & class_mask)) {
280 list_del(&dynid->node);
286 spin_unlock(&pdrv->dynids.lock);
290 static DRIVER_ATTR_WO(remove_id);
292 static struct attribute *pci_drv_attrs[] = {
293 &driver_attr_new_id.attr,
294 &driver_attr_remove_id.attr,
297 ATTRIBUTE_GROUPS(pci_drv);
299 struct drv_dev_and_id {
300 struct pci_driver *drv;
302 const struct pci_device_id *id;
305 static long local_pci_probe(void *_ddi)
307 struct drv_dev_and_id *ddi = _ddi;
308 struct pci_dev *pci_dev = ddi->dev;
309 struct pci_driver *pci_drv = ddi->drv;
310 struct device *dev = &pci_dev->dev;
314 * Unbound PCI devices are always put in D0, regardless of
315 * runtime PM status. During probe, the device is set to
316 * active and the usage count is incremented. If the driver
317 * supports runtime PM, it should call pm_runtime_put_noidle(),
318 * or any other runtime PM helper function decrementing the usage
319 * count, in its probe routine and pm_runtime_get_noresume() in
320 * its remove routine.
322 pm_runtime_get_sync(dev);
323 pci_dev->driver = pci_drv;
324 rc = pci_drv->probe(pci_dev, ddi->id);
328 pci_dev->driver = NULL;
329 pm_runtime_put_sync(dev);
333 * Probe function should return < 0 for failure, 0 for success.
334 * Treat values > 0 as success, but warn.
336 pci_warn(pci_dev, "Driver probe function unexpectedly returned %d\n",
341 static bool pci_physfn_is_probed(struct pci_dev *dev)
343 #ifdef CONFIG_PCI_IOV
344 return dev->is_virtfn && dev->physfn->is_probed;
350 static int pci_call_probe(struct pci_driver *drv, struct pci_dev *dev,
351 const struct pci_device_id *id)
353 int error, node, cpu;
354 struct drv_dev_and_id ddi = { drv, dev, id };
357 * Execute driver initialization on node where the device is
358 * attached. This way the driver likely allocates its local memory
361 node = dev_to_node(&dev->dev);
364 cpu_hotplug_disable();
367 * Prevent nesting work_on_cpu() for the case where a Virtual Function
368 * device is probed from work_on_cpu() of the Physical device.
370 if (node < 0 || node >= MAX_NUMNODES || !node_online(node) ||
371 pci_physfn_is_probed(dev)) {
374 cpumask_var_t wq_domain_mask;
376 if (!zalloc_cpumask_var(&wq_domain_mask, GFP_KERNEL)) {
380 cpumask_and(wq_domain_mask,
381 housekeeping_cpumask(HK_TYPE_WQ),
382 housekeeping_cpumask(HK_TYPE_DOMAIN));
384 cpu = cpumask_any_and(cpumask_of_node(node),
386 free_cpumask_var(wq_domain_mask);
389 if (cpu < nr_cpu_ids)
390 error = work_on_cpu(cpu, local_pci_probe, &ddi);
392 error = local_pci_probe(&ddi);
395 cpu_hotplug_enable();
400 * __pci_device_probe - check if a driver wants to claim a specific PCI device
401 * @drv: driver to call to check if it wants the PCI device
402 * @pci_dev: PCI device being probed
404 * returns 0 on success, else error.
405 * side-effect: pci_dev->driver is set to drv when drv claims pci_dev.
407 static int __pci_device_probe(struct pci_driver *drv, struct pci_dev *pci_dev)
409 const struct pci_device_id *id;
415 id = pci_match_device(drv, pci_dev);
417 error = pci_call_probe(drv, pci_dev, id);
422 int __weak pcibios_alloc_irq(struct pci_dev *dev)
427 void __weak pcibios_free_irq(struct pci_dev *dev)
431 #ifdef CONFIG_PCI_IOV
432 static inline bool pci_device_can_probe(struct pci_dev *pdev)
434 return (!pdev->is_virtfn || pdev->physfn->sriov->drivers_autoprobe ||
435 pdev->driver_override);
438 static inline bool pci_device_can_probe(struct pci_dev *pdev)
444 static int pci_device_probe(struct device *dev)
447 struct pci_dev *pci_dev = to_pci_dev(dev);
448 struct pci_driver *drv = to_pci_driver(dev->driver);
450 if (!pci_device_can_probe(pci_dev))
453 pci_assign_irq(pci_dev);
455 error = pcibios_alloc_irq(pci_dev);
459 pci_dev_get(pci_dev);
460 error = __pci_device_probe(drv, pci_dev);
462 pcibios_free_irq(pci_dev);
463 pci_dev_put(pci_dev);
469 static void pci_device_remove(struct device *dev)
471 struct pci_dev *pci_dev = to_pci_dev(dev);
472 struct pci_driver *drv = pci_dev->driver;
475 pm_runtime_get_sync(dev);
476 drv->remove(pci_dev);
477 pm_runtime_put_noidle(dev);
479 pcibios_free_irq(pci_dev);
480 pci_dev->driver = NULL;
481 pci_iov_remove(pci_dev);
483 /* Undo the runtime PM settings in local_pci_probe() */
484 pm_runtime_put_sync(dev);
487 * If the device is still on, set the power state as "unknown",
488 * since it might change by the next time we load the driver.
490 if (pci_dev->current_state == PCI_D0)
491 pci_dev->current_state = PCI_UNKNOWN;
494 * We would love to complain here if pci_dev->is_enabled is set, that
495 * the driver should have called pci_disable_device(), but the
496 * unfortunate fact is there are too many odd BIOS and bridge setups
497 * that don't like drivers doing that all of the time.
498 * Oh well, we can dream of sane hardware when we sleep, no matter how
499 * horrible the crap we have to deal with is when we are awake...
502 pci_dev_put(pci_dev);
505 static void pci_device_shutdown(struct device *dev)
507 struct pci_dev *pci_dev = to_pci_dev(dev);
508 struct pci_driver *drv = pci_dev->driver;
510 pm_runtime_resume(dev);
512 if (drv && drv->shutdown)
513 drv->shutdown(pci_dev);
516 * If this is a kexec reboot, turn off Bus Master bit on the
517 * device to tell it to not continue to do DMA. Don't touch
518 * devices in D3cold or unknown states.
519 * If it is not a kexec reboot, firmware will hit the PCI
520 * devices with a big hammer and stop their DMA anyway.
522 if (kexec_in_progress && (pci_dev->current_state <= PCI_D3hot))
523 pci_clear_master(pci_dev);
526 #ifdef CONFIG_PM_SLEEP
528 /* Auxiliary functions used for system resume */
531 * pci_restore_standard_config - restore standard config registers of PCI device
532 * @pci_dev: PCI device to handle
534 static int pci_restore_standard_config(struct pci_dev *pci_dev)
536 pci_update_current_state(pci_dev, PCI_UNKNOWN);
538 if (pci_dev->current_state != PCI_D0) {
539 int error = pci_set_power_state(pci_dev, PCI_D0);
544 pci_restore_state(pci_dev);
545 pci_pme_restore(pci_dev);
548 #endif /* CONFIG_PM_SLEEP */
552 /* Auxiliary functions used for system resume and run-time resume */
554 static void pci_pm_default_resume(struct pci_dev *pci_dev)
556 pci_fixup_device(pci_fixup_resume, pci_dev);
557 pci_enable_wake(pci_dev, PCI_D0, false);
560 static void pci_pm_power_up_and_verify_state(struct pci_dev *pci_dev)
562 pci_power_up(pci_dev);
563 pci_update_current_state(pci_dev, PCI_D0);
566 static void pci_pm_default_resume_early(struct pci_dev *pci_dev)
568 pci_pm_power_up_and_verify_state(pci_dev);
569 pci_restore_state(pci_dev);
570 pci_pme_restore(pci_dev);
573 static void pci_pm_bridge_power_up_actions(struct pci_dev *pci_dev)
577 ret = pci_bridge_wait_for_secondary_bus(pci_dev, "resume");
580 * The downstream link failed to come up, so mark the
581 * devices below as disconnected to make sure we don't
582 * attempt to resume them.
584 pci_walk_bus(pci_dev->subordinate, pci_dev_set_disconnected,
590 * When powering on a bridge from D3cold, the whole hierarchy may be
591 * powered on into D0uninitialized state; resume them to give them a
592 * chance to suspend again.
594 pci_resume_bus(pci_dev->subordinate);
597 #endif /* CONFIG_PM */
599 #ifdef CONFIG_PM_SLEEP
602 * Default "suspend" method for devices that have no driver provided suspend,
603 * or not even a driver at all (second part).
605 static void pci_pm_set_unknown_state(struct pci_dev *pci_dev)
608 * mark its power state as "unknown", since we don't know if
609 * e.g. the BIOS will change its device state when we suspend.
611 if (pci_dev->current_state == PCI_D0)
612 pci_dev->current_state = PCI_UNKNOWN;
616 * Default "resume" method for devices that have no driver provided resume,
617 * or not even a driver at all (second part).
619 static int pci_pm_reenable_device(struct pci_dev *pci_dev)
623 /* if the device was enabled before suspend, re-enable */
624 retval = pci_reenable_device(pci_dev);
626 * if the device was busmaster before the suspend, make it busmaster
629 if (pci_dev->is_busmaster)
630 pci_set_master(pci_dev);
635 static int pci_legacy_suspend(struct device *dev, pm_message_t state)
637 struct pci_dev *pci_dev = to_pci_dev(dev);
638 struct pci_driver *drv = pci_dev->driver;
640 if (drv && drv->suspend) {
641 pci_power_t prev = pci_dev->current_state;
644 error = drv->suspend(pci_dev, state);
645 suspend_report_result(dev, drv->suspend, error);
649 if (!pci_dev->state_saved && pci_dev->current_state != PCI_D0
650 && pci_dev->current_state != PCI_UNKNOWN) {
651 pci_WARN_ONCE(pci_dev, pci_dev->current_state != prev,
652 "PCI PM: Device state not saved by %pS\n",
657 pci_fixup_device(pci_fixup_suspend, pci_dev);
662 static int pci_legacy_suspend_late(struct device *dev)
664 struct pci_dev *pci_dev = to_pci_dev(dev);
666 if (!pci_dev->state_saved)
667 pci_save_state(pci_dev);
669 pci_pm_set_unknown_state(pci_dev);
671 pci_fixup_device(pci_fixup_suspend_late, pci_dev);
676 static int pci_legacy_resume(struct device *dev)
678 struct pci_dev *pci_dev = to_pci_dev(dev);
679 struct pci_driver *drv = pci_dev->driver;
681 pci_fixup_device(pci_fixup_resume, pci_dev);
683 return drv && drv->resume ?
684 drv->resume(pci_dev) : pci_pm_reenable_device(pci_dev);
687 /* Auxiliary functions used by the new power management framework */
689 static void pci_pm_default_suspend(struct pci_dev *pci_dev)
691 /* Disable non-bridge devices without PM support */
692 if (!pci_has_subordinate(pci_dev))
693 pci_disable_enabled_device(pci_dev);
696 static bool pci_has_legacy_pm_support(struct pci_dev *pci_dev)
698 struct pci_driver *drv = pci_dev->driver;
699 bool ret = drv && (drv->suspend || drv->resume);
702 * Legacy PM support is used by default, so warn if the new framework is
703 * supported as well. Drivers are supposed to support either the
704 * former, or the latter, but not both at the same time.
706 pci_WARN(pci_dev, ret && drv->driver.pm, "device %04x:%04x\n",
707 pci_dev->vendor, pci_dev->device);
712 /* New power management framework */
714 static int pci_pm_prepare(struct device *dev)
716 struct pci_dev *pci_dev = to_pci_dev(dev);
717 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
719 if (pm && pm->prepare) {
720 int error = pm->prepare(dev);
724 if (!error && dev_pm_test_driver_flags(dev, DPM_FLAG_SMART_PREPARE))
727 if (pci_dev_need_resume(pci_dev))
731 * The PME setting needs to be adjusted here in case the direct-complete
732 * optimization is used with respect to this device.
734 pci_dev_adjust_pme(pci_dev);
738 static void pci_pm_complete(struct device *dev)
740 struct pci_dev *pci_dev = to_pci_dev(dev);
742 pci_dev_complete_resume(pci_dev);
743 pm_generic_complete(dev);
745 /* Resume device if platform firmware has put it in reset-power-on */
746 if (pm_runtime_suspended(dev) && pm_resume_via_firmware()) {
747 pci_power_t pre_sleep_state = pci_dev->current_state;
749 pci_refresh_power_state(pci_dev);
751 * On platforms with ACPI this check may also trigger for
752 * devices sharing power resources if one of those power
753 * resources has been activated as a result of a change of the
754 * power state of another device sharing it. However, in that
755 * case it is also better to resume the device, in general.
757 if (pci_dev->current_state < pre_sleep_state)
758 pm_request_resume(dev);
762 #else /* !CONFIG_PM_SLEEP */
764 #define pci_pm_prepare NULL
765 #define pci_pm_complete NULL
767 #endif /* !CONFIG_PM_SLEEP */
769 #ifdef CONFIG_SUSPEND
770 static void pcie_pme_root_status_cleanup(struct pci_dev *pci_dev)
773 * Some BIOSes forget to clear Root PME Status bits after system
774 * wakeup, which breaks ACPI-based runtime wakeup on PCI Express.
775 * Clear those bits now just in case (shouldn't hurt).
777 if (pci_is_pcie(pci_dev) &&
778 (pci_pcie_type(pci_dev) == PCI_EXP_TYPE_ROOT_PORT ||
779 pci_pcie_type(pci_dev) == PCI_EXP_TYPE_RC_EC))
780 pcie_clear_root_pme_status(pci_dev);
783 static int pci_pm_suspend(struct device *dev)
785 struct pci_dev *pci_dev = to_pci_dev(dev);
786 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
788 pci_dev->skip_bus_pm = false;
791 * Disabling PTM allows some systems, e.g., Intel mobile chips
792 * since Coffee Lake, to enter a lower-power PM state.
794 pci_suspend_ptm(pci_dev);
796 if (pci_has_legacy_pm_support(pci_dev))
797 return pci_legacy_suspend(dev, PMSG_SUSPEND);
800 pci_pm_default_suspend(pci_dev);
805 * PCI devices suspended at run time may need to be resumed at this
806 * point, because in general it may be necessary to reconfigure them for
807 * system suspend. Namely, if the device is expected to wake up the
808 * system from the sleep state, it may have to be reconfigured for this
809 * purpose, or if the device is not expected to wake up the system from
810 * the sleep state, it should be prevented from signaling wakeup events
813 * Also if the driver of the device does not indicate that its system
814 * suspend callbacks can cope with runtime-suspended devices, it is
815 * better to resume the device from runtime suspend here.
817 if (!dev_pm_test_driver_flags(dev, DPM_FLAG_SMART_SUSPEND) ||
818 pci_dev_need_resume(pci_dev)) {
819 pm_runtime_resume(dev);
820 pci_dev->state_saved = false;
822 pci_dev_adjust_pme(pci_dev);
826 pci_power_t prev = pci_dev->current_state;
829 error = pm->suspend(dev);
830 suspend_report_result(dev, pm->suspend, error);
834 if (!pci_dev->state_saved && pci_dev->current_state != PCI_D0
835 && pci_dev->current_state != PCI_UNKNOWN) {
836 pci_WARN_ONCE(pci_dev, pci_dev->current_state != prev,
837 "PCI PM: State of device not saved by %pS\n",
845 static int pci_pm_suspend_late(struct device *dev)
847 if (dev_pm_skip_suspend(dev))
850 pci_fixup_device(pci_fixup_suspend, to_pci_dev(dev));
852 return pm_generic_suspend_late(dev);
855 static int pci_pm_suspend_noirq(struct device *dev)
857 struct pci_dev *pci_dev = to_pci_dev(dev);
858 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
860 if (dev_pm_skip_suspend(dev))
863 if (pci_has_legacy_pm_support(pci_dev))
864 return pci_legacy_suspend_late(dev);
867 pci_save_state(pci_dev);
871 if (pm->suspend_noirq) {
872 pci_power_t prev = pci_dev->current_state;
875 error = pm->suspend_noirq(dev);
876 suspend_report_result(dev, pm->suspend_noirq, error);
880 if (!pci_dev->state_saved && pci_dev->current_state != PCI_D0
881 && pci_dev->current_state != PCI_UNKNOWN) {
882 pci_WARN_ONCE(pci_dev, pci_dev->current_state != prev,
883 "PCI PM: State of device not saved by %pS\n",
889 if (!pci_dev->state_saved) {
890 pci_save_state(pci_dev);
893 * If the device is a bridge with a child in D0 below it,
894 * it needs to stay in D0, so check skip_bus_pm to avoid
895 * putting it into a low-power state in that case.
897 if (!pci_dev->skip_bus_pm && pci_power_manageable(pci_dev))
898 pci_prepare_to_sleep(pci_dev);
901 pci_dbg(pci_dev, "PCI PM: Suspend power state: %s\n",
902 pci_power_name(pci_dev->current_state));
904 if (pci_dev->current_state == PCI_D0) {
905 pci_dev->skip_bus_pm = true;
907 * Per PCI PM r1.2, table 6-1, a bridge must be in D0 if any
908 * downstream device is in D0, so avoid changing the power state
909 * of the parent bridge by setting the skip_bus_pm flag for it.
911 if (pci_dev->bus->self)
912 pci_dev->bus->self->skip_bus_pm = true;
915 if (pci_dev->skip_bus_pm && pm_suspend_no_platform()) {
916 pci_dbg(pci_dev, "PCI PM: Skipped\n");
920 pci_pm_set_unknown_state(pci_dev);
923 * Some BIOSes from ASUS have a bug: If a USB EHCI host controller's
924 * PCI COMMAND register isn't 0, the BIOS assumes that the controller
925 * hasn't been quiesced and tries to turn it off. If the controller
926 * is already in D3, this can hang or cause memory corruption.
928 * Since the value of the COMMAND register doesn't matter once the
929 * device has been suspended, we can safely set it to 0 here.
931 if (pci_dev->class == PCI_CLASS_SERIAL_USB_EHCI)
932 pci_write_config_word(pci_dev, PCI_COMMAND, 0);
935 pci_fixup_device(pci_fixup_suspend_late, pci_dev);
938 * If the target system sleep state is suspend-to-idle, it is sufficient
939 * to check whether or not the device's wakeup settings are good for
940 * runtime PM. Otherwise, the pm_resume_via_firmware() check will cause
941 * pci_pm_complete() to take care of fixing up the device's state
942 * anyway, if need be.
944 if (device_can_wakeup(dev) && !device_may_wakeup(dev))
945 dev->power.may_skip_resume = false;
950 static int pci_pm_resume_noirq(struct device *dev)
952 struct pci_dev *pci_dev = to_pci_dev(dev);
953 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
954 pci_power_t prev_state = pci_dev->current_state;
955 bool skip_bus_pm = pci_dev->skip_bus_pm;
957 if (dev_pm_skip_resume(dev))
961 * In the suspend-to-idle case, devices left in D0 during suspend will
962 * stay in D0, so it is not necessary to restore or update their
963 * configuration here and attempting to put them into D0 again is
964 * pointless, so avoid doing that.
966 if (!(skip_bus_pm && pm_suspend_no_platform()))
967 pci_pm_default_resume_early(pci_dev);
969 pci_fixup_device(pci_fixup_resume_early, pci_dev);
970 pcie_pme_root_status_cleanup(pci_dev);
972 if (!skip_bus_pm && prev_state == PCI_D3cold)
973 pci_pm_bridge_power_up_actions(pci_dev);
975 if (pci_has_legacy_pm_support(pci_dev))
978 if (pm && pm->resume_noirq)
979 return pm->resume_noirq(dev);
984 static int pci_pm_resume_early(struct device *dev)
986 if (dev_pm_skip_resume(dev))
989 return pm_generic_resume_early(dev);
992 static int pci_pm_resume(struct device *dev)
994 struct pci_dev *pci_dev = to_pci_dev(dev);
995 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
998 * This is necessary for the suspend error path in which resume is
999 * called without restoring the standard config registers of the device.
1001 if (pci_dev->state_saved)
1002 pci_restore_standard_config(pci_dev);
1004 pci_resume_ptm(pci_dev);
1006 if (pci_has_legacy_pm_support(pci_dev))
1007 return pci_legacy_resume(dev);
1009 pci_pm_default_resume(pci_dev);
1013 return pm->resume(dev);
1015 pci_pm_reenable_device(pci_dev);
1021 #else /* !CONFIG_SUSPEND */
1023 #define pci_pm_suspend NULL
1024 #define pci_pm_suspend_late NULL
1025 #define pci_pm_suspend_noirq NULL
1026 #define pci_pm_resume NULL
1027 #define pci_pm_resume_early NULL
1028 #define pci_pm_resume_noirq NULL
1030 #endif /* !CONFIG_SUSPEND */
1032 #ifdef CONFIG_HIBERNATE_CALLBACKS
1034 static int pci_pm_freeze(struct device *dev)
1036 struct pci_dev *pci_dev = to_pci_dev(dev);
1037 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1039 if (pci_has_legacy_pm_support(pci_dev))
1040 return pci_legacy_suspend(dev, PMSG_FREEZE);
1043 pci_pm_default_suspend(pci_dev);
1048 * Resume all runtime-suspended devices before creating a snapshot
1049 * image of system memory, because the restore kernel generally cannot
1050 * be expected to always handle them consistently and they need to be
1051 * put into the runtime-active metastate during system resume anyway,
1052 * so it is better to ensure that the state saved in the image will be
1053 * always consistent with that.
1055 pm_runtime_resume(dev);
1056 pci_dev->state_saved = false;
1061 error = pm->freeze(dev);
1062 suspend_report_result(dev, pm->freeze, error);
1070 static int pci_pm_freeze_noirq(struct device *dev)
1072 struct pci_dev *pci_dev = to_pci_dev(dev);
1073 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1075 if (pci_has_legacy_pm_support(pci_dev))
1076 return pci_legacy_suspend_late(dev);
1078 if (pm && pm->freeze_noirq) {
1081 error = pm->freeze_noirq(dev);
1082 suspend_report_result(dev, pm->freeze_noirq, error);
1087 if (!pci_dev->state_saved)
1088 pci_save_state(pci_dev);
1090 pci_pm_set_unknown_state(pci_dev);
1095 static int pci_pm_thaw_noirq(struct device *dev)
1097 struct pci_dev *pci_dev = to_pci_dev(dev);
1098 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1101 * The pm->thaw_noirq() callback assumes the device has been
1102 * returned to D0 and its config state has been restored.
1104 * In addition, pci_restore_state() restores MSI-X state in MMIO
1105 * space, which requires the device to be in D0, so return it to D0
1106 * in case the driver's "freeze" callbacks put it into a low-power
1109 pci_pm_power_up_and_verify_state(pci_dev);
1110 pci_restore_state(pci_dev);
1112 if (pci_has_legacy_pm_support(pci_dev))
1115 if (pm && pm->thaw_noirq)
1116 return pm->thaw_noirq(dev);
1121 static int pci_pm_thaw(struct device *dev)
1123 struct pci_dev *pci_dev = to_pci_dev(dev);
1124 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1127 if (pci_has_legacy_pm_support(pci_dev))
1128 return pci_legacy_resume(dev);
1132 error = pm->thaw(dev);
1134 pci_pm_reenable_device(pci_dev);
1137 pci_dev->state_saved = false;
1142 static int pci_pm_poweroff(struct device *dev)
1144 struct pci_dev *pci_dev = to_pci_dev(dev);
1145 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1147 if (pci_has_legacy_pm_support(pci_dev))
1148 return pci_legacy_suspend(dev, PMSG_HIBERNATE);
1151 pci_pm_default_suspend(pci_dev);
1155 /* The reason to do that is the same as in pci_pm_suspend(). */
1156 if (!dev_pm_test_driver_flags(dev, DPM_FLAG_SMART_SUSPEND) ||
1157 pci_dev_need_resume(pci_dev)) {
1158 pm_runtime_resume(dev);
1159 pci_dev->state_saved = false;
1161 pci_dev_adjust_pme(pci_dev);
1167 error = pm->poweroff(dev);
1168 suspend_report_result(dev, pm->poweroff, error);
1176 static int pci_pm_poweroff_late(struct device *dev)
1178 if (dev_pm_skip_suspend(dev))
1181 pci_fixup_device(pci_fixup_suspend, to_pci_dev(dev));
1183 return pm_generic_poweroff_late(dev);
1186 static int pci_pm_poweroff_noirq(struct device *dev)
1188 struct pci_dev *pci_dev = to_pci_dev(dev);
1189 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1191 if (dev_pm_skip_suspend(dev))
1194 if (pci_has_legacy_pm_support(pci_dev))
1195 return pci_legacy_suspend_late(dev);
1198 pci_fixup_device(pci_fixup_suspend_late, pci_dev);
1202 if (pm->poweroff_noirq) {
1205 error = pm->poweroff_noirq(dev);
1206 suspend_report_result(dev, pm->poweroff_noirq, error);
1211 if (!pci_dev->state_saved && !pci_has_subordinate(pci_dev))
1212 pci_prepare_to_sleep(pci_dev);
1215 * The reason for doing this here is the same as for the analogous code
1216 * in pci_pm_suspend_noirq().
1218 if (pci_dev->class == PCI_CLASS_SERIAL_USB_EHCI)
1219 pci_write_config_word(pci_dev, PCI_COMMAND, 0);
1221 pci_fixup_device(pci_fixup_suspend_late, pci_dev);
1226 static int pci_pm_restore_noirq(struct device *dev)
1228 struct pci_dev *pci_dev = to_pci_dev(dev);
1229 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1231 pci_pm_default_resume_early(pci_dev);
1232 pci_fixup_device(pci_fixup_resume_early, pci_dev);
1234 if (pci_has_legacy_pm_support(pci_dev))
1237 if (pm && pm->restore_noirq)
1238 return pm->restore_noirq(dev);
1243 static int pci_pm_restore(struct device *dev)
1245 struct pci_dev *pci_dev = to_pci_dev(dev);
1246 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1249 * This is necessary for the hibernation error path in which restore is
1250 * called without restoring the standard config registers of the device.
1252 if (pci_dev->state_saved)
1253 pci_restore_standard_config(pci_dev);
1255 if (pci_has_legacy_pm_support(pci_dev))
1256 return pci_legacy_resume(dev);
1258 pci_pm_default_resume(pci_dev);
1262 return pm->restore(dev);
1264 pci_pm_reenable_device(pci_dev);
1270 #else /* !CONFIG_HIBERNATE_CALLBACKS */
1272 #define pci_pm_freeze NULL
1273 #define pci_pm_freeze_noirq NULL
1274 #define pci_pm_thaw NULL
1275 #define pci_pm_thaw_noirq NULL
1276 #define pci_pm_poweroff NULL
1277 #define pci_pm_poweroff_late NULL
1278 #define pci_pm_poweroff_noirq NULL
1279 #define pci_pm_restore NULL
1280 #define pci_pm_restore_noirq NULL
1282 #endif /* !CONFIG_HIBERNATE_CALLBACKS */
1286 static int pci_pm_runtime_suspend(struct device *dev)
1288 struct pci_dev *pci_dev = to_pci_dev(dev);
1289 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1290 pci_power_t prev = pci_dev->current_state;
1293 pci_suspend_ptm(pci_dev);
1296 * If pci_dev->driver is not set (unbound), we leave the device in D0,
1297 * but it may go to D3cold when the bridge above it runtime suspends.
1298 * Save its config space in case that happens.
1300 if (!pci_dev->driver) {
1301 pci_save_state(pci_dev);
1305 pci_dev->state_saved = false;
1306 if (pm && pm->runtime_suspend) {
1307 error = pm->runtime_suspend(dev);
1309 * -EBUSY and -EAGAIN are used to request the runtime PM core
1310 * to schedule a new suspend, so log the event only with debug
1313 if (error == -EBUSY || error == -EAGAIN) {
1314 pci_dbg(pci_dev, "can't suspend now (%ps returned %d)\n",
1315 pm->runtime_suspend, error);
1318 pci_err(pci_dev, "can't suspend (%ps returned %d)\n",
1319 pm->runtime_suspend, error);
1324 pci_fixup_device(pci_fixup_suspend, pci_dev);
1326 if (pm && pm->runtime_suspend
1327 && !pci_dev->state_saved && pci_dev->current_state != PCI_D0
1328 && pci_dev->current_state != PCI_UNKNOWN) {
1329 pci_WARN_ONCE(pci_dev, pci_dev->current_state != prev,
1330 "PCI PM: State of device not saved by %pS\n",
1331 pm->runtime_suspend);
1335 if (!pci_dev->state_saved) {
1336 pci_save_state(pci_dev);
1337 pci_finish_runtime_suspend(pci_dev);
/*
 * Runtime-resume callback for PCI devices (installed as .runtime_resume in
 * pci_dev_pm_ops).  Runs the default early-resume step and pci_resume_ptm()
 * for every device, then - for devices with a driver - the
 * pci_fixup_resume_early fixups, the default resume step, the bridge
 * power-up actions when coming out of D3cold, and finally the driver's
 * ->runtime_resume() hook.
 *
 * @dev: generic device embedded in the PCI device.
 *
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably the result of the driver hook is returned - confirm.
 */
1343 static int pci_pm_runtime_resume(struct device *dev)
1345 struct pci_dev *pci_dev = to_pci_dev(dev);
/* pm is NULL when dev->driver is NULL; otherwise it is dev->driver->pm */
1346 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
/* State before anything is touched, so a D3cold exit can be detected below */
1347 pci_power_t prev_state = pci_dev->current_state;
1351 * Restoring config space is necessary even if the device is not bound
1352 * to a driver because although we left it in D0, it may have gone to
1353 * D3cold when the bridge above it runtime suspended.
1355 pci_pm_default_resume_early(pci_dev);
1356 pci_resume_ptm(pci_dev);
/* Unbound device: the branch body is not visible here (presumably an early return) */
1358 if (!pci_dev->driver)
1361 pci_fixup_device(pci_fixup_resume_early, pci_dev);
1362 pci_pm_default_resume(pci_dev);
/* Only a device that was in D3cold before this resume gets the power-up actions */
1364 if (prev_state == PCI_D3cold)
1365 pci_pm_bridge_power_up_actions(pci_dev);
/* Let the driver's own hook run last and keep its result in error */
1367 if (pm && pm->runtime_resume)
1368 error = pm->runtime_resume(dev);
/*
 * Runtime-idle callback for PCI devices (installed as .runtime_idle in
 * pci_dev_pm_ops).  For a device with a driver, forwards to the driver's
 * ->runtime_idle() hook when one is provided.
 *
 * @dev: generic device embedded in the PCI device.
 *
 * NOTE(review): the return statements of the non-forwarding paths are not
 * visible in this excerpt.
 */
1373 static int pci_pm_runtime_idle(struct device *dev)
1375 struct pci_dev *pci_dev = to_pci_dev(dev);
/* pm is NULL when dev->driver is NULL; dev->driver->pm may be NULL as well */
1376 const struct dev_pm_ops *pm = dev->driver ? dev->driver->pm : NULL;
1379 * If pci_dev->driver is not set (unbound), the device should
1380 * always remain in D0 regardless of the runtime PM status
1382 if (!pci_dev->driver)
/*
 * NOTE(review): pm is dereferenced here; no NULL check on pm is visible in
 * this excerpt - confirm that one precedes this line in the full function.
 */
1388 if (pm->runtime_idle)
1389 return pm->runtime_idle(dev);
1394 static const struct dev_pm_ops pci_dev_pm_ops = {
1395 .prepare = pci_pm_prepare,
1396 .complete = pci_pm_complete,
1397 .suspend = pci_pm_suspend,
1398 .suspend_late = pci_pm_suspend_late,
1399 .resume = pci_pm_resume,
1400 .resume_early = pci_pm_resume_early,
1401 .freeze = pci_pm_freeze,
1402 .thaw = pci_pm_thaw,
1403 .poweroff = pci_pm_poweroff,
1404 .poweroff_late = pci_pm_poweroff_late,
1405 .restore = pci_pm_restore,
1406 .suspend_noirq = pci_pm_suspend_noirq,
1407 .resume_noirq = pci_pm_resume_noirq,
1408 .freeze_noirq = pci_pm_freeze_noirq,
1409 .thaw_noirq = pci_pm_thaw_noirq,
1410 .poweroff_noirq = pci_pm_poweroff_noirq,
1411 .restore_noirq = pci_pm_restore_noirq,
1412 .runtime_suspend = pci_pm_runtime_suspend,
1413 .runtime_resume = pci_pm_runtime_resume,
1414 .runtime_idle = pci_pm_runtime_idle,
1417 #define PCI_PM_OPS_PTR (&pci_dev_pm_ops)
1419 #else /* !CONFIG_PM */
/*
 * CONFIG_PM is disabled in this branch: the runtime PM callback names and
 * the PM operations pointer are defined as NULL so that users of these
 * names (such as the .pm member of pci_bus_type) still compile.
 */
1421 #define pci_pm_runtime_suspend NULL
1422 #define pci_pm_runtime_resume NULL
1423 #define pci_pm_runtime_idle NULL
1425 #define PCI_PM_OPS_PTR NULL
1427 #endif /* !CONFIG_PM */
1430 * __pci_register_driver - register a new pci driver
1431 * @drv: the driver structure to register
1432 * @owner: owner module of drv
1433 * @mod_name: module name string
1435 * Adds the driver structure to the list of registered drivers.
1436 * Returns a negative value on error, otherwise 0.
1437 * If no error occurred, the driver remains registered even if
1438 * no device was claimed during registration.
1440 int __pci_register_driver(struct pci_driver *drv, struct module *owner,
1441 const char *mod_name)
1443 /* initialize common driver fields */
1444 drv->driver.name = drv->name;
1445 drv->driver.bus = &pci_bus_type;
1446 drv->driver.owner = owner;
1447 drv->driver.mod_name = mod_name;
1448 drv->driver.groups = drv->groups;
1449 drv->driver.dev_groups = drv->dev_groups;
1451 spin_lock_init(&drv->dynids.lock);
1452 INIT_LIST_HEAD(&drv->dynids.list);
1454 /* register with core */
1455 return driver_register(&drv->driver);
1457 EXPORT_SYMBOL(__pci_register_driver);
1460 * pci_unregister_driver - unregister a pci driver
1461 * @drv: the driver structure to unregister
1463 * Deletes the driver structure from the list of registered PCI drivers,
1464 * gives it a chance to clean up by calling its remove() function for
1465 * each device it was responsible for, and marks those devices as
1469 void pci_unregister_driver(struct pci_driver *drv)
1471 driver_unregister(&drv->driver);
1472 pci_free_dynids(drv);
1474 EXPORT_SYMBOL(pci_unregister_driver);
/*
 * Stand-in driver that pci_dev_driver() reports for a device that has a
 * resource flagged IORESOURCE_BUSY.
 * NOTE(review): the initializer body is not visible in this excerpt.
 */
1476 static struct pci_driver pci_compat_driver = {
1481 * pci_dev_driver - get the pci_driver of a device
1482 * @dev: the device to query
1484 * Returns the appropriate pci_driver structure or %NULL if there is no
1485 * registered driver for the device.
1487 struct pci_driver *pci_dev_driver(const struct pci_dev *dev)
/*
 * Scan the device's resources from index 0 up to and including
 * PCI_ROM_RESOURCE; as soon as one is flagged IORESOURCE_BUSY, report the
 * compat stand-in driver.
 * NOTE(review): the statements before this loop and the final return are
 * not visible in this excerpt.
 */
1494 for (i = 0; i <= PCI_ROM_RESOURCE; i++)
1495 if (dev->resource[i].flags & IORESOURCE_BUSY)
1496 return &pci_compat_driver;
1500 EXPORT_SYMBOL(pci_dev_driver);
1503 * pci_bus_match - Tell if a PCI device structure has a matching PCI device id structure
1504 * @dev: the PCI device structure to match against
1505 * @drv: the device driver to search for matching PCI device id structures
1507 * Used by the driver core to check whether a PCI device present in the
1508 * system is in a driver's list of supported devices. Returns nonzero if a
1509 * matching pci_device_id structure was found, or 0 if there is no match.
1511 static int pci_bus_match(struct device *dev, struct device_driver *drv)
1513 struct pci_dev *pci_dev = to_pci_dev(dev);
1514 struct pci_driver *pci_drv;
1515 const struct pci_device_id *found_id;
/*
 * Devices with match_driver cleared take a separate path; its body is not
 * visible in this excerpt (presumably the match is rejected - confirm).
 */
1517 if (!pci_dev->match_driver)
/* Convert to the PCI driver and ask pci_match_device() for a matching ID */
1520 pci_drv = to_pci_driver(drv);
1521 found_id = pci_match_device(pci_drv, pci_dev);
1529 * pci_dev_get - increments the reference count of the pci device structure
1530 * @dev: the device being referenced
1532 * Each live reference to a device should be refcounted.
1534 * Drivers for PCI devices should normally record such references in
1535 * their probe() methods, when they bind to a device, and release
1536 * them by calling pci_dev_put(), in their remove() methods.
1538 * A pointer to the device with the incremented reference counter is returned.
1540 struct pci_dev *pci_dev_get(struct pci_dev *dev)
/*
 * Take a reference on the struct device embedded in the PCI device.
 * NOTE(review): the statement guarding this call and the return are not
 * visible in this excerpt.
 */
1543 get_device(&dev->dev);
1546 EXPORT_SYMBOL(pci_dev_get);
1549 * pci_dev_put - release a use of the pci device structure
1550 * @dev: device that's been disconnected
1552 * Must be called when a user of a device is finished with it. When the last
1553 * user of the device calls this function, the memory of the device is freed.
1555 void pci_dev_put(struct pci_dev *dev)
/*
 * Drop a reference on the struct device embedded in the PCI device.
 * NOTE(review): the statement guarding this call is not visible in this
 * excerpt.
 */
1558 put_device(&dev->dev);
1560 EXPORT_SYMBOL(pci_dev_put);
/*
 * uevent callback of the PCI bus type (installed as .uevent in
 * pci_bus_type).  Adds the PCI-specific variables PCI_CLASS, PCI_ID,
 * PCI_SUBSYS_ID, PCI_SLOT_NAME and MODALIAS to the event environment.
 *
 * @dev: device the uevent is generated for
 * @env: uevent environment the variables are appended to
 *
 * NOTE(review): the handling of a failing add_uevent_var() call and the
 * final return are not visible in this excerpt.
 */
1562 static int pci_uevent(const struct device *dev, struct kobj_uevent_env *env)
1564 const struct pci_dev *pdev;
1569 pdev = to_pci_dev(dev);
/* Class code, printed as at least four upper-case hex digits */
1571 if (add_uevent_var(env, "PCI_CLASS=%04X", pdev->class))
/* Vendor and device ID as "VVVV:DDDD" */
1574 if (add_uevent_var(env, "PCI_ID=%04X:%04X", pdev->vendor, pdev->device))
/* Subsystem vendor and subsystem device ID in the same format */
1577 if (add_uevent_var(env, "PCI_SUBSYS_ID=%04X:%04X", pdev->subsystem_vendor,
1578 pdev->subsystem_device))
/* Name of the device as returned by pci_name() */
1581 if (add_uevent_var(env, "PCI_SLOT_NAME=%s", pci_name(pdev)))
/*
 * Module alias string: the four IDs as eight hex digits each, followed by
 * bytes of the class code (bits 23:16 for "bc", bits 15:8 for "sc"; the
 * argument for the trailing "i" field is not visible in this excerpt).
 */
1584 if (add_uevent_var(env, "MODALIAS=pci:v%08Xd%08Xsv%08Xsd%08Xbc%02Xsc%02Xi%02X",
1585 pdev->vendor, pdev->device,
1586 pdev->subsystem_vendor, pdev->subsystem_device,
1587 (u8)(pdev->class >> 16), (u8)(pdev->class >> 8),
1594 #if defined(CONFIG_PCIEAER) || defined(CONFIG_EEH)
1596 * pci_uevent_ers - emit a uevent during recovery path of PCI device
1597 * @pdev: PCI device undergoing error recovery
1598 * @err_type: type of error event
1600 void pci_uevent_ers(struct pci_dev *pdev, enum pci_ers_result err_type)
/*
 * Pick the ERROR_EVENT / DEVICE_ONLINE pair that describes @err_type.
 * NOTE(review): the switch statement, the declarations of envp and idx and
 * the handling of other result values are not visible in this excerpt.
 */
/* No result yet, or recovery is possible: recovery begins, device offline */
1606 case PCI_ERS_RESULT_NONE:
1607 case PCI_ERS_RESULT_CAN_RECOVER:
1608 envp[idx++] = "ERROR_EVENT=BEGIN_RECOVERY";
1609 envp[idx++] = "DEVICE_ONLINE=0";
/* Recovery succeeded: device is reported online again */
1611 case PCI_ERS_RESULT_RECOVERED:
1612 envp[idx++] = "ERROR_EVENT=SUCCESSFUL_RECOVERY";
1613 envp[idx++] = "DEVICE_ONLINE=1";
/* Recovery failed: device stays offline */
1615 case PCI_ERS_RESULT_DISCONNECT:
1616 envp[idx++] = "ERROR_EVENT=FAILED_RECOVERY";
1617 envp[idx++] = "DEVICE_ONLINE=0";
/* Emit the collected variables as a KOBJ_CHANGE uevent on the device's kobject */
1625 kobject_uevent_env(&pdev->dev.kobj, KOBJ_CHANGE, envp);
/*
 * ->num_vf callback of the PCI bus type: returns pci_num_vf() for the PCI
 * device that embeds @dev.
 */
static int pci_bus_num_vf(struct device *dev)
{
	struct pci_dev *pdev = to_pci_dev(dev);

	return pci_num_vf(pdev);
}
1636 * pci_dma_configure - Setup DMA configuration
1637 * @dev: ptr to dev structure
1639 * Function to update a PCI device's DMA configuration using the same
1640 * info from the OF node or ACPI node of host bridge's parent (if any).
1642 static int pci_dma_configure(struct device *dev)
1644 struct pci_driver *driver = to_pci_driver(dev->driver);
1645 struct device *bridge;
/* Look up the host bridge device; it is released again further down */
1648 bridge = pci_get_host_bridge_device(to_pci_dev(dev));
/*
 * With CONFIG_OF enabled and an OF node on the bridge's parent, configure
 * DMA from that node ...
 */
1650 if (IS_ENABLED(CONFIG_OF) && bridge->parent &&
1651 bridge->parent->of_node) {
1652 ret = of_dma_configure(dev, bridge->parent->of_node, true);
/* ... otherwise use the bridge's ACPI companion, if it has one */
1653 } else if (has_acpi_companion(bridge)) {
1654 struct acpi_device *adev = to_acpi_device_node(bridge->fwnode);
1656 ret = acpi_dma_configure(dev, acpi_get_dma_attr(adev));
1659 pci_put_host_bridge_device(bridge);
/*
 * Configuration succeeded and the driver does not manage DMA itself:
 * request use of the IOMMU default domain for the device.
 */
1661 if (!ret && !driver->driver_managed_dma) {
1662 ret = iommu_device_use_default_domain(dev);
/*
 * NOTE(review): the condition guarding this teardown is not visible in this
 * excerpt; presumably it runs only when the call above failed - confirm.
 */
1664 arch_teardown_dma_ops(dev);
1670 static void pci_dma_cleanup(struct device *dev)
1672 struct pci_driver *driver = to_pci_driver(dev->driver);
1674 if (!driver->driver_managed_dma)
1675 iommu_device_unuse_default_domain(dev);
/*
 * Bus type of the PCI bus: ties the match, uevent, probe/remove/shutdown,
 * sysfs attribute group, power-management, num_vf and DMA callbacks defined
 * in this file together.  Registered from pci_driver_init() and assigned to
 * every driver in __pci_register_driver().
 * NOTE(review): the .name initializer is not visible in this excerpt.
 */
1678 struct bus_type pci_bus_type = {
1680 .match = pci_bus_match,
1681 .uevent = pci_uevent,
1682 .probe = pci_device_probe,
1683 .remove = pci_device_remove,
1684 .shutdown = pci_device_shutdown,
1685 .dev_groups = pci_dev_groups,
1686 .bus_groups = pci_bus_groups,
1687 .drv_groups = pci_drv_groups,
/* NULL when CONFIG_PM is disabled, &pci_dev_pm_ops otherwise */
1688 .pm = PCI_PM_OPS_PTR,
1689 .num_vf = pci_bus_num_vf,
1690 .dma_configure = pci_dma_configure,
1691 .dma_cleanup = pci_dma_cleanup,
1693 EXPORT_SYMBOL(pci_bus_type);
1695 #ifdef CONFIG_PCIEPORTBUS
/*
 * Match callback of pcie_port_bus_type.  The visible conditions test, in
 * order: that both @drv and @dev belong to pcie_port_bus_type, that the
 * driver's service equals the device's service, and that the driver's port
 * type is either PCIE_ANY_PORT or equal to the PCIe type of the device's
 * port.
 *
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably each failing test rejects the match - confirm.
 */
1696 static int pcie_port_bus_match(struct device *dev, struct device_driver *drv)
1698 struct pcie_device *pciedev;
1699 struct pcie_port_service_driver *driver;
/* Either side being on a different bus triggers this branch */
1701 if (drv->bus != &pcie_port_bus_type || dev->bus != &pcie_port_bus_type)
1704 pciedev = to_pcie_device(dev);
1705 driver = to_service_driver(drv);
/* Service mismatch between driver and device */
1707 if (driver->service != pciedev->service)
/* Driver is restricted to a port type that differs from this port's type */
1710 if (driver->port_type != PCIE_ANY_PORT &&
1711 driver->port_type != pci_pcie_type(pciedev->port))
/*
 * Bus type named "pci_express", matched through pcie_port_bus_match().
 * Registered from pci_driver_init() when CONFIG_PCIEPORTBUS is enabled.
 */
1717 struct bus_type pcie_port_bus_type = {
1718 .name = "pci_express",
1719 .match = pcie_port_bus_match,
/*
 * Registers the bus types defined in this file; run as a postcore initcall.
 *
 * NOTE(review): the checks on ret after each bus_register() call and the
 * final return are not visible in this excerpt.
 */
1723 static int __init pci_driver_init(void)
/* The PCI bus type itself */
1727 ret = bus_register(&pci_bus_type);
/* The PCIe port service bus, only when CONFIG_PCIEPORTBUS is enabled */
1731 #ifdef CONFIG_PCIEPORTBUS
1732 ret = bus_register(&pcie_port_bus_type);
/* Add the PCI bus to DMA debugging via dma_debug_add_bus() */
1736 dma_debug_add_bus(&pci_bus_type);
1739 postcore_initcall(pci_driver_init);