lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [day] [month] [year] [list]
Message-id: <4F5F0192.3020209@huawei.com>
Date:	Tue, 13 Mar 2012 16:13:06 +0800
From:	Jiang Liu <jiang.liu@...wei.com>
To:	Bjorn Helgaas <bhelgaas@...gle.com>
Cc:	Jiang Liu <liuj97@...il.com>, Yinghai Lu <yinghai@...nel.org>,
	Jesse Barnes <jbarnes@...tuousgeek.org>,
	Ashok Raj <ashok.raj@...el.com>,
	Suresh Siddha <suresh.b.siddha@...el.com>,
	Youquan Song <youquan.song@...el.com>,
	linux-pci@...r.kernel.org, linux-kernel@...r.kernel.org,
	chenkeping@...wei.com
Subject: Re: [RFC PATCH 4/5] PCI: Introduce hotplug-safe pci bus searching
 interfaces

Hi Bjorn,
	As you have mentioned, in most cases it is safe to
use pci_find_bus()/pci_find_next_bus(), as in the following cases:
	1) invoked by platform-specific code during boot, because
it's single-threaded.
	2) invoked by a hotplug driver, because the hotplug driver has
a serialization mechanism.
	3) invoked by a driver that has platform-specific knowledge.
	After scanning the kernel source code, I have found two
cases which aren't covered by the above scenarios.
	The first case is that the PCIe PME driver invokes pci_find_bus()
when handling PME events. The second case is that the i7core_edac
driver invokes pci_find_next_bus() from its probe method.
AFAICT there's currently no mechanism to protect these two cases from
hotplug operations.

	Bjorn, you are right. I was over-reacting a little here.
The better solution should be to keep the original
pci_find_bus/pci_find_next_bus usage model and only introduce
a new mechanism to protect the above two cases. That way,
the code change will be much smaller.
	Thanks!

On 2012-3-13 11:49, Bjorn Helgaas wrote:
> On Sun, Mar 11, 2012 at 11:48 AM, Jiang Liu<liuj97@...il.com>  wrote:
>> By design, pci_find_bus() and pci_find_next_bus() should be used at boot
>> time only. But currently these two interfaces have been used at runtime
>> by other components. With the introduction of pci root bus hotplug,
>> the situation becomes more serious. So introduce several hotplug-safe pci
>> bus searching interfaces to be used at runtime.  The new interfaces use
>> rculist instead of the pci_bus_sem to protect themselves from dynamic changes.
>> The proposed interfaces are straight-forward replacement of the old ones:
>> pci_bus_get()/put(), pci_get_bus(), pci_get_next_bus() and pci_bus_present().
>> And the old interface may be deprecated or marked as __init in future.
>
> This looks like a lot of work to fix something that shouldn't need to
> be fixed.  I don't think we should be doing any of this blind probing
> at hotplug-time.  If we do blind probing at all, it should only be
> done at boot-time.
>
>> Signed-off-by: Jiang Liu<jiang.liu@...wei.com>
>> ---
>>   drivers/pci/bus.c    |   20 ++++++-
>>   drivers/pci/probe.c  |    5 +-
>>   drivers/pci/remove.c |    5 +-
>>   drivers/pci/search.c |  165 ++++++++++++++++++++++++++++++++++++++++++--------
>>   include/linux/pci.h  |    8 +++
>>   5 files changed, 173 insertions(+), 30 deletions(-)
>>
>> diff --git a/drivers/pci/bus.c b/drivers/pci/bus.c
>> index 1eb7944..0543d47 100644
>> --- a/drivers/pci/bus.c
>> +++ b/drivers/pci/bus.c
>> @@ -15,6 +15,7 @@
>>   #include<linux/proc_fs.h>
>>   #include<linux/init.h>
>>   #include<linux/slab.h>
>> +#include<linux/rculist.h>
>>
>>   #include "pci.h"
>>
>> @@ -238,7 +239,7 @@ void pci_bus_add_devices(const struct pci_bus *bus)
>>                         continue;
>>                 if (list_empty(&child->node)) {
>>                         down_write(&pci_bus_sem);
>> -                       list_add_tail(&child->node,&dev->bus->children);
>> +                       list_add_tail_rcu(&child->node,&dev->bus->children);
>>                         up_write(&pci_bus_sem);
>>                 }
>>                 pci_bus_add_devices(child);
>> @@ -277,7 +278,7 @@ void pci_bus_add_single_device(struct pci_dev *dev)
>>         if (child) {
>>                 if (list_empty(&child->node)) {
>>                         down_write(&pci_bus_sem);
>> -                       list_add_tail(&child->node,&dev->bus->children);
>> +                       list_add_tail_rcu(&child->node,&dev->bus->children);
>>                         up_write(&pci_bus_sem);
>>                 }
>>                 pci_bus_add_devices(child);
>> @@ -364,6 +365,21 @@ void pci_walk_bus(struct pci_bus *top, int (*cb)(struct pci_dev *, void *),
>>   }
>>   EXPORT_SYMBOL_GPL(pci_walk_bus);
>>
>> +struct pci_bus *pci_bus_get(struct pci_bus *bus)
>> +{
>> +       if (bus)
>> +               get_device(&bus->dev);
>> +       return bus;
>> +}
>> +EXPORT_SYMBOL(pci_bus_get);
>> +
>> +void pci_bus_put(struct pci_bus *bus)
>> +{
>> +       if (bus)
>> +               put_device(&bus->dev);
>> +}
>> +EXPORT_SYMBOL(pci_bus_put);
>> +
>>   EXPORT_SYMBOL(pci_bus_alloc_resource);
>>   EXPORT_SYMBOL_GPL(pci_bus_add_device);
>>   EXPORT_SYMBOL(pci_bus_add_devices);
>> diff --git a/drivers/pci/probe.c b/drivers/pci/probe.c
>> index 0ca213c..273c387 100644
>> --- a/drivers/pci/probe.c
>> +++ b/drivers/pci/probe.c
>> @@ -10,6 +10,7 @@
>>   #include<linux/module.h>
>>   #include<linux/cpumask.h>
>>   #include<linux/pci-aspm.h>
>> +#include<linux/rculist.h>
>>   #include "pci.h"
>>
>>   #define CARDBUS_LATENCY_TIMER  176     /* secondary latency timer */
>> @@ -633,7 +634,7 @@ struct pci_bus *__ref pci_add_new_bus(struct pci_bus *parent, struct pci_dev *de
>>         child = pci_alloc_child_bus(parent, dev, busnr);
>>         if (child) {
>>                 down_write(&pci_bus_sem);
>> -               list_add_tail(&child->node,&parent->children);
>> +               list_add_tail_rcu(&child->node,&parent->children);
>>                 up_write(&pci_bus_sem);
>>         }
>>         return child;
>> @@ -1889,7 +1890,7 @@ struct pci_bus *pci_create_root_bus(struct device *parent, int bus,
>>         }
>>
>>         down_write(&pci_bus_sem);
>> -       list_add_tail(&b->node,&pci_root_buses);
>> +       list_add_tail_rcu(&b->node,&pci_root_buses);
>>         up_write(&pci_bus_sem);
>>
>>         return b;
>> diff --git a/drivers/pci/remove.c b/drivers/pci/remove.c
>> index 25f368e..120bee9 100644
>> --- a/drivers/pci/remove.c
>> +++ b/drivers/pci/remove.c
>> @@ -1,6 +1,7 @@
>>   #include<linux/pci.h>
>>   #include<linux/module.h>
>>   #include<linux/pci-aspm.h>
>> +#include<linux/rculist.h>
>>   #include "pci.h"
>>
>>   static void pci_free_resources(struct pci_dev *dev)
>> @@ -67,9 +68,11 @@ void pci_remove_bus(struct pci_bus *pci_bus)
>>         pci_proc_detach_bus(pci_bus);
>>
>>         down_write(&pci_bus_sem);
>> -       list_del(&pci_bus->node);
>> +       list_del_rcu(&pci_bus->node);
>>         pci_bus_release_busn_res(pci_bus);
>>         up_write(&pci_bus_sem);
>> +       synchronize_rcu();
>> +
>>         if (pci_bus->is_added || pci_is_root_bus(pci_bus)) {
>>                 pci_remove_legacy_files(pci_bus);
>>                 device_unregister(&pci_bus->dev);
>> diff --git a/drivers/pci/search.c b/drivers/pci/search.c
>> index b572730..de31957 100644
>> --- a/drivers/pci/search.c
>> +++ b/drivers/pci/search.c
>> @@ -12,6 +12,7 @@
>>   #include<linux/slab.h>
>>   #include<linux/module.h>
>>   #include<linux/interrupt.h>
>> +#include<linux/rculist.h>
>>   #include "pci.h"
>>
>>   DECLARE_RWSEM(pci_bus_sem);
>> @@ -52,20 +53,63 @@ pci_find_upstream_pcie_bridge(struct pci_dev *pdev)
>>
>>   static struct pci_bus *pci_do_find_bus(struct pci_bus *bus, unsigned char busnr)
>>   {
>> -       struct pci_bus* child;
>> -       struct list_head *tmp;
>> +       struct pci_bus *child;
>> +       struct pci_bus *tmp_bus;
>>
>>         if(bus->number == busnr)
>>                 return bus;
>>
>> -       list_for_each(tmp,&bus->children) {
>> -               child = pci_do_find_bus(pci_bus_b(tmp), busnr);
>> -               if(child)
>> -                       return child;
>> +       list_for_each_entry_rcu(child,&bus->children, node) {
>> +               tmp_bus = pci_do_find_bus(child, busnr);
>> +               if(tmp_bus)
>> +                       return tmp_bus;
>>         }
>>         return NULL;
>>   }
>>
>> +static struct pci_bus *__pci_find_bus(int domain, int busnr)
>> +{
>> +       struct pci_bus *bus;
>> +       struct pci_bus *tmp_bus;
>> +
>> +       list_for_each_entry_rcu(bus,&pci_root_buses, node) {
>> +               if (pci_domain_nr(bus) != domain)
>> +                       continue;
>> +               tmp_bus = pci_do_find_bus(bus, busnr);
>> +               if (tmp_bus)
>> +                       return tmp_bus;
>> +       }
>> +
>> +       return NULL;
>> +}
>> +
>> +static struct pci_bus *__pci_find_next_bus(const struct pci_bus *from)
>> +{
>> +       struct list_head *n;
>> +       struct pci_bus *b = NULL;
>> +
>> +       /* First search, start from the pci root bus list */
>> +       if (from == NULL) {
>> +               n = rcu_dereference(list_next_rcu(&pci_root_buses));
>> +               if (n !=&pci_root_buses)
>> +                       b = pci_bus_b(n);
>> +       /* Continue on the pci root bus list */
>> +       } else if (pci_is_root_bus((struct pci_bus *)from)) {
>> +               n = rcu_dereference(list_next_rcu(&from->node));
>> +               if (n !=&pci_root_buses)
>> +                       b = pci_bus_b(n);
>> +       /* Continue on other non pci root bus list */
>> +       } else {
>> +               struct pci_bus *parent = from->self->bus;
>> +
>> +               n = rcu_dereference(list_next_rcu(&from->node));
>> +               if (n !=&parent->children)
>> +                       b = pci_bus_b(n);
>> +       }
>> +
>> +       return b;
>> +}
>> +
>>   /**
>>   * pci_find_bus - locate PCI bus from a given domain and bus number
>>   * @domain: number of PCI domain to search
>> @@ -74,20 +118,19 @@ static struct pci_bus *pci_do_find_bus(struct pci_bus *bus, unsigned char busnr)
>>   * Given a PCI bus number and domain number, the desired PCI bus is located
>>   * in the global list of PCI buses.  If the bus is found, a pointer to its
>>   * data structure is returned.  If no bus is found, %NULL is returned.
>> + *
>> + * TODO: By design, this function should only be called at boot time.
>> + * So either mark it as __init or deprecate it.
>>   */
>>   struct pci_bus * pci_find_bus(int domain, int busnr)
>>   {
>> -       struct pci_bus *bus = NULL;
>> -       struct pci_bus *tmp_bus;
>> +       struct pci_bus *bus;
>>
>> -       while ((bus = pci_find_next_bus(bus)) != NULL)  {
>> -               if (pci_domain_nr(bus) != domain)
>> -                       continue;
>> -               tmp_bus = pci_do_find_bus(bus, busnr);
>> -               if (tmp_bus)
>> -                       return tmp_bus;
>> -       }
>> -       return NULL;
>> +       rcu_read_lock();
>> +       bus = __pci_find_bus(domain, busnr);
>> +       rcu_read_unlock();
>> +
>> +       return bus;
>>   }
>>
>>   /**
>> @@ -98,21 +141,93 @@ struct pci_bus * pci_find_bus(int domain, int busnr)
>>   * initiated by passing %NULL as the @from argument.  Otherwise if
>>   * @from is not %NULL, searches continue from next device on the
>>   * global list.
>> + *
>> + * TODO: By design, this function should only be called at boot time.
>> + * So either mark it as __init or deprecate it.
>>   */
>>   struct pci_bus *
>>   pci_find_next_bus(const struct pci_bus *from)
>>   {
>> -       struct list_head *n;
>> -       struct pci_bus *b = NULL;
>> +       struct pci_bus *bus;
>>
>> -       WARN_ON(in_interrupt());
>> -       down_read(&pci_bus_sem);
>> -       n = from ? from->node.next : pci_root_buses.next;
>> -       if (n !=&pci_root_buses)
>> -               b = pci_bus_b(n);
>> -       up_read(&pci_bus_sem);
>> -       return b;
>> +       rcu_read_lock();
>> +       bus = __pci_find_next_bus(from);
>> +       rcu_read_unlock();
>> +
>> +       return bus;
>> +}
>> +
>> +/**
>> + * pci_get_bus - locate PCI bus from a given domain and bus number
>> + * @domain: number of PCI domain to search
>> + * @busnr: number of desired PCI bus
>> + *
>> + * Given a PCI bus number and domain number, the desired PCI bus is located
>> + * in the global list of PCI buses. If the bus is found, a pointer to its
>> + * data structure is returned, and the reference count to the bus is increased.
>> + * Otherwise, %NULL is returned.
>> + */
>> +struct pci_bus *
>> +pci_get_bus(int domain, int busnr)
>> +{
>> +       struct pci_bus *bus;
>> +
>> +       rcu_read_lock();
>> +       bus = pci_bus_get(__pci_find_bus(domain, busnr));
>> +       rcu_read_unlock();
>> +
>> +       return bus;
>> +}
>> +EXPORT_SYMBOL(pci_get_bus);
>> +
>> +/**
>> + * pci_get_next_bus - begin or continue searching for a PCI bus
>> + * @from: Previous PCI bus found, or %NULL for new search.
>> + *
>> + * Iterates through the list of known PCI busses.  A new search is
>> + * initiated by passing %NULL as the @from argument.  Otherwise if
>> + * @from is not %NULL, searches continue from next device on the
>> + * global list. If a bus is found, a pointer to its data structure
>> + * is returned, and the reference count to the bus is increased.
>> + * Otherwise, %NULL is returned.
>> + * The reference count for @from is always decremented if it is not %NULL.
>> + */
>> +struct pci_bus *
>> +pci_get_next_bus(struct pci_bus *from)
>> +{
>> +       struct pci_bus *bus;
>> +
>> +       rcu_read_lock();
>> +       bus = pci_bus_get(__pci_find_next_bus(from));
>> +       rcu_read_unlock();
>> +
>> +       return bus;
>> +}
>> +EXPORT_SYMBOL(pci_get_next_bus);
>> +
>> +/**
>> + * pci_bus_present - Returns true if a bus with the (@domain, @busnr)
>> + * is present, false if not.
>> + * @domain: number of PCI domain to search
>> + * @busnr: number of desired PCI bus
>> + *
>> + * Obvious fact: You do not have a reference to any bus that might be found
>> + * by this function, so if that bus is removed from the system right after
>> + * this function is finished, the value will be stale.  Use this function to
>> + * find buses that are usually built into a system, or for a general hint as
>> + * to if another device happens to be present at this specific moment in time.
>> + */
>> +bool pci_bus_present(int domain, int busnr)
>> +{
>> +       struct pci_bus *bus;
>> +
>> +       rcu_read_lock();
>> +       bus = __pci_find_bus(domain, busnr);
>> +       rcu_read_unlock();
>> +
>> +       return !!bus;
>>   }
>> +EXPORT_SYMBOL(pci_bus_present);
>>
>>   /**
>>   * pci_get_slot - locate PCI device for a given PCI slot
>> diff --git a/include/linux/pci.h b/include/linux/pci.h
>> index ec8c4cf..222bc88 100644
>> --- a/include/linux/pci.h
>> +++ b/include/linux/pci.h
>> @@ -731,6 +731,11 @@ int pci_find_ht_capability(struct pci_dev *dev, int ht_cap);
>>   int pci_find_next_ht_capability(struct pci_dev *dev, int pos, int ht_cap);
>>   struct pci_bus *pci_find_next_bus(const struct pci_bus *from);
>>
>> +struct pci_bus *pci_bus_get(struct pci_bus *bus);
>> +void pci_bus_put(struct pci_bus *bus);
>> +struct pci_bus *pci_get_bus(int domain, int busnr);
>> +struct pci_bus *pci_get_next_bus(struct pci_bus *from);
>> +bool pci_bus_present(int domain, int busnr);
>>   struct pci_dev *pci_get_device(unsigned int vendor, unsigned int device,
>>                                 struct pci_dev *from);
>>   struct pci_dev *pci_get_subsys(unsigned int vendor, unsigned int device,
>> @@ -1321,6 +1326,9 @@ static inline void pci_unblock_cfg_access(struct pci_dev *dev)
>>   static inline struct pci_bus *pci_find_next_bus(const struct pci_bus *from)
>>   { return NULL; }
>>
>> +static inline struct pci_bus *pci_get_next_bus(const struct pci_bus *from)
>> +{ return NULL; }
>> +
>>   static inline struct pci_dev *pci_get_slot(struct pci_bus *bus,
>>                                                 unsigned int devfn)
>>   { return NULL; }
>> --
>> 1.7.5.4
>>
>
> .
>


--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@...r.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ