This patch makes the exchange managers (EMs) SMP-aware. XIDs are allocated
from per-CPU pools, carved out according to the number of possible CPUs in
the system.
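
To make the carving concrete, here is a minimal userspace sketch of the
scheme (illustration only, not part of the patch; NR_CPUS_EXAMPLE,
next_xid() and xid_to_cpu() are hypothetical stand-ins for
num_possible_cpus() and the in-kernel logic): CPU n owns XIDs min_xid + n,
min_xid + n + nr_cpus, and so on, so that, assuming min_xid is a multiple
of nr_cpus, the owning CPU falls out of a simple modulo on Rx.

#include <stdio.h>

#define NR_CPUS_EXAMPLE	4	/* stand-in for num_possible_cpus() */
#define MIN_XID		0x0	/* multiple of NR_CPUS_EXAMPLE */
#define MAX_XID		0xFFF

/* Tx side: next XID in a given CPU's pool (hypothetical helper). */
static unsigned int next_xid(unsigned int last_xid, unsigned int cpu)
{
	unsigned int xid = last_xid + NR_CPUS_EXAMPLE;

	if (xid > MAX_XID)	/* wrap back to this CPU's first XID */
		xid = MIN_XID + cpu;
	return xid;
}

/* Rx side: which per-CPU queue/thread should process this XID? */
static unsigned int xid_to_cpu(unsigned int xid)
{
	return xid % NR_CPUS_EXAMPLE;
}

int main(void)
{
	unsigned int cpu;

	for (cpu = 0; cpu < NR_CPUS_EXAMPLE; cpu++) {
		unsigned int xid = MIN_XID + cpu;

		printf("cpu %u owns xids %#x, %#x, %#x, ... -> rx cpu %u\n",
		       cpu, xid, next_xid(xid, cpu),
		       next_xid(next_xid(xid, cpu), cpu),
		       xid_to_cpu(xid));
	}
	return 0;
}

Any XID a CPU allocates maps back to that same CPU on Rx, which is what
keeps both sides of an exchange on one cache-warm CPU.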
The goal is to have I/O exchanges processed on one CPU to avoid cache
misses: whatever CPU is processing the READ request should also process the
READ response. To do so, this patch carves up an EM's XID space by the
number of CPUs in the system. It then checks the processor ID at allocation
time and gives out XIDs to the active CPU from that CPU's pool. On Rx there
is already a queue/thread per CPU, so this patch simply uses
(xid % num_online_cpus()) to determine which CPU/queue/thread should
process the response.

If a CPU is offlined, its resources (i.e. XIDs) are not reallocated; they
simply go unused. Also, if a CPU is offlined, our Rx handler will move the
response frame to another CPU. We take a cache miss in that case, but it is
not a concern: CPU online/offline events should be infrequent, and the
handful of frames that land on the wrong CPU should have no measurable
impact.

Signed-off-by: Robert Love <[email protected]>
---
 drivers/scsi/fcoe/fcoe.c     |    2 +-
 drivers/scsi/libfc/fc_exch.c |   77 +++++++++++++++++++++++++++++++++++++-----
 2 files changed, 69 insertions(+), 10 deletions(-)

diff --git a/drivers/scsi/fcoe/fcoe.c b/drivers/scsi/fcoe/fcoe.c
index f589a47..0001de8 100644
--- a/drivers/scsi/fcoe/fcoe.c
+++ b/drivers/scsi/fcoe/fcoe.c
@@ -991,7 +991,7 @@ int fcoe_rcv(struct sk_buff *skb, struct net_device *dev,
	 * cpu bits to get cpu and then this cpu is used for selecting
	 * a per cpu kernel thread from fcoe_percpu.
	 */
-	cpu = oxid & (num_online_cpus() - 1);
+	cpu = oxid % num_online_cpus();
 #endif

	fps = &per_cpu(fcoe_percpu, cpu);
diff --git a/drivers/scsi/libfc/fc_exch.c b/drivers/scsi/libfc/fc_exch.c
index 0664366..1670bad 100644
--- a/drivers/scsi/libfc/fc_exch.c
+++ b/drivers/scsi/libfc/fc_exch.c
@@ -69,7 +69,7 @@ struct fc_exch_mgr {
	spinlock_t	em_lock;	/* exchange manager lock,
					   must be taken before ex_lock */
	u16		em_user;	/* exchange manager user count */
-	u16		last_xid;	/* last allocated exchange ID */
+	u16		*last_xid;	/* last allocated exchange ID */
	u16		min_xid;	/* min exchange ID */
	u16		max_xid;	/* max exchange ID */
	u32		total_exches;	/* total allocated exchanges */
@@ -471,6 +471,49 @@ static struct fc_seq *fc_seq_alloc(struct fc_exch *ep, u8 seq_id)
	return sp;
 }

+static u16 fc_exch_xid_find(struct fc_exch_mgr *mp, unsigned int cpu_idx)
+{
+	int found = 0;
+	unsigned int nr_cpus = num_possible_cpus();
+	u16 xid, prev_xid;
+	prev_xid = xid = *per_cpu_ptr(mp->last_xid, cpu_idx);
+
+	while (!found) {
+		/* Wrap around or increment */
+		if (xid == FC_XID_UNKNOWN)
+			xid = mp->min_xid + cpu_idx;
+		else
+			xid = xid + nr_cpus;
+
+		/*
+		 * We've come back to the original last_xid,
+		 * so we've exhausted the list.
+		 */
+		if (xid == prev_xid) {
+			xid = FC_XID_UNKNOWN;
+			found = 1;
+			break;
+		}
+
+		/* Have we exceeded the max XIDs? */
+		if (xid > mp->max_xid) {
+			xid = FC_XID_UNKNOWN;
+			continue;
+		}
+
+		/*
+		 * We've dealt with real XIDs until now; to index
+		 * the exchange array we must subtract the min XID.
+		 */
+		if (!mp->exches[xid - mp->min_xid]) {
+			*per_cpu_ptr(mp->last_xid, cpu_idx) = xid;
+			found = 1;
+			break;
+		}
+	}
+	return xid;
+}
+
 /*
  * fc_exch_alloc - allocate an exchange and its exchange id.
  * @mp : ptr to the exchange manager
@@ -481,6 +524,7 @@ struct fc_exch *fc_exch_alloc(struct fc_exch_mgr *mp)
 {
	struct fc_exch *ep;
	u16 min, max, xid;
+	unsigned int cpu;

	/* allocate memory for exchange */
	ep = mempool_alloc(mp->ep_pool, GFP_ATOMIC);
@@ -494,14 +538,25 @@ struct fc_exch *fc_exch_alloc(struct fc_exch_mgr *mp)
	max = mp->max_xid;

	spin_lock_bh(&mp->em_lock);
-	xid = mp->last_xid;
-	/* alloc a new xid */
-	while (mp->exches[xid - min]) {
-		xid = (xid == max) ? min : xid + 1;
-		if (xid == mp->last_xid)
-			goto err;
+
+	xid = fc_exch_xid_find(mp, smp_processor_id());
+	if (xid == FC_XID_UNKNOWN) {
+		/*
+		 * It would be nice to have a more intelligent
+		 * algorithm here instead of starting with CPU 0
+		 * every time.
+		 */
+		for_each_online_cpu(cpu) {
+			if (cpu == smp_processor_id())
+				continue;
+			xid = fc_exch_xid_find(mp, cpu);
+			if (xid != FC_XID_UNKNOWN)
+				break;
+		}
	}
-	mp->last_xid = xid;
+
+	if (xid == FC_XID_UNKNOWN)
+		goto err;

	fc_exch_hold(ep);	/* hold for exch in mp */
	spin_lock_init(&ep->ex_lock);
@@ -1689,6 +1744,7 @@ struct fc_exch_mgr *fc_exch_mgr_alloc(struct fc_lport *lp,
					   u16 min_xid, u16 max_xid)
 {
	size_t len;
+	unsigned int cpu;

	/*
	 * if an existing em instance specified
@@ -1725,7 +1781,9 @@ struct fc_exch_mgr *fc_exch_mgr_alloc(struct fc_lport *lp,
	/* adjust em exch xid range for offload */
	mp->min_xid = min_xid;
	mp->max_xid = max_xid;
-	mp->last_xid = min_xid;
+	mp->last_xid = alloc_percpu(u16);
+	for_each_possible_cpu(cpu)
+		*per_cpu_ptr(mp->last_xid, cpu) = FC_XID_UNKNOWN;

	INIT_LIST_HEAD(&mp->ex_list);
	spin_lock_init(&mp->em_lock);
@@ -1760,6 +1818,7 @@ void fc_exch_mgr_free(struct fc_exch_mgr *mp)
	 * before freeing exchange manager.
	 */
	WARN_ON(mp->total_exches != 0);
+	free_percpu(mp->last_xid);
	mempool_destroy(mp->ep_pool);
	kfree(mp);
 }
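
For readers without the tree handy, this userspace sketch models the stripe
walk that fc_exch_xid_find() performs: step by nr_cpus through the calling
CPU's slice of the XID space, wrap at max_xid, and give up once the search
comes full circle. The toy_em structure, its bounds, and toy_xid_find() are
hypothetical, and the FC_XID_UNKNOWN sentinel handling is simplified
relative to the patch:

#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

#define XID_UNKNOWN	0xFFFF	/* stand-in for FC_XID_UNKNOWN */

struct toy_em {			/* hypothetical, models fc_exch_mgr */
	uint16_t min_xid, max_xid;
	unsigned int nr_cpus;
	uint16_t last_xid[8];	/* per-CPU resume points */
	bool in_use[4096];	/* occupancy, indexed by xid - min_xid */
};

static uint16_t toy_xid_find(struct toy_em *em, unsigned int cpu)
{
	uint16_t start, xid;

	if (em->min_xid + cpu > em->max_xid)	/* stripe is empty */
		return XID_UNKNOWN;

	/* Resume after the last XID handed out, or at the stripe start. */
	start = em->last_xid[cpu];
	if (start == XID_UNKNOWN)
		start = em->min_xid + cpu;
	xid = start;

	do {
		xid += em->nr_cpus;	/* next slot in this CPU's stripe */
		if (xid > em->max_xid)	/* wrap to the stripe start */
			xid = em->min_xid + cpu;
		if (!em->in_use[xid - em->min_xid]) {
			em->in_use[xid - em->min_xid] = true;
			em->last_xid[cpu] = xid;
			return xid;
		}
	} while (xid != start);		/* full circle: exhausted */

	return XID_UNKNOWN;
}

int main(void)
{
	struct toy_em em = { .min_xid = 0, .max_xid = 15, .nr_cpus = 4 };
	unsigned int i;

	for (i = 0; i < 8; i++)
		em.last_xid[i] = XID_UNKNOWN;

	/* CPU 1 owns XIDs 1, 5, 9, 13; the fifth request must fail. */
	for (i = 0; i < 5; i++)
		printf("cpu 1 got xid %#x\n", toy_xid_find(&em, 1));
	return 0;
}

Because each CPU resumes from its own last_xid, allocation stays O(1) in
the common case and only degrades to a full stripe scan when that CPU's
pool is nearly exhausted.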
