LU-2432 ptlrpc: alloc_rqbd spin on vmap_area_lock

[fs/lustre-release.git] / lustre / include / lustre_net.h
diff --git a/lustre/include/lustre_net.h b/lustre/include/lustre_net.h

index 0c00e64..fb49288 100644
--- a/lustre/include/lustre_net.h
+++ b/lustre/include/lustre_net.h
@@ -150,17 +150,17 @@
   *
   * Examples
   *
- * #define MDT_NTHRS_INIT      2
- * #define MDT_NTHRS_BASE      64
- * #define MDT_NTHRS_FACTOR    8
- * #define MDT_NTHRS_MAX       1024
+ * #define MDS_NTHRS_INIT      2
+ * #define MDS_NTHRS_BASE      64
+ * #define MDS_NTHRS_FACTOR    8
+ * #define MDS_NTHRS_MAX       1024
   *
   * Example 1):
   * ---------------------------------------------------------------------
   * Server(A) has 16 cores, user configured it to 4 partitions so each
   * partition has 4 cores, then actual number of service threads on each
   * partition is:
- *     MDT_NTHRS_BASE(64) + cores(4) * MDT_NTHRS_FACTOR(8) = 96
+ *     MDS_NTHRS_BASE(64) + cores(4) * MDS_NTHRS_FACTOR(8) = 96
   *
   * Total number of threads for the service is:
   *     96 * partitions(4) = 384
@@ -170,7 +170,7 @@
   * Server(B) has 32 cores, user configured it to 4 partitions so each
   * partition has 8 cores, then actual number of service threads on each
   * partition is:
- *     MDT_NTHRS_BASE(64) + cores(8) * MDT_NTHRS_FACTOR(8) = 128
+ *     MDS_NTHRS_BASE(64) + cores(8) * MDS_NTHRS_FACTOR(8) = 128
   *
   * Total number of threads for the service is:
   *     128 * partitions(4) = 512
@@ -180,22 +180,22 @@
   * Server(B) has 96 cores, user configured it to 8 partitions so each
   * partition has 12 cores, then actual number of service threads on each
   * partition is:
- *     MDT_NTHRS_BASE(64) + cores(12) * MDT_NTHRS_FACTOR(8) = 160
+ *     MDS_NTHRS_BASE(64) + cores(12) * MDS_NTHRS_FACTOR(8) = 160
   *
   * Total number of threads for the service is:
   *     160 * partitions(8) = 1280
   *
- * However, it's above the soft limit MDT_NTHRS_MAX, so we choose this number
+ * However, it's above the soft limit MDS_NTHRS_MAX, so we choose this number
   * as upper limit of threads number for each partition:
- *     MDT_NTHRS_MAX(1024) / partitions(8) = 128
+ *     MDS_NTHRS_MAX(1024) / partitions(8) = 128
   *
   * Example 4):
   * ---------------------------------------------------------------------
   * Server(C) have a thousand of cores and user configured it to 32 partitions
- *     MDT_NTHRS_BASE(64) * 32 = 2048
+ *     MDS_NTHRS_BASE(64) * 32 = 2048
   *
- * which is already above soft limit MDT_NTHRS_MAX(1024), but we still need
- * to guarantee that each partition has at least MDT_NTHRS_BASE(64) threads
+ * which is already above soft limit MDS_NTHRS_MAX(1024), but we still need
+ * to guarantee that each partition has at least MDS_NTHRS_BASE(64) threads
   * to keep service healthy, so total number of threads will just be 2048.
   *
   * NB: we don't suggest to choose server with that many cores because backend
@@ -252,39 +252,39 @@
    * Please see examples in "Thread Constants", MDS threads number will be at
    * the comparable level of old versions, unless the server has many cores.
    */
-#ifndef MDT_MAX_THREADS
-#define MDT_MAX_THREADS                1024
-#define MDT_MAX_OTHR_THREADS   256
-
-#else /* MDT_MAX_THREADS */
-#if MDT_MAX_THREADS < PTLRPC_NTHRS_INIT
-#undef MDT_MAX_THREADS
-#define MDT_MAX_THREADS        PTLRPC_NTHRS_INIT
+#ifndef MDS_MAX_THREADS
+#define MDS_MAX_THREADS                1024
+#define MDS_MAX_OTHR_THREADS   256
+
+#else /* MDS_MAX_THREADS */
+#if MDS_MAX_THREADS < PTLRPC_NTHRS_INIT
+#undef MDS_MAX_THREADS
+#define MDS_MAX_THREADS        PTLRPC_NTHRS_INIT
  #endif
-#define MDT_MAX_OTHR_THREADS   max(PTLRPC_NTHRS_INIT, MDT_MAX_THREADS / 2)
+#define MDS_MAX_OTHR_THREADS   max(PTLRPC_NTHRS_INIT, MDS_MAX_THREADS / 2)
  #endif
  
  /* default service */
-#define MDT_THR_FACTOR         8
-#define MDT_NTHRS_INIT         PTLRPC_NTHRS_INIT
-#define MDT_NTHRS_MAX          MDT_MAX_THREADS
-#define MDT_NTHRS_BASE         min(64, MDT_NTHRS_MAX)
+#define MDS_THR_FACTOR         8
+#define MDS_NTHRS_INIT         PTLRPC_NTHRS_INIT
+#define MDS_NTHRS_MAX          MDS_MAX_THREADS
+#define MDS_NTHRS_BASE         min(64, MDS_NTHRS_MAX)
  
  /* read-page service */
-#define MDT_RDPG_THR_FACTOR    4
-#define MDT_RDPG_NTHRS_INIT    PTLRPC_NTHRS_INIT
-#define MDT_RDPG_NTHRS_MAX     MDT_MAX_OTHR_THREADS
-#define MDT_RDPG_NTHRS_BASE    min(48, MDT_RDPG_NTHRS_MAX)
+#define MDS_RDPG_THR_FACTOR    4
+#define MDS_RDPG_NTHRS_INIT    PTLRPC_NTHRS_INIT
+#define MDS_RDPG_NTHRS_MAX     MDS_MAX_OTHR_THREADS
+#define MDS_RDPG_NTHRS_BASE    min(48, MDS_RDPG_NTHRS_MAX)
  
  /* these should be removed when we remove setattr service in the future */
-#define MDT_SETA_THR_FACTOR    4
-#define MDT_SETA_NTHRS_INIT    PTLRPC_NTHRS_INIT
-#define MDT_SETA_NTHRS_MAX     MDT_MAX_OTHR_THREADS
-#define MDT_SETA_NTHRS_BASE    min(48, MDT_SETA_NTHRS_MAX)
+#define MDS_SETA_THR_FACTOR    4
+#define MDS_SETA_NTHRS_INIT    PTLRPC_NTHRS_INIT
+#define MDS_SETA_NTHRS_MAX     MDS_MAX_OTHR_THREADS
+#define MDS_SETA_NTHRS_BASE    min(48, MDS_SETA_NTHRS_MAX)
  
  /* non-affinity threads */
-#define MDT_OTHR_NTHRS_INIT    PTLRPC_NTHRS_INIT
-#define MDT_OTHR_NTHRS_MAX     MDT_MAX_OTHR_THREADS
+#define MDS_OTHR_NTHRS_INIT    PTLRPC_NTHRS_INIT
+#define MDS_OTHR_NTHRS_MAX     MDS_MAX_OTHR_THREADS
  
  #define MDS_NBUFS              (64 * cfs_num_online_cpus())
  /**
@@ -473,7 +473,7 @@ struct ptlrpc_request_set {
          * locked so that any old caller can communicate requests to
          * the set holder who can then fold them into the lock-free set
          */
-       cfs_spinlock_t        set_new_req_lock;
+       spinlock_t              set_new_req_lock;
         /** List of new yet unsent requests. Only used with ptlrpcd now. */
         cfs_list_t            set_new_requests;
  
@@ -535,7 +535,7 @@ struct ptlrpc_reply_state {
          cfs_list_t             rs_debug_list;
  #endif
          /** A spinlock to protect the reply state flags */
-        cfs_spinlock_t         rs_lock;
+       spinlock_t              rs_lock;
          /** Reply state flags */
          unsigned long          rs_difficult:1;     /* ACK/commit stuff */
          unsigned long          rs_no_ack:1;    /* no ACK, even for
@@ -610,8 +610,8 @@ typedef int (*ptlrpc_interpterer_t)(const struct lu_env *env,
   * any allocations (to avoid e.g. OOM).
   */
  struct ptlrpc_request_pool {
-        /** Locks the list */
-        cfs_spinlock_t prp_lock;
+       /** Locks the list */
+       spinlock_t prp_lock;
          /** list of ptlrpc_request structs */
          cfs_list_t prp_req_list;
          /** Maximum message size that would fit into a rquest from this pool */
@@ -691,8 +691,8 @@ struct ptlrpc_request {
          /** Lock to protect request flags and some other important bits, like
           * rq_list
           */
-        cfs_spinlock_t rq_lock;
-        /** client-side flags are serialized by rq_lock */
+       spinlock_t rq_lock;
+       /** client-side flags are serialized by rq_lock */
         unsigned int rq_intr:1, rq_replied:1, rq_err:1,
                  rq_timedout:1, rq_resend:1, rq_restart:1,
                  /**
@@ -1109,7 +1109,7 @@ struct ptlrpc_bulk_desc {
          /** client side */
          unsigned long bd_registered:1;
          /** For serialization with callback */
-        cfs_spinlock_t bd_lock;
+       spinlock_t bd_lock;
          /** Import generation when request for this bulk was sent */
          int bd_import_generation;
          /** Server side - export this bulk created for */
@@ -1322,7 +1322,7 @@ struct ptlrpc_service_ops {
   */
  struct ptlrpc_service {
         /** serialize /proc operations */
-       cfs_spinlock_t                  srv_lock;
+       spinlock_t                      srv_lock;
          /** most often accessed fields */
          /** chain thru all services */
          cfs_list_t                      srv_list;
@@ -1421,11 +1421,13 @@ struct ptlrpc_service_part {
          * rqbd list and incoming requests waiting for preprocess,
          * threads starting & stopping are also protected by this lock.
          */
-       cfs_spinlock_t                  scp_lock  __cfs_cacheline_aligned;
+       spinlock_t                      scp_lock  __cfs_cacheline_aligned;
         /** total # req buffer descs allocated */
         int                             scp_nrqbds_total;
         /** # posted request buffers for receiving */
         int                             scp_nrqbds_posted;
+       /** rqbd allocation currently in progress */
+       int                             scp_rqbd_allocating;
         /** # incoming reqs */
         int                             scp_nreqs_incoming;
         /** request buffers to be reposted */
@@ -1457,7 +1459,7 @@ struct ptlrpc_service_part {
          * serialize the following fields, used for processing requests
          * sent to this portal
          */
-       cfs_spinlock_t                  scp_req_lock __cfs_cacheline_aligned;
+       spinlock_t                      scp_req_lock __cfs_cacheline_aligned;
         /** # reqs in either of the queues below */
         /** reqs waiting for service */
         cfs_list_t                      scp_req_pending;
@@ -1476,7 +1478,7 @@ struct ptlrpc_service_part {
          * serialize the following fields, used for changes on
          * adaptive timeout
          */
-       cfs_spinlock_t                  scp_at_lock __cfs_cacheline_aligned;
+       spinlock_t                      scp_at_lock __cfs_cacheline_aligned;
         /** estimated rpc service time */
         struct adaptive_timeout         scp_at_estimate;
         /** reqs waiting for replies */
@@ -1493,7 +1495,7 @@ struct ptlrpc_service_part {
          * serialize the following fields, used for processing
          * replies for this portal
          */
-       cfs_spinlock_t                  scp_rep_lock __cfs_cacheline_aligned;
+       spinlock_t                      scp_rep_lock __cfs_cacheline_aligned;
         /** all the active replies */
         cfs_list_t                      scp_rep_active;
  #ifndef __KERNEL__
@@ -1518,22 +1520,22 @@ struct ptlrpc_service_part {
   * Declaration of ptlrpcd control structure
   */
  struct ptlrpcd_ctl {
-        /**
-         * Ptlrpc thread control flags (LIOD_START, LIOD_STOP, LIOD_FORCE)
-         */
-        unsigned long               pc_flags;
-        /**
-         * Thread lock protecting structure fields.
-         */
-        cfs_spinlock_t              pc_lock;
-        /**
-         * Start completion.
-         */
-        cfs_completion_t            pc_starting;
-        /**
-         * Stop completion.
-         */
-        cfs_completion_t            pc_finishing;
+       /**
+        * Ptlrpc thread control flags (LIOD_START, LIOD_STOP, LIOD_FORCE)
+        */
+       unsigned long                   pc_flags;
+       /**
+        * Thread lock protecting structure fields.
+        */
+       spinlock_t                      pc_lock;
+       /**
+        * Start completion.
+        */
+       struct completion               pc_starting;
+       /**
+        * Stop completion.
+        */
+       struct completion               pc_finishing;
          /**
           * Thread requests set.
           */
@@ -1651,14 +1653,14 @@ void ptlrpc_abort_bulk(struct ptlrpc_bulk_desc *desc);
  
  static inline int ptlrpc_server_bulk_active(struct ptlrpc_bulk_desc *desc)
  {
-        int rc;
+       int rc;
  
-        LASSERT(desc != NULL);
+       LASSERT(desc != NULL);
  
-        cfs_spin_lock(&desc->bd_lock);
-        rc = desc->bd_network_rw;
-        cfs_spin_unlock(&desc->bd_lock);
-        return rc;
+       spin_lock(&desc->bd_lock);
+       rc = desc->bd_network_rw;
+       spin_unlock(&desc->bd_lock);
+       return rc;
  }
  #endif
  
@@ -1679,10 +1681,10 @@ static inline int ptlrpc_client_bulk_active(struct ptlrpc_request *req)
          if (!desc)
                  return 0;
  
-        cfs_spin_lock(&desc->bd_lock);
-        rc = desc->bd_network_rw;
-        cfs_spin_unlock(&desc->bd_lock);
-        return rc;
+       spin_lock(&desc->bd_lock);
+       rc = desc->bd_network_rw;
+       spin_unlock(&desc->bd_lock);
+       return rc;
  }
  
  #define PTLRPC_REPLY_MAYBE_DIFFICULT 0x01
@@ -2080,17 +2082,17 @@ ptlrpc_client_recv(struct ptlrpc_request *req)
  static inline int
  ptlrpc_client_recv_or_unlink(struct ptlrpc_request *req)
  {
-        int rc;
-
-        cfs_spin_lock(&req->rq_lock);
-        if (OBD_FAIL_CHECK(OBD_FAIL_PTLRPC_LONG_REPL_UNLINK) &&
-            req->rq_reply_deadline > cfs_time_current_sec()) {
-                cfs_spin_unlock(&req->rq_lock);
-                return 1;
-        }
-        rc = req->rq_receiving_reply || req->rq_must_unlink;
-        cfs_spin_unlock(&req->rq_lock);
-        return rc;
+       int rc;
+
+       spin_lock(&req->rq_lock);
+       if (OBD_FAIL_CHECK(OBD_FAIL_PTLRPC_LONG_REPL_UNLINK) &&
+           req->rq_reply_deadline > cfs_time_current_sec()) {
+               spin_unlock(&req->rq_lock);
+               return 1;
+       }
+       rc = req->rq_receiving_reply || req->rq_must_unlink;
+       spin_unlock(&req->rq_lock);
+       return rc;
  }
  
  static inline void
@@ -2157,12 +2159,12 @@ static inline int ptlrpc_send_limit_expired(struct ptlrpc_request *req)
  
  static inline int ptlrpc_no_resend(struct ptlrpc_request *req)
  {
-        if (!req->rq_no_resend && ptlrpc_send_limit_expired(req)) {
-                cfs_spin_lock(&req->rq_lock);
-                req->rq_no_resend = 1;
-                cfs_spin_unlock(&req->rq_lock);
-        }
-        return req->rq_no_resend;
+       if (!req->rq_no_resend && ptlrpc_send_limit_expired(req)) {
+               spin_lock(&req->rq_lock);
+               req->rq_no_resend = 1;
+               spin_unlock(&req->rq_lock);
+       }
+       return req->rq_no_resend;
  }
  
  static inline int