LU-874 ldlm: prioritize LDLM_CANCEL requests

[fs/lustre-release.git] / lustre / ldlm / ldlm_lockd.c
diff --git a/lustre/ldlm/ldlm_lockd.c b/lustre/ldlm/ldlm_lockd.c

index 1b80090..d77a893 100644 (file)
--- a/lustre/ldlm/ldlm_lockd.c
+++ b/lustre/ldlm/ldlm_lockd.c
@@ -279,7 +279,7 @@ static int ldlm_lock_busy(struct ldlm_lock *lock)
  /* This is called from within a timer interrupt and cannot schedule */
  static void waiting_locks_callback(unsigned long unused)
  {
-        struct ldlm_lock *lock, *last = NULL;
+        struct ldlm_lock *lock;
  
  repeat:
          cfs_spin_lock_bh(&waiting_locks_spinlock);
@@ -355,8 +355,6 @@ repeat:
                             libcfs_nid2str(
                                     lock->l_export->exp_connection->c_peer.nid));
  
-                last = lock;
-
                  /* no needs to take an extra ref on the lock since it was in
                   * the waiting_locks_list and ldlm_add_waiting_lock()
                   * already grabbed a ref */
@@ -652,7 +650,6 @@ static int ldlm_cb_interpret(const struct lu_env *env,
          struct ldlm_cb_async_args *ca   = data;
          struct ldlm_lock          *lock = ca->ca_lock;
          struct ldlm_cb_set_arg    *arg  = ca->ca_set_arg;
-        struct ptlrpc_request_set *set  = arg->set;
          ENTRY;
  
          LASSERT(lock != NULL);
@@ -665,7 +662,8 @@ static int ldlm_cb_interpret(const struct lu_env *env,
          }
          LDLM_LOCK_RELEASE(lock);
  
-        cfs_waitq_signal(&set->set_waitq);
+        if (cfs_atomic_dec_return(&arg->rpcs) < arg->threshold)
+                cfs_waitq_signal(&arg->waitq);
          RETURN(0);
  }
  
@@ -684,8 +682,8 @@ static inline int ldlm_bl_and_cp_ast_tail(struct ptlrpc_request *req,
                          cfs_atomic_inc(&arg->restart);
          } else {
                  LDLM_LOCK_GET(lock);
-                ptlrpc_set_add_req(arg->set, req);
-                ++arg->rpcs;
+                ptlrpcd_add_req(req, PDL_POLICY_ROUND, -1);
+                cfs_atomic_inc(&arg->rpcs);
          }
  
          RETURN(rc);
@@ -708,7 +706,11 @@ static void ldlm_lock_reorder_req(struct ldlm_lock *lock)
          cfs_spin_lock_bh(&lock->l_export->exp_rpc_lock);
          cfs_list_for_each_entry(req, &lock->l_export->exp_queued_rpc,
                                  rq_exp_list) {
-                if (!req->rq_hp && req->rq_ops->hpreq_lock_match &&
+                /* Do not process requests that were not yet added to there
+                 * incoming queue or were already removed from there for
+                 * processing */
+                if (!req->rq_hp && !cfs_list_empty(&req->rq_list) &&
+                    req->rq_ops->hpreq_lock_match &&
                      req->rq_ops->hpreq_lock_match(req, lock))
                          ptlrpc_hpreq_reorder(req);
          }
@@ -2097,6 +2099,90 @@ static int ldlm_cancel_handler(struct ptlrpc_request *req)
          RETURN(0);
  }
  
+static int ldlm_cancel_hpreq_lock_match(struct ptlrpc_request *req,
+                                        struct ldlm_lock *lock)
+{
+        struct ldlm_request *dlm_req;
+        struct lustre_handle lockh;
+        int rc = 0;
+        int i;
+        ENTRY;
+
+        dlm_req = req_capsule_client_get(&req->rq_pill, &RMF_DLM_REQ);
+        if (dlm_req == NULL)
+                RETURN(0);
+
+        ldlm_lock2handle(lock, &lockh);
+        for (i = 0; i < dlm_req->lock_count; i++) {
+                if (lustre_handle_equal(&dlm_req->lock_handle[i],
+                                        &lockh)) {
+                        DEBUG_REQ(D_RPCTRACE, req,
+                                  "Prio raised by lock "LPX64".", lockh.cookie);
+
+                        rc = 1;
+                        break;
+                }
+        }
+
+        RETURN(rc);
+
+}
+
+static int ldlm_cancel_hpreq_check(struct ptlrpc_request *req)
+{
+        struct ldlm_request *dlm_req;
+        int rc = 0;
+        int i;
+        ENTRY;
+
+        /* no prolong in recovery */
+        if (lustre_msg_get_flags(req->rq_reqmsg) & MSG_REPLAY)
+                RETURN(0);
+
+        dlm_req = req_capsule_client_get(&req->rq_pill, &RMF_DLM_REQ);
+        if (dlm_req == NULL)
+                RETURN(-EFAULT);
+
+        for (i = 0; i < dlm_req->lock_count; i++) {
+                struct ldlm_lock *lock;
+
+                lock = ldlm_handle2lock(&dlm_req->lock_handle[i]);
+                if (lock == NULL)
+                        continue;
+
+                rc = !!(lock->l_flags & LDLM_FL_AST_SENT);
+                if (rc)
+                        LDLM_DEBUG(lock, "hpreq cancel lock");
+                LDLM_LOCK_PUT(lock);
+
+                if (rc)
+                        break;
+        }
+
+        RETURN(rc);
+}
+
+static struct ptlrpc_hpreq_ops ldlm_cancel_hpreq_ops = {
+        .hpreq_lock_match = ldlm_cancel_hpreq_lock_match,
+        .hpreq_check      = ldlm_cancel_hpreq_check
+};
+
+static int ldlm_hpreq_handler(struct ptlrpc_request *req)
+{
+        ENTRY;
+
+        req_capsule_init(&req->rq_pill, req, RCL_SERVER);
+
+        if (req->rq_export == NULL)
+                RETURN(0);
+
+        if (LDLM_CANCEL == lustre_msg_get_opc(req->rq_reqmsg)) {
+                req_capsule_set(&req->rq_pill, &RQF_LDLM_CANCEL);
+                req->rq_ops = &ldlm_cancel_hpreq_ops;
+        }
+        RETURN(0);
+}
+
  int ldlm_revoke_lock_cb(cfs_hash_t *hs, cfs_hash_bd_t *bd,
                          cfs_hlist_node_t *hnode, void *data)
  
@@ -2232,33 +2318,31 @@ static int ldlm_bl_thread_main(void *arg)
          while (1) {
                  struct l_wait_info lwi = { 0 };
                  struct ldlm_bl_work_item *blwi = NULL;
+                int busy;
  
                  blwi = ldlm_bl_get_work(blp);
  
                  if (blwi == NULL) {
-                        int busy;
-
                          cfs_atomic_dec(&blp->blp_busy_threads);
                          l_wait_event_exclusive(blp->blp_waitq,
                                           (blwi = ldlm_bl_get_work(blp)) != NULL,
                                           &lwi);
                          busy = cfs_atomic_inc_return(&blp->blp_busy_threads);
-
-                        if (blwi->blwi_ns == NULL)
-                                /* added by ldlm_cleanup() */
-                                break;
-
-                        /* Not fatal if racy and have a few too many threads */
-                        if (unlikely(busy < blp->blp_max_threads &&
-                            busy >= cfs_atomic_read(&blp->blp_num_threads) &&
-                            !blwi->blwi_mem_pressure))
-                                /* discard the return value, we tried */
-                                ldlm_bl_thread_start(blp);
                  } else {
-                        if (blwi->blwi_ns == NULL)
-                                /* added by ldlm_cleanup() */
-                                break;
+                        busy = cfs_atomic_read(&blp->blp_busy_threads);
                  }
+
+                if (blwi->blwi_ns == NULL)
+                        /* added by ldlm_cleanup() */
+                        break;
+
+                /* Not fatal if racy and have a few too many threads */
+                if (unlikely(busy < blp->blp_max_threads &&
+                             busy >= cfs_atomic_read(&blp->blp_num_threads) &&
+                             !blwi->blwi_mem_pressure))
+                        /* discard the return value, we tried */
+                        ldlm_bl_thread_start(blp);
+
                  if (blwi->blwi_mem_pressure)
                          cfs_memory_pressure_set();
  
@@ -2486,7 +2570,7 @@ static int ldlm_setup(void)
                                  ldlm_min_threads, ldlm_max_threads,
                                  "ldlm_cn",
                                  LCT_MD_THREAD|LCT_DT_THREAD|LCT_CL_THREAD,
-                                NULL);
+                                ldlm_hpreq_handler);
  
          if (!ldlm_state->ldlm_cancel_service) {
                  CERROR("failed to start service\n");
@@ -2616,7 +2700,7 @@ static int ldlm_cleanup(void)
          RETURN(0);
  }
  
-int __init ldlm_init(void)
+int ldlm_init(void)
  {
          cfs_init_mutex(&ldlm_ref_sem);
          cfs_init_mutex(ldlm_namespace_lock(LDLM_NAMESPACE_SERVER));
@@ -2649,7 +2733,7 @@ int __init ldlm_init(void)
          return 0;
  }
  
-void __exit ldlm_exit(void)
+void ldlm_exit(void)
  {
          int rc;
          if (ldlm_refcount)