Whamcloud - gitweb
LU-17197 obdclass: preserve fairness when waiting for rpc slot 32/53232/3
author Shaun Tancheff <shaun.tancheff@hpe.com>
Wed, 18 Oct 2023 03:54:59 +0000 (22:54 -0500)
committer Oleg Drokin <green@whamcloud.com>
Sun, 16 Jun 2024 03:35:01 +0000 (03:35 +0000)
When obd_get_mod_rpc_slot() waits for an available slot it places the
waiting thread at the HEAD of the queue, so it will be woken before
anything else that is already queued.  This is clearly unfair and can
hurt performance.

So change to always add to the tail to ensure a FIFO ordering (except
that CLOSE might sometimes be woken a bit early).

This regression was introduced in a rewrite that was supposed to make
waiting more fair - by avoiding a broadcast wakeup for "close"
requests.

Also fix some stale comments, and expose __add_wait_queue_entry_tail in
linux-wait.h (it was previously private to linux-wait.c) so that
genops.c can use it.

Running mdtest with the patch applied shows about a 3% improvement:

                             master            patched
  mdtest-easy-write      350.585906 kIOPS   353.783545 kIOPS
   mdtest-easy-stat     1320.329353 kIOPS  1408.320419 kIOPS
 mdtest-easy-delete      285.084103 kIOPS   289.625900 kIOPS
            [SCORE]      509.115803 kiops   524.516113 kiops

Lustre-change: https://review.whamcloud.com/52738
Lustre-commit: b5fde4d6c02324a8511afe30d02eb2cf46ea799d

Fixes: 5243630b09d2 ("LU-15947 obdclass: improve precision of wakeups for mod_rpcs")
Signed-off-by: Mr NeilBrown <neilb@suse.de>
Signed-off-by: Shaun Tancheff <shaun.tancheff@hpe.com>
Change-Id: If767c4299bcbab71589b0f3c01e85bf461686ca5
Reviewed-by: James Simmons <jsimmons@infradead.org>
Reviewed-by: Andreas Dilger <adilger@whamcloud.com>
Signed-off-by: Etienne AUJAMES <eaujames@ddn.com>
Reviewed-on: https://review.whamcloud.com/c/fs/lustre-release/+/53232
Reviewed-by: Oleg Drokin <green@whamcloud.com>
Tested-by: jenkins <devops@whamcloud.com>
Tested-by: Maloo <maloo@whamcloud.com>
libcfs/include/libcfs/linux/linux-wait.h
libcfs/libcfs/linux/linux-wait.c
lustre/obdclass/genops.c

index aa257fc..b54370f 100644 (file)
 #define wait_queue_entry_t wait_queue_t
 #endif
 
+#ifndef HAVE_PREPARE_TO_WAIT_EVENT
+#define __add_wait_queue_entry_tail __add_wait_queue_tail
+#endif
+
 #ifndef HAVE_WAIT_BIT_HEADER_H
 struct wait_bit_queue_entry {
        struct wait_bit_key     key;
index 33117c2..bedd5bb 100644 (file)
@@ -10,8 +10,6 @@
 
 #ifndef HAVE_PREPARE_TO_WAIT_EVENT
 
-#define __add_wait_queue_entry_tail __add_wait_queue_tail
-
 long prepare_to_wait_event(wait_queue_head_t *wq_head,
                           wait_queue_entry_t *wq_entry, int state)
 {
index 90088dc..b753098 100644 (file)
@@ -2304,9 +2304,9 @@ __u16 obd_get_mod_rpc_slot(struct client_obd *cli, __u32 opc)
        wait.wqe.func = claim_mod_rpc_function;
 
        spin_lock_irq(&cli->cl_mod_rpcs_waitq.lock);
-       __add_wait_queue(&cli->cl_mod_rpcs_waitq, &wait.wqe);
+       __add_wait_queue_entry_tail(&cli->cl_mod_rpcs_waitq, &wait.wqe);
        /* This wakeup will only succeed if the maximums haven't
-        * been reached.  If that happens, WQ_FLAG_WOKEN will be cleared
+        * been reached.  If that happens, wait.woken will be set
         * and there will be no need to wait.
         * If a close_req was enqueue, ensure we search all the way to the
         * end of the waitqueue for a close request.
@@ -2314,7 +2314,6 @@ __u16 obd_get_mod_rpc_slot(struct client_obd *cli, __u32 opc)
        __wake_up_locked_key(&cli->cl_mod_rpcs_waitq, TASK_NORMAL,
                             (void*)wait.close_req);
 
-       /* XXX: handle spurious wakeups (from unknown yet source */
        while (wait.woken == false) {
                spin_unlock_irq(&cli->cl_mod_rpcs_waitq.lock);
                wait_woken(&wait.wqe, TASK_UNINTERRUPTIBLE,