LU-13569 lnet: Recover peer NI w/exponential backoff interval

author Chris Horn <chris.horn@hpe.com>

Sun, 23 Aug 2020 15:16:18 +0000 (10:16 -0500)

committer Oleg Drokin <green@whamcloud.com>

Tue, 30 Mar 2021 04:16:05 +0000 (04:16 +0000)
author Chris Horn <chris.horn@hpe.com>
Sun, 23 Aug 2020 15:16:18 +0000 (10:16 -0500)
committer Oleg Drokin <green@whamcloud.com>
Tue, 30 Mar 2021 04:16:05 +0000 (04:16 +0000)
diff --git a/lnet/include/lnet/lib-lnet.h b/lnet/include/lnet/lib-lnet.h

index bb5eed0..1358f6f 100644 (file)
--- a/lnet/include/lnet/lib-lnet.h
+++ b/lnet/include/lnet/lib-lnet.h
@@ -986,6 +986,28 @@ lnet_peer_needs_push(struct lnet_peer *lp)
         return false;
  }
  
+/* Upper bound on the delay between recovery pings (presumably seconds,
+ * matching the time64_t timestamps it is added to -- confirm with callers).
+ */
+#define LNET_RECOVERY_INTERVAL_MAX 900
+
+/*
+ * Compute the time at which the next recovery ping should be sent.
+ *
+ * The delay doubles with each increment of \a ping_count
+ * (1 << ping_count) and is replaced by LNET_RECOVERY_INTERVAL_MAX once
+ * ping_count exceeds 9.
+ *
+ * \param ping_count  ping counter used as the exponent of the delay
+ * \param now         current time; the result is expressed on the same clock
+ *
+ * \retval now + delay. Returned as time64_t so the timestamp is not
+ *         truncated to 32 bits before the caller stores it.
+ */
+static inline time64_t
+lnet_get_next_recovery_ping(unsigned int ping_count, time64_t now)
+{
+       unsigned int interval;
+
+       /* 2^9 = 512 is the largest power of two below the 900 cap;
+        * 2^10 = 1024 would already exceed it.
+        */
+       if (ping_count > 9)
+               interval = LNET_RECOVERY_INTERVAL_MAX;
+       else
+               interval = 1U << ping_count;
+
+       return now + interval;
+}
+
+/*
+ * Record in lpni->lpni_next_ping when the next recovery ping for this peer NI
+ * is due, derived from its current lpni_ping_count and the supplied time.
+ *
+ * \param lpni  peer NI whose next-ping time is updated
+ * \param now   current time, passed through to lnet_get_next_recovery_ping()
+ */
+static inline void
+lnet_peer_ni_set_next_ping(struct lnet_peer_ni *lpni, time64_t now)
+{
+       time64_t next_ping;
+
+       next_ping = lnet_get_next_recovery_ping(lpni->lpni_ping_count, now);
+       lpni->lpni_next_ping = next_ping;
+}
+
  /*
   * A peer NI is alive if it satisfies the following two conditions:
   *  1. peer NI health >= LNET_MAX_HEALTH_VALUE * router_sensitivity_percentage
diff --git a/lnet/include/lnet/lib-types.h b/lnet/include/lnet/lib-types.h

index 2bf7039..010cf32 100644 (file)
--- a/lnet/include/lnet/lib-types.h
+++ b/lnet/include/lnet/lib-types.h
@@ -586,6 +586,12 @@ struct lnet_peer_ni {
         atomic_t                lpni_healthv;
         /* recovery ping mdh */
         struct lnet_handle_md   lpni_recovery_ping_mdh;
+       /* When to send the next recovery ping */
+       time64_t                lpni_next_ping;
+       /* How many pings sent during current recovery period did not receive
+        * a reply. NB: reset whenever _any_ message arrives from this peer NI
+        */
+       unsigned int            lpni_ping_count;
         /* CPT this peer attached on */
         int                     lpni_cpt;
         /* state flags -- protected by lpni_lock */
diff --git a/lnet/lnet/lib-move.c b/lnet/lnet/lib-move.c

index 5987b1b..0cc7767 100644 (file)
--- a/lnet/lnet/lib-move.c
+++ b/lnet/lnet/lib-move.c
@@ -3653,6 +3653,12 @@ lnet_recover_peer_nis(void)
                 }
  
                 spin_unlock(&lpni->lpni_lock);
+
+               if (now < lpni->lpni_next_ping) {
+                       lnet_net_unlock(0);
+                       continue;
+               }
+
                 lnet_net_unlock(0);
  
                 /*
@@ -3702,6 +3708,8 @@ lnet_recover_peer_nis(void)
                                 continue;
                         }
  
+                       lpni->lpni_ping_count++;
+
                         lpni->lpni_recovery_ping_mdh = mdh;
  
                         lnet_peer_ni_add_to_recoveryq_locked(lpni,
diff --git a/lnet/lnet/lib-msg.c b/lnet/lnet/lib-msg.c

index 94f2a78..3015fd8 100644 (file)
--- a/lnet/lnet/lib-msg.c
+++ b/lnet/lnet/lib-msg.c
@@ -867,8 +867,11 @@ lnet_health_check(struct lnet_msg *msg)
         switch (hstatus) {
         case LNET_MSG_STATUS_OK:
                 /*
-                * increment the local ni health weather we successfully
+                * increment the local ni health whether we successfully
                  * received or sent a message on it.
+                *
+                * Ping counts are reset to 0 as appropriate to allow for
+                * faster recovery.
                  */
                 lnet_inc_healthv(&ni->ni_healthv, lnet_health_sensitivity);
                 /*
@@ -880,6 +883,7 @@ lnet_health_check(struct lnet_msg *msg)
                  * as indication that the router is fully healthy.
                  */
                 if (lpni && msg->msg_rx_committed) {
+                       lpni->lpni_ping_count = 0;
                         /*
                          * If we're receiving a message from the router or
                          * I'm a router, then set that lpni's health to
diff --git a/lnet/lnet/peer.c b/lnet/lnet/peer.c

index 903bf78..04765cf 100644 (file)
--- a/lnet/lnet/peer.c
+++ b/lnet/lnet/peer.c
@@ -4029,14 +4029,22 @@ lnet_peer_ni_add_to_recoveryq_locked(struct lnet_peer_ni *lpni,
                 CDEBUG(D_NET, "lpni %s aged out last alive %lld\n",
                        libcfs_nid2str(lpni->lpni_nid),
                        lpni->lpni_last_alive);
+               /* Reset the ping count so that if this peer NI is added back to
+                * the recovery queue we will send the first ping right away.
+                */
+               lpni->lpni_ping_count = 0;
                 return;
         }
  
         /* This peer NI is going on the recovery queue, so take a ref on it */
         lnet_peer_ni_addref_locked(lpni);
  
-       CDEBUG(D_NET, "%s added to recovery queue. last alive: %lld health: %d\n",
+       lnet_peer_ni_set_next_ping(lpni, now);
+
+       CDEBUG(D_NET, "%s added to recovery queue. ping count: %u next ping: %lld last alive: %lld health: %d\n",
                libcfs_nid2str(lpni->lpni_nid),
+              lpni->lpni_ping_count,
+              lpni->lpni_next_ping,
                lpni->lpni_last_alive,
                atomic_read(&lpni->lpni_healthv));
author	Chris Horn <chris.horn@hpe.com>
	Sun, 23 Aug 2020 15:16:18 +0000 (10:16 -0500)
committer	Oleg Drokin <green@whamcloud.com>
	Tue, 30 Mar 2021 04:16:05 +0000 (04:16 +0000)
lnet/include/lnet/lib-lnet.h		patch \| blob \| history
lnet/include/lnet/lib-types.h		patch \| blob \| history
lnet/lnet/lib-move.c		patch \| blob \| history
lnet/lnet/lib-msg.c		patch \| blob \| history
lnet/lnet/peer.c		patch \| blob \| history