Whamcloud - gitweb
LU-10391 socklnd: don't deref lnet_hdr in LNDs
[fs/lustre-release.git] / lnet / klnds / socklnd / socklnd_cb.c
index 1ba4f14..3ad0eee 100644 (file)
@@ -39,9 +39,9 @@ ksocknal_alloc_tx(int type, int size)
                /* searching for a noop tx in free list */
                spin_lock(&ksocknal_data.ksnd_tx_lock);
 
-               if (!list_empty(&ksocknal_data.ksnd_idle_noop_txs)) {
-                       tx = list_entry(ksocknal_data.ksnd_idle_noop_txs.next,
-                                       struct ksock_tx, tx_list);
+               tx = list_first_entry_or_null(&ksocknal_data.ksnd_idle_noop_txs,
+                                             struct ksock_tx, tx_list);
+               if (tx) {
                        LASSERT(tx->tx_desc_size == size);
                        list_del(&tx->tx_list);
                }
@@ -423,15 +423,14 @@ ksocknal_txlist_done(struct lnet_ni *ni, struct list_head *txlist, int error)
 {
        struct ksock_tx *tx;
 
-       while (!list_empty(txlist)) {
-               tx = list_entry(txlist->next, struct ksock_tx, tx_list);
-
-               if (error && tx->tx_lnetmsg != NULL) {
+       while ((tx = list_first_entry_or_null(txlist, struct ksock_tx,
+                                             tx_list)) != NULL) {
+               if (error && tx->tx_lnetmsg) {
                        CNETERR("Deleting packet type %d len %d %s->%s\n",
-                               le32_to_cpu(tx->tx_lnetmsg->msg_hdr.type),
-                               le32_to_cpu(tx->tx_lnetmsg->msg_hdr.payload_length),
-                               libcfs_nid2str(le64_to_cpu(tx->tx_lnetmsg->msg_hdr.src_nid)),
-                               libcfs_nid2str(le64_to_cpu(tx->tx_lnetmsg->msg_hdr.dest_nid)));
+                               tx->tx_lnetmsg->msg_type,
+                               tx->tx_lnetmsg->msg_len,
+                               libcfs_nidstr(&tx->tx_lnetmsg->msg_initiator),
+                               libcfs_nidstr(&tx->tx_lnetmsg->msg_target.nid));
                } else if (error) {
                        CNETERR("Deleting noop packet\n");
                }
@@ -618,7 +617,7 @@ simulate_error:
                        break;
                }
                CDEBUG(D_NET, "[%p] Error %d on write to %s ip %pISp\n",
-                      conn, rc, libcfs_id2str(conn->ksnc_peer->ksnp_id),
+                      conn, rc, libcfs_idstr(&conn->ksnc_peer->ksnp_id),
                       &conn->ksnc_peeraddr);
        }
 
@@ -633,22 +632,24 @@ simulate_error:
 }
 
 static void
-ksocknal_launch_connection_locked(struct ksock_route *route)
+ksocknal_launch_connection_locked(struct ksock_conn_cb *conn_cb)
 {
+       /* called holding write lock on ksnd_global_lock */
 
-        /* called holding write lock on ksnd_global_lock */
+       LASSERT(!conn_cb->ksnr_scheduled);
+       LASSERT(!conn_cb->ksnr_connecting);
+       LASSERT((ksocknal_conn_cb_mask() & ~conn_cb->ksnr_connected) != 0);
 
-        LASSERT (!route->ksnr_scheduled);
-        LASSERT (!route->ksnr_connecting);
-        LASSERT ((ksocknal_route_mask() & ~route->ksnr_connected) != 0);
+       /* scheduling conn for connd */
+       conn_cb->ksnr_scheduled = 1;
 
-        route->ksnr_scheduled = 1;              /* scheduling conn for connd */
-        ksocknal_route_addref(route);           /* extra ref for connd */
+       /* extra ref for connd */
+       ksocknal_conn_cb_addref(conn_cb);
 
        spin_lock_bh(&ksocknal_data.ksnd_connd_lock);
 
-       list_add_tail(&route->ksnr_connd_list,
-                         &ksocknal_data.ksnd_connd_routes);
+       list_add_tail(&conn_cb->ksnr_connd_list,
+                     &ksocknal_data.ksnd_connd_routes);
        wake_up(&ksocknal_data.ksnd_connd_waitq);
 
        spin_unlock_bh(&ksocknal_data.ksnd_connd_lock);
@@ -657,32 +658,30 @@ ksocknal_launch_connection_locked(struct ksock_route *route)
 void
 ksocknal_launch_all_connections_locked(struct ksock_peer_ni *peer_ni)
 {
-       struct ksock_route *route;
+       struct ksock_conn_cb *conn_cb;
 
-        /* called holding write lock on ksnd_global_lock */
-        for (;;) {
-                /* launch any/all connections that need it */
-                route = ksocknal_find_connectable_route_locked(peer_ni);
-                if (route == NULL)
-                        return;
+       /* called holding write lock on ksnd_global_lock */
+       for (;;) {
+               /* launch any/all connections that need it */
+               conn_cb = ksocknal_find_connectable_conn_cb_locked(peer_ni);
+               if (conn_cb == NULL)
+                       return;
 
-                ksocknal_launch_connection_locked(route);
-        }
+               ksocknal_launch_connection_locked(conn_cb);
+       }
 }
 
 struct ksock_conn *
 ksocknal_find_conn_locked(struct ksock_peer_ni *peer_ni, struct ksock_tx *tx, int nonblk)
 {
-       struct list_head *tmp;
+       struct ksock_conn *c;
        struct ksock_conn *conn;
        struct ksock_conn *typed = NULL;
        struct ksock_conn *fallback = NULL;
        int tnob = 0;
        int fnob = 0;
 
-       list_for_each(tmp, &peer_ni->ksnp_conns) {
-               struct ksock_conn *c = list_entry(tmp, struct ksock_conn,
-                                                 ksnc_list);
+       list_for_each_entry(c, &peer_ni->ksnp_conns, ksnc_list) {
                int nob = atomic_read(&c->ksnc_tx_nob) +
                          c->ksnc_sock->sk->sk_wmem_queued;
                int rc;
@@ -753,7 +752,7 @@ ksocknal_queue_tx_locked(struct ksock_tx *tx, struct ksock_conn *conn)
         LASSERT(!conn->ksnc_closing);
 
        CDEBUG(D_NET, "Sending to %s ip %pISp\n",
-              libcfs_id2str(conn->ksnc_peer->ksnp_id),
+              libcfs_idstr(&conn->ksnc_peer->ksnp_id),
               &conn->ksnc_peeraddr);
 
         ksocknal_tx_prep(conn, tx);
@@ -771,10 +770,9 @@ ksocknal_queue_tx_locked(struct ksock_tx *tx, struct ksock_conn *conn)
        LASSERT(tx->tx_niov >= 1);
        LASSERT(tx->tx_resid == tx->tx_nob);
 
-        CDEBUG (D_NET, "Packet %p type %d, nob %d niov %d nkiov %d\n",
-                tx, (tx->tx_lnetmsg != NULL) ? tx->tx_lnetmsg->msg_hdr.type:
-                                               KSOCK_MSG_NOOP,
-                tx->tx_nob, tx->tx_niov, tx->tx_nkiov);
+       CDEBUG(D_NET, "Packet %p type %d, nob %d niov %d nkiov %d\n",
+              tx, tx->tx_lnetmsg ? tx->tx_lnetmsg->msg_type : KSOCK_MSG_NOOP,
+              tx->tx_nob, tx->tx_niov, tx->tx_nkiov);
 
        bufnob = conn->ksnc_sock->sk->sk_wmem_queued;
        spin_lock_bh(&sched->kss_lock);
@@ -827,122 +825,125 @@ ksocknal_queue_tx_locked(struct ksock_tx *tx, struct ksock_conn *conn)
 }
 
 
-struct ksock_route *
-ksocknal_find_connectable_route_locked(struct ksock_peer_ni *peer_ni)
+struct ksock_conn_cb *
+ksocknal_find_connectable_conn_cb_locked(struct ksock_peer_ni *peer_ni)
 {
        time64_t now = ktime_get_seconds();
-       struct list_head *tmp;
-       struct ksock_route *route;
-
-       list_for_each(tmp, &peer_ni->ksnp_routes) {
-               route = list_entry(tmp, struct ksock_route, ksnr_list);
+       struct ksock_conn_cb *conn_cb;
 
-                LASSERT (!route->ksnr_connecting || route->ksnr_scheduled);
+       conn_cb = peer_ni->ksnp_conn_cb;
+       if (!conn_cb)
+               return NULL;
 
-                if (route->ksnr_scheduled)      /* connections being established */
-                        continue;
+       LASSERT(!conn_cb->ksnr_connecting || conn_cb->ksnr_scheduled);
 
-                /* all route types connected ? */
-                if ((ksocknal_route_mask() & ~route->ksnr_connected) == 0)
-                        continue;
+       if (conn_cb->ksnr_scheduled)    /* connections being established */
+               return NULL;
 
-               if (!(route->ksnr_retry_interval == 0 || /* first attempt */
-                     now >= route->ksnr_timeout)) {
-                       CDEBUG(D_NET,
-                              "Too soon to retry route %pIS (cnted %d, interval %lld, %lld secs later)\n",
-                              &route->ksnr_addr,
-                              route->ksnr_connected,
-                              route->ksnr_retry_interval,
-                              route->ksnr_timeout - now);
-                       continue;
-               }
+       /* all conn types connected ? */
+       if ((ksocknal_conn_cb_mask() & ~conn_cb->ksnr_connected) == 0)
+               return NULL;
 
-                return (route);
-        }
+       if (!(conn_cb->ksnr_retry_interval == 0 || /* first attempt */
+             now >= conn_cb->ksnr_timeout)) {
+               CDEBUG(D_NET,
+                      "Too soon to retry route %pIS (cnted %d, interval %lld, %lld secs later)\n",
+                      &conn_cb->ksnr_addr,
+                      conn_cb->ksnr_connected,
+                      conn_cb->ksnr_retry_interval,
+                      conn_cb->ksnr_timeout - now);
+               return NULL;
+       }
 
-        return (NULL);
+       return conn_cb;
 }
 
-struct ksock_route *
-ksocknal_find_connecting_route_locked(struct ksock_peer_ni *peer_ni)
+struct ksock_conn_cb *
+ksocknal_find_connecting_conn_cb_locked(struct ksock_peer_ni *peer_ni)
 {
-       struct list_head *tmp;
-       struct ksock_route *route;
-
-       list_for_each(tmp, &peer_ni->ksnp_routes) {
-               route = list_entry(tmp, struct ksock_route, ksnr_list);
+       struct ksock_conn_cb *conn_cb;
 
-                LASSERT (!route->ksnr_connecting || route->ksnr_scheduled);
+       conn_cb = peer_ni->ksnp_conn_cb;
+       if (!conn_cb)
+               return NULL;
 
-                if (route->ksnr_scheduled)
-                        return (route);
-        }
+       LASSERT(!conn_cb->ksnr_connecting || conn_cb->ksnr_scheduled);
 
-        return (NULL);
+       return conn_cb->ksnr_scheduled ? conn_cb : NULL;
 }
 
 int
 ksocknal_launch_packet(struct lnet_ni *ni, struct ksock_tx *tx,
-                      struct lnet_process_id id)
+                      struct lnet_processid *id)
 {
        struct ksock_peer_ni *peer_ni;
        struct ksock_conn *conn;
+       struct sockaddr_in sa;
        rwlock_t *g_lock;
        int retry;
        int rc;
 
-        LASSERT (tx->tx_conn == NULL);
+       LASSERT(tx->tx_conn == NULL);
 
-        g_lock = &ksocknal_data.ksnd_global_lock;
+       g_lock = &ksocknal_data.ksnd_global_lock;
 
-        for (retry = 0;; retry = 1) {
+       for (retry = 0;; retry = 1) {
                read_lock(g_lock);
-                peer_ni = ksocknal_find_peer_locked(ni, id);
-                if (peer_ni != NULL) {
-                        if (ksocknal_find_connectable_route_locked(peer_ni) == NULL) {
-                                conn = ksocknal_find_conn_locked(peer_ni, tx, tx->tx_nonblk);
-                                if (conn != NULL) {
-                                        /* I've got no routes that need to be
-                                         * connecting and I do have an actual
-                                         * connection... */
-                                        ksocknal_queue_tx_locked (tx, conn);
+               peer_ni = ksocknal_find_peer_locked(ni, id);
+               if (peer_ni != NULL) {
+                       if (ksocknal_find_connectable_conn_cb_locked(peer_ni) == NULL) {
+                               conn = ksocknal_find_conn_locked(peer_ni, tx, tx->tx_nonblk);
+                               if (conn != NULL) {
+                                       /* I've got nothing that needs to be
+                                        * connecting and I do have an actual
+                                        * connection...
+                                        */
+                                       ksocknal_queue_tx_locked(tx, conn);
                                        read_unlock(g_lock);
-                                        return (0);
-                                }
-                        }
-                }
+                                       return 0;
+                               }
+                       }
+               }
 
-                /* I'll need a write lock... */
+               /* I'll need a write lock... */
                read_unlock(g_lock);
 
                write_lock_bh(g_lock);
 
-                peer_ni = ksocknal_find_peer_locked(ni, id);
-                if (peer_ni != NULL)
-                        break;
+               peer_ni = ksocknal_find_peer_locked(ni, id);
+               if (peer_ni != NULL)
+                       break;
 
                write_unlock_bh(g_lock);
 
-                if ((id.pid & LNET_PID_USERFLAG) != 0) {
-                        CERROR("Refusing to create a connection to "
-                               "userspace process %s\n", libcfs_id2str(id));
-                        return -EHOSTUNREACH;
-                }
+               if ((id->pid & LNET_PID_USERFLAG) != 0) {
+                       CERROR("Refusing to create a connection to userspace process %s\n",
+                              libcfs_idstr(id));
+                       return -EHOSTUNREACH;
+               }
 
-                if (retry) {
-                        CERROR("Can't find peer_ni %s\n", libcfs_id2str(id));
-                        return -EHOSTUNREACH;
-                }
+               if (retry) {
+                       CERROR("Can't find peer_ni %s\n", libcfs_idstr(id));
+                       return -EHOSTUNREACH;
+               }
 
-                rc = ksocknal_add_peer(ni, id,
-                                       LNET_NIDADDR(id.nid),
-                                       lnet_acceptor_port());
-                if (rc != 0) {
-                        CERROR("Can't add peer_ni %s: %d\n",
-                               libcfs_id2str(id), rc);
-                        return rc;
-                }
-        }
+               memset(&sa, 0, sizeof(sa));
+               sa.sin_family = AF_INET;
+               sa.sin_addr.s_addr = id->nid.nid_addr[0];
+               sa.sin_port = htons(lnet_acceptor_port());
+               {
+                       struct lnet_process_id id4 = {
+                               .pid = id->pid,
+                               .nid = lnet_nid_to_nid4(&id->nid),
+                       };
+                       rc = ksocknal_add_peer(ni, id4, (struct sockaddr *)&sa);
+               }
+               if (rc != 0) {
+                       CERROR("Can't add peer_ni %s: %d\n",
+                              libcfs_idstr(id), rc);
+                       return rc;
+               }
+       }
 
         ksocknal_launch_all_connections_locked(peer_ni);
 
@@ -954,8 +955,8 @@ ksocknal_launch_packet(struct lnet_ni *ni, struct ksock_tx *tx,
                 return (0);
         }
 
-        if (peer_ni->ksnp_accepting > 0 ||
-            ksocknal_find_connecting_route_locked (peer_ni) != NULL) {
+       if (peer_ni->ksnp_accepting > 0 ||
+           ksocknal_find_connecting_conn_cb_locked(peer_ni) != NULL) {
                 /* the message is going to be pinned to the peer_ni */
                tx->tx_deadline = ktime_get_seconds() +
                                  ksocknal_timeout();
@@ -964,12 +965,12 @@ ksocknal_launch_packet(struct lnet_ni *ni, struct ksock_tx *tx,
                list_add_tail(&tx->tx_list, &peer_ni->ksnp_tx_queue);
                write_unlock_bh(g_lock);
                 return 0;
-        }
+       }
 
        write_unlock_bh(g_lock);
 
         /* NB Routes may be ignored if connections to them failed recently */
-        CNETERR("No usable routes to %s\n", libcfs_id2str(id));
+       CNETERR("No usable routes to %s\n", libcfs_idstr(id));
        tx->tx_hstatus = LNET_MSG_STATUS_REMOTE_ERROR;
         return (-EHOSTUNREACH);
 }
@@ -980,7 +981,7 @@ ksocknal_send(struct lnet_ni *ni, void *private, struct lnet_msg *lntmsg)
        /* '1' for consistency with code that checks !mpflag to restore */
        unsigned int mpflag = 1;
        int type = lntmsg->msg_type;
-       struct lnet_process_id target = lntmsg->msg_target;
+       struct lnet_processid *target = &lntmsg->msg_target;
        unsigned int payload_niov = lntmsg->msg_niov;
        struct bio_vec *payload_kiov = lntmsg->msg_kiov;
        unsigned int payload_offset = lntmsg->msg_offset;
@@ -989,11 +990,12 @@ ksocknal_send(struct lnet_ni *ni, void *private, struct lnet_msg *lntmsg)
        int desc_size;
        int rc;
 
-        /* NB 'private' is different depending on what we're sending.
-         * Just ignore it... */
+       /* NB 'private' is different depending on what we're sending.
+        * Just ignore it...
+        */
 
-        CDEBUG(D_NET, "sending %u bytes in %d frags to %s\n",
-               payload_nob, payload_niov, libcfs_id2str(target));
+       CDEBUG(D_NET, "sending %u bytes in %d frags to %s\n",
+              payload_nob, payload_niov, libcfs_idstr(target));
 
        LASSERT (payload_nob == 0 || payload_niov > 0);
        LASSERT (payload_niov <= LNET_MAX_IOV);
@@ -1040,24 +1042,12 @@ ksocknal_send(struct lnet_ni *ni, void *private, struct lnet_msg *lntmsg)
        if (!mpflag)
                memalloc_noreclaim_restore(mpflag);
 
-        if (rc == 0)
-                return (0);
+       if (rc == 0)
+               return (0);
 
        lntmsg->msg_health_status = tx->tx_hstatus;
-        ksocknal_free_tx(tx);
-        return (-EIO);
-}
-
-int
-ksocknal_thread_start(int (*fn)(void *arg), void *arg, char *name)
-{
-       struct task_struct *task = kthread_run(fn, arg, "%s", name);
-
-       if (IS_ERR(task))
-               return PTR_ERR(task);
-
-       atomic_inc(&ksocknal_data.ksnd_nthreads);
-       return 0;
+       ksocknal_free_tx(tx);
+       return -EIO;
 }
 
 void
@@ -1089,14 +1079,15 @@ ksocknal_new_packet(struct ksock_conn *conn, int nob_to_skip)
                switch (conn->ksnc_proto->pro_version) {
                case  KSOCK_PROTO_V2:
                case  KSOCK_PROTO_V3:
-                        conn->ksnc_rx_state = SOCKNAL_RX_KSM_HEADER;
+                       conn->ksnc_rx_state = SOCKNAL_RX_KSM_HEADER;
                        conn->ksnc_rx_iov = (struct kvec *)&conn->ksnc_rx_iov_space;
-                        conn->ksnc_rx_iov[0].iov_base = (char *)&conn->ksnc_msg;
+                       conn->ksnc_rx_iov[0].iov_base = (char *)&conn->ksnc_msg;
 
-                       conn->ksnc_rx_nob_wanted = offsetof(struct ksock_msg, ksm_u);
-                       conn->ksnc_rx_nob_left = offsetof(struct ksock_msg, ksm_u);
-                       conn->ksnc_rx_iov[0].iov_len  = offsetof(struct ksock_msg, ksm_u);
-                        break;
+                       conn->ksnc_rx_nob_wanted = sizeof(struct ksock_msg_hdr);
+                       conn->ksnc_rx_nob_left = sizeof(struct ksock_msg_hdr);
+                       conn->ksnc_rx_iov[0].iov_len =
+                               sizeof(struct ksock_msg_hdr);
+                       break;
 
                case KSOCK_PROTO_V1:
                        /* Receiving bare struct lnet_hdr */
@@ -1154,7 +1145,7 @@ ksocknal_process_receive(struct ksock_conn *conn,
                         struct kvec *scratch_iov)
 {
        struct lnet_hdr *lhdr;
-       struct lnet_process_id *id;
+       struct lnet_processid *id;
        int rc;
 
        LASSERT(refcount_read(&conn->ksnc_conn_refcount) > 0);
@@ -1171,18 +1162,18 @@ ksocknal_process_receive(struct ksock_conn *conn,
                                      scratch_iov);
 
                if (rc <= 0) {
-                       struct lnet_process_id ksnp_id;
+                       struct lnet_processid *ksnp_id;
 
-                       ksnp_id = conn->ksnc_peer->ksnp_id;
+                       ksnp_id = &conn->ksnc_peer->ksnp_id;
 
                        LASSERT(rc != -EAGAIN);
                        if (rc == 0)
                                CDEBUG(D_NET, "[%p] EOF from %s ip %pISp\n",
-                                      conn, libcfs_id2str(ksnp_id),
+                                      conn, libcfs_idstr(ksnp_id),
                                       &conn->ksnc_peeraddr);
                        else if (!conn->ksnc_closing)
                                CERROR("[%p] Error %d on read from %s ip %pISp\n",
-                                      conn, rc, libcfs_id2str(ksnp_id),
+                                      conn, rc, libcfs_idstr(ksnp_id),
                                       &conn->ksnc_peeraddr);
 
                         /* it's not an error if conn is being closed */
@@ -1196,161 +1187,167 @@ ksocknal_process_receive(struct ksock_conn *conn,
                         return (-EAGAIN);
                 }
         }
-        switch (conn->ksnc_rx_state) {
-        case SOCKNAL_RX_KSM_HEADER:
-                if (conn->ksnc_flip) {
-                        __swab32s(&conn->ksnc_msg.ksm_type);
-                        __swab32s(&conn->ksnc_msg.ksm_csum);
-                        __swab64s(&conn->ksnc_msg.ksm_zc_cookies[0]);
-                        __swab64s(&conn->ksnc_msg.ksm_zc_cookies[1]);
-                }
-
-                if (conn->ksnc_msg.ksm_type != KSOCK_MSG_NOOP &&
-                    conn->ksnc_msg.ksm_type != KSOCK_MSG_LNET) {
-                        CERROR("%s: Unknown message type: %x\n",
-                               libcfs_id2str(conn->ksnc_peer->ksnp_id),
-                               conn->ksnc_msg.ksm_type);
-                        ksocknal_new_packet(conn, 0);
-                        ksocknal_close_conn_and_siblings(conn, -EPROTO);
-                        return (-EPROTO);
-                }
+       switch (conn->ksnc_rx_state) {
+       case SOCKNAL_RX_KSM_HEADER:
+               if (conn->ksnc_flip) {
+                       __swab32s(&conn->ksnc_msg.ksm_type);
+                       __swab32s(&conn->ksnc_msg.ksm_csum);
+                       __swab64s(&conn->ksnc_msg.ksm_zc_cookies[0]);
+                       __swab64s(&conn->ksnc_msg.ksm_zc_cookies[1]);
+               }
 
-                if (conn->ksnc_msg.ksm_type == KSOCK_MSG_NOOP &&
-                    conn->ksnc_msg.ksm_csum != 0 &&     /* has checksum */
-                    conn->ksnc_msg.ksm_csum != conn->ksnc_rx_csum) {
-                        /* NOOP Checksum error */
-                        CERROR("%s: Checksum error, wire:0x%08X data:0x%08X\n",
-                               libcfs_id2str(conn->ksnc_peer->ksnp_id),
-                               conn->ksnc_msg.ksm_csum, conn->ksnc_rx_csum);
-                        ksocknal_new_packet(conn, 0);
-                        ksocknal_close_conn_and_siblings(conn, -EPROTO);
-                        return (-EIO);
-                }
+               if (conn->ksnc_msg.ksm_type == KSOCK_MSG_NOOP &&
+                   conn->ksnc_msg.ksm_csum != 0 &&     /* has checksum */
+                   conn->ksnc_msg.ksm_csum != conn->ksnc_rx_csum) {
+                       /* NOOP Checksum error */
+                       CERROR("%s: Checksum error, wire:0x%08X data:0x%08X\n",
+                              libcfs_idstr(&conn->ksnc_peer->ksnp_id),
+                              conn->ksnc_msg.ksm_csum, conn->ksnc_rx_csum);
+                       ksocknal_new_packet(conn, 0);
+                       ksocknal_close_conn_and_siblings(conn, -EPROTO);
+                       return (-EIO);
+               }
 
-                if (conn->ksnc_msg.ksm_zc_cookies[1] != 0) {
-                        __u64 cookie = 0;
+               if (conn->ksnc_msg.ksm_zc_cookies[1] != 0) {
+                       __u64 cookie = 0;
 
-                        LASSERT (conn->ksnc_proto != &ksocknal_protocol_v1x);
+                       LASSERT(conn->ksnc_proto != &ksocknal_protocol_v1x);
 
-                        if (conn->ksnc_msg.ksm_type == KSOCK_MSG_NOOP)
-                                cookie = conn->ksnc_msg.ksm_zc_cookies[0];
+                       if (conn->ksnc_msg.ksm_type == KSOCK_MSG_NOOP)
+                               cookie = conn->ksnc_msg.ksm_zc_cookies[0];
 
-                        rc = conn->ksnc_proto->pro_handle_zcack(conn, cookie,
-                                               conn->ksnc_msg.ksm_zc_cookies[1]);
+                       rc = conn->ksnc_proto->pro_handle_zcack(
+                               conn, cookie, conn->ksnc_msg.ksm_zc_cookies[1]);
 
-                        if (rc != 0) {
+                       if (rc != 0) {
                                CERROR("%s: Unknown ZC-ACK cookie: %llu, %llu\n",
-                                       libcfs_id2str(conn->ksnc_peer->ksnp_id),
-                                       cookie, conn->ksnc_msg.ksm_zc_cookies[1]);
-                                ksocknal_new_packet(conn, 0);
-                                ksocknal_close_conn_and_siblings(conn, -EPROTO);
-                                return (rc);
-                        }
-                }
+                                      libcfs_idstr(&conn->ksnc_peer->ksnp_id),
+                                      cookie,
+                                      conn->ksnc_msg.ksm_zc_cookies[1]);
+                               ksocknal_new_packet(conn, 0);
+                               ksocknal_close_conn_and_siblings(conn, -EPROTO);
+                               return rc;
+                       }
+               }
 
-                if (conn->ksnc_msg.ksm_type == KSOCK_MSG_NOOP) {
-                        ksocknal_new_packet (conn, 0);
-                        return 0;       /* NOOP is done and just return */
-                }
+               switch (conn->ksnc_msg.ksm_type) {
+               case KSOCK_MSG_NOOP:
+                       ksocknal_new_packet(conn, 0);
+                       return 0;       /* NOOP is done and just return */
 
-                conn->ksnc_rx_state = SOCKNAL_RX_LNET_HEADER;
-               conn->ksnc_rx_nob_wanted = sizeof(struct ksock_lnet_msg);
-               conn->ksnc_rx_nob_left = sizeof(struct ksock_lnet_msg);
+               case KSOCK_MSG_LNET:
 
-               conn->ksnc_rx_iov = (struct kvec *)&conn->ksnc_rx_iov_space;
-                conn->ksnc_rx_iov[0].iov_base = (char *)&conn->ksnc_msg.ksm_u.lnetmsg;
-               conn->ksnc_rx_iov[0].iov_len  = sizeof(struct ksock_lnet_msg);
+                       conn->ksnc_rx_state = SOCKNAL_RX_LNET_HEADER;
+                       conn->ksnc_rx_nob_wanted = sizeof(struct lnet_hdr);
+                       conn->ksnc_rx_nob_left = sizeof(struct lnet_hdr);
 
-                conn->ksnc_rx_niov = 1;
-                conn->ksnc_rx_kiov = NULL;
-                conn->ksnc_rx_nkiov = 0;
+                       conn->ksnc_rx_iov = conn->ksnc_rx_iov_space.iov;
+                       conn->ksnc_rx_iov[0].iov_base =
+                               (void *)&conn->ksnc_msg.ksm_u.lnetmsg;
+                       conn->ksnc_rx_iov[0].iov_len = sizeof(struct lnet_hdr);
 
-                goto again;     /* read lnet header now */
+                       conn->ksnc_rx_niov = 1;
+                       conn->ksnc_rx_kiov = NULL;
+                       conn->ksnc_rx_nkiov = 0;
 
-        case SOCKNAL_RX_LNET_HEADER:
-                /* unpack message header */
-                conn->ksnc_proto->pro_unpack(&conn->ksnc_msg);
+                       goto again;     /* read lnet header now */
 
-                if ((conn->ksnc_peer->ksnp_id.pid & LNET_PID_USERFLAG) != 0) {
-                        /* Userspace peer_ni */
-                        lhdr = &conn->ksnc_msg.ksm_u.lnetmsg.ksnm_hdr;
-                        id   = &conn->ksnc_peer->ksnp_id;
+               default:
+                       CERROR("%s: Unknown message type: %x\n",
+                              libcfs_idstr(&conn->ksnc_peer->ksnp_id),
+                              conn->ksnc_msg.ksm_type);
+                       ksocknal_new_packet(conn, 0);
+                       ksocknal_close_conn_and_siblings(conn, -EPROTO);
+                       return -EPROTO;
+               }
 
-                        /* Substitute process ID assigned at connection time */
-                        lhdr->src_pid = cpu_to_le32(id->pid);
-                        lhdr->src_nid = cpu_to_le64(id->nid);
-                }
+       case SOCKNAL_RX_LNET_HEADER:
+               /* unpack message header */
+               conn->ksnc_proto->pro_unpack(&conn->ksnc_msg);
 
-                conn->ksnc_rx_state = SOCKNAL_RX_PARSE;
-                ksocknal_conn_addref(conn);     /* ++ref while parsing */
-
-                rc = lnet_parse(conn->ksnc_peer->ksnp_ni,
-                                &conn->ksnc_msg.ksm_u.lnetmsg.ksnm_hdr,
-                                conn->ksnc_peer->ksnp_id.nid, conn, 0);
-                if (rc < 0) {
-                        /* I just received garbage: give up on this conn */
-                        ksocknal_new_packet(conn, 0);
-                        ksocknal_close_conn_and_siblings (conn, rc);
-                        ksocknal_conn_decref(conn);
-                        return (-EPROTO);
-                }
+               if ((conn->ksnc_peer->ksnp_id.pid & LNET_PID_USERFLAG) != 0) {
+                       /* Userspace peer_ni */
+                       lhdr = &conn->ksnc_msg.ksm_u.lnetmsg;
+                       id = &conn->ksnc_peer->ksnp_id;
 
-                /* I'm racing with ksocknal_recv() */
-                LASSERT (conn->ksnc_rx_state == SOCKNAL_RX_PARSE ||
-                         conn->ksnc_rx_state == SOCKNAL_RX_LNET_PAYLOAD);
+                       /* Substitute process ID assigned at connection time */
+                       lhdr->src_pid = cpu_to_le32(id->pid);
+                       lhdr->src_nid = cpu_to_le64(lnet_nid_to_nid4(&id->nid));
+               }
 
-                if (conn->ksnc_rx_state != SOCKNAL_RX_LNET_PAYLOAD)
-                        return 0;
+               conn->ksnc_rx_state = SOCKNAL_RX_PARSE;
+               ksocknal_conn_addref(conn);     /* ++ref while parsing */
 
-                /* ksocknal_recv() got called */
-                goto again;
+               rc = lnet_parse(conn->ksnc_peer->ksnp_ni,
+                               &conn->ksnc_msg.ksm_u.lnetmsg,
+                               lnet_nid_to_nid4(&conn->ksnc_peer->ksnp_id.nid),
+                               conn, 0);
+               if (rc < 0) {
+                       /* I just received garbage: give up on this conn */
+                       ksocknal_new_packet(conn, 0);
+                       ksocknal_close_conn_and_siblings(conn, rc);
+                       ksocknal_conn_decref(conn);
+                       return (-EPROTO);
+               }
 
-        case SOCKNAL_RX_LNET_PAYLOAD:
-                /* payload all received */
-                rc = 0;
-
-                if (conn->ksnc_rx_nob_left == 0 &&   /* not truncating */
-                    conn->ksnc_msg.ksm_csum != 0 &&  /* has checksum */
-                    conn->ksnc_msg.ksm_csum != conn->ksnc_rx_csum) {
-                        CERROR("%s: Checksum error, wire:0x%08X data:0x%08X\n",
-                               libcfs_id2str(conn->ksnc_peer->ksnp_id),
-                               conn->ksnc_msg.ksm_csum, conn->ksnc_rx_csum);
-                        rc = -EIO;
-                }
+               /* I'm racing with ksocknal_recv() */
+               LASSERT(conn->ksnc_rx_state == SOCKNAL_RX_PARSE ||
+                       conn->ksnc_rx_state == SOCKNAL_RX_LNET_PAYLOAD);
 
-                if (rc == 0 && conn->ksnc_msg.ksm_zc_cookies[0] != 0) {
-                        LASSERT(conn->ksnc_proto != &ksocknal_protocol_v1x);
+               if (conn->ksnc_rx_state != SOCKNAL_RX_LNET_PAYLOAD)
+                       return 0;
 
-                        lhdr = &conn->ksnc_msg.ksm_u.lnetmsg.ksnm_hdr;
-                        id   = &conn->ksnc_peer->ksnp_id;
+               /* ksocknal_recv() got called */
+               goto again;
 
-                        rc = conn->ksnc_proto->pro_handle_zcreq(conn,
-                                        conn->ksnc_msg.ksm_zc_cookies[0],
-                                        *ksocknal_tunables.ksnd_nonblk_zcack ||
-                                        le64_to_cpu(lhdr->src_nid) != id->nid);
-                }
+       case SOCKNAL_RX_LNET_PAYLOAD:
+               /* payload all received */
+               rc = 0;
+
+               if (conn->ksnc_rx_nob_left == 0 &&   /* not truncating */
+                   conn->ksnc_msg.ksm_csum != 0 &&  /* has checksum */
+                   conn->ksnc_msg.ksm_csum != conn->ksnc_rx_csum) {
+                       CERROR("%s: Checksum error, wire:0x%08X data:0x%08X\n",
+                              libcfs_idstr(&conn->ksnc_peer->ksnp_id),
+                              conn->ksnc_msg.ksm_csum, conn->ksnc_rx_csum);
+                       rc = -EIO;
+               }
+
+               if (rc == 0 && conn->ksnc_msg.ksm_zc_cookies[0] != 0) {
+                       LASSERT(conn->ksnc_proto != &ksocknal_protocol_v1x);
+
+                       lhdr = &conn->ksnc_msg.ksm_u.lnetmsg;
+                       id = &conn->ksnc_peer->ksnp_id;
+
+                       rc = conn->ksnc_proto->pro_handle_zcreq(
+                               conn,
+                               conn->ksnc_msg.ksm_zc_cookies[0],
+                               *ksocknal_tunables.ksnd_nonblk_zcack ||
+                               le64_to_cpu(lhdr->src_nid) !=
+                               lnet_nid_to_nid4(&id->nid));
+               }
 
                if (rc && conn->ksnc_lnet_msg)
                        conn->ksnc_lnet_msg->msg_health_status =
                                LNET_MSG_STATUS_REMOTE_ERROR;
                lnet_finalize(conn->ksnc_lnet_msg, rc);
 
-                if (rc != 0) {
-                        ksocknal_new_packet(conn, 0);
-                        ksocknal_close_conn_and_siblings (conn, rc);
-                        return (-EPROTO);
-                }
-                /* Fall through */
+               if (rc != 0) {
+                       ksocknal_new_packet(conn, 0);
+                       ksocknal_close_conn_and_siblings(conn, rc);
+                       return (-EPROTO);
+               }
+               /* Fall through */
 
-        case SOCKNAL_RX_SLOP:
-                /* starting new packet? */
-                if (ksocknal_new_packet (conn, conn->ksnc_rx_nob_left))
-                        return 0;       /* come back later */
-                goto again;             /* try to finish reading slop now */
+       case SOCKNAL_RX_SLOP:
+               /* starting new packet? */
+               if (ksocknal_new_packet(conn, conn->ksnc_rx_nob_left))
+                       return 0;       /* come back later */
+               goto again;             /* try to finish reading slop now */
 
-        default:
-                break;
-        }
+       default:
+               break;
+       }
 
         /* Not Reached */
         LBUG ();
@@ -1464,13 +1461,13 @@ int ksocknal_scheduler(void *arg)
        spin_lock_bh(&sched->kss_lock);
 
        while (!ksocknal_data.ksnd_shuttingdown) {
-               int did_something = 0;
+               bool did_something = false;
 
                /* Ensure I progress everything semi-fairly */
-
-               if (!list_empty(&sched->kss_rx_conns)) {
-                       conn = list_entry(sched->kss_rx_conns.next,
-                                         struct ksock_conn, ksnc_rx_list);
+               conn = list_first_entry_or_null(&sched->kss_rx_conns,
+                                               struct ksock_conn,
+                                               ksnc_rx_list);
+               if (conn) {
                        list_del(&conn->ksnc_rx_list);
 
                        LASSERT(conn->ksnc_rx_scheduled);
@@ -1510,7 +1507,7 @@ int ksocknal_scheduler(void *arg)
                                ksocknal_conn_decref(conn);
                        }
 
-                       did_something = 1;
+                       did_something = true;
                }
 
                if (!list_empty(&sched->kss_tx_conns)) {
@@ -1518,16 +1515,17 @@ int ksocknal_scheduler(void *arg)
 
                        list_splice_init(&sched->kss_zombie_noop_txs, &zlist);
 
-                       conn = list_entry(sched->kss_tx_conns.next,
-                                         struct ksock_conn, ksnc_tx_list);
+                       conn = list_first_entry(&sched->kss_tx_conns,
+                                               struct ksock_conn,
+                                               ksnc_tx_list);
                        list_del(&conn->ksnc_tx_list);
 
                        LASSERT(conn->ksnc_tx_scheduled);
                        LASSERT(conn->ksnc_tx_ready);
                        LASSERT(!list_empty(&conn->ksnc_tx_queue));
 
-                       tx = list_entry(conn->ksnc_tx_queue.next,
-                                       struct ksock_tx, tx_list);
+                       tx = list_first_entry(&conn->ksnc_tx_queue,
+                                             struct ksock_tx, tx_list);
 
                        if (conn->ksnc_tx_carrier == tx)
                                ksocknal_next_tx_carrier(conn);
@@ -1578,7 +1576,7 @@ int ksocknal_scheduler(void *arg)
                                ksocknal_conn_decref(conn);
                        }
 
-                       did_something = 1;
+                       did_something = true;
                }
                if (!did_something ||   /* nothing to do */
                    need_resched()) {   /* hogging CPU? */
@@ -1719,7 +1717,7 @@ ksocknal_send_hello(struct lnet_ni *ni, struct ksock_conn *conn,
        /* rely on caller to hold a ref on socket so it wouldn't disappear */
        LASSERT(conn->ksnc_proto != NULL);
 
-       hello->kshm_src_nid         = ni->ni_nid;
+       hello->kshm_src_nid         = lnet_nid_to_nid4(&ni->ni_nid);
        hello->kshm_dst_nid         = peer_nid;
        hello->kshm_src_pid         = the_lnet.ln_pid;
 
@@ -1752,16 +1750,16 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
                    struct lnet_process_id *peerid,
                    __u64 *incarnation)
 {
-        /* Return < 0        fatal error
-         *        0          success
-         *        EALREADY   lost connection race
-         *        EPROTO     protocol version mismatch
-         */
+       /* Return < 0        fatal error
+        *        0          success
+        *        EALREADY   lost connection race
+        *        EPROTO     protocol version mismatch
+        */
        struct socket        *sock = conn->ksnc_sock;
-        int                  active = (conn->ksnc_proto != NULL);
-        int                  timeout;
-        int                  proto_match;
-        int                  rc;
+       int                  active = (conn->ksnc_proto != NULL);
+       int                  timeout;
+       int                  proto_match;
+       int                  rc;
        const struct ksock_proto *proto;
        struct lnet_process_id recv_id;
 
@@ -1769,7 +1767,7 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
        LASSERT(!active == !(conn->ksnc_type != SOCKLND_CONN_NONE));
 
        timeout = active ? ksocknal_timeout() :
-                           lnet_acceptor_timeout();
+               lnet_acceptor_timeout();
 
        rc = lnet_sock_read(sock, &hello->kshm_magic,
                            sizeof(hello->kshm_magic), timeout);
@@ -1792,47 +1790,51 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
 
        rc = lnet_sock_read(sock, &hello->kshm_version,
                            sizeof(hello->kshm_version), timeout);
-        if (rc != 0) {
+       if (rc != 0) {
                CERROR("Error %d reading HELLO from %pIS\n",
                       rc, &conn->ksnc_peeraddr);
                LASSERT(rc < 0);
-                return rc;
-        }
+               return rc;
+       }
 
-        proto = ksocknal_parse_proto_version(hello);
-        if (proto == NULL) {
-                if (!active) {
-                        /* unknown protocol from peer_ni, tell peer_ni my protocol */
-                        conn->ksnc_proto = &ksocknal_protocol_v3x;
+       proto = ksocknal_parse_proto_version(hello);
+       if (proto == NULL) {
+               if (!active) {
+                       /* unknown protocol from peer_ni,
+                        * tell peer_ni my protocol.
+                        */
+                       conn->ksnc_proto = &ksocknal_protocol_v3x;
 #if SOCKNAL_VERSION_DEBUG
-                        if (*ksocknal_tunables.ksnd_protocol == 2)
-                                conn->ksnc_proto = &ksocknal_protocol_v2x;
-                        else if (*ksocknal_tunables.ksnd_protocol == 1)
-                                conn->ksnc_proto = &ksocknal_protocol_v1x;
+                       if (*ksocknal_tunables.ksnd_protocol == 2)
+                               conn->ksnc_proto = &ksocknal_protocol_v2x;
+                       else if (*ksocknal_tunables.ksnd_protocol == 1)
+                               conn->ksnc_proto = &ksocknal_protocol_v1x;
 #endif
-                        hello->kshm_nips = 0;
-                        ksocknal_send_hello(ni, conn, ni->ni_nid, hello);
-                }
+                       hello->kshm_nips = 0;
+                       ksocknal_send_hello(ni, conn,
+                                           lnet_nid_to_nid4(&ni->ni_nid),
+                                           hello);
+               }
 
                CERROR("Unknown protocol version (%d.x expected) from %pIS\n",
                       conn->ksnc_proto->pro_version, &conn->ksnc_peeraddr);
 
-                return -EPROTO;
-        }
+               return -EPROTO;
+       }
 
-        proto_match = (conn->ksnc_proto == proto);
-        conn->ksnc_proto = proto;
+       proto_match = (conn->ksnc_proto == proto);
+       conn->ksnc_proto = proto;
 
-        /* receive the rest of hello message anyway */
-        rc = conn->ksnc_proto->pro_recv_hello(conn, hello, timeout);
-        if (rc != 0) {
+       /* receive the rest of hello message anyway */
+       rc = conn->ksnc_proto->pro_recv_hello(conn, hello, timeout);
+       if (rc != 0) {
                CERROR("Error %d reading or checking hello from from %pIS\n",
                       rc, &conn->ksnc_peeraddr);
-                LASSERT (rc < 0);
-                return rc;
-        }
+               LASSERT(rc < 0);
+               return rc;
+       }
 
-        *incarnation = hello->kshm_src_incarnation;
+       *incarnation = hello->kshm_src_incarnation;
 
        if (hello->kshm_src_nid == LNET_NID_ANY) {
                CERROR("Expecting a HELLO hdr with a NID, but got LNET_NID_ANY from %pIS\n",
@@ -1849,7 +1851,7 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
                        LNET_PID_USERFLAG;
                LASSERT(conn->ksnc_peeraddr.ss_family == AF_INET);
                recv_id.nid = LNET_MKNID(
-                       LNET_NIDNET(ni->ni_nid),
+                       LNET_NID_NET(&ni->ni_nid),
                        ntohl(((struct sockaddr_in *)
                               &conn->ksnc_peeraddr)->sin_addr.s_addr));
        } else {
@@ -1857,8 +1859,8 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
                recv_id.pid = hello->kshm_src_pid;
        }
 
-        if (!active) {
-                *peerid = recv_id;
+       if (!active) {
+               *peerid = recv_id;
 
                /* peer_ni determines type */
                conn->ksnc_type = ksocknal_invert_type(hello->kshm_ctype);
@@ -1881,10 +1883,10 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
                return -EPROTO;
        }
 
-        if (hello->kshm_ctype == SOCKLND_CONN_NONE) {
-                /* Possible protocol mismatch or I lost the connection race */
-                return proto_match ? EALREADY : EPROTO;
-        }
+       if (hello->kshm_ctype == SOCKLND_CONN_NONE) {
+               /* Possible protocol mismatch or I lost the connection race */
+               return proto_match ? EALREADY : EPROTO;
+       }
 
        if (ksocknal_invert_type(hello->kshm_ctype) != conn->ksnc_type) {
                CERROR("Mismatched types: me %d, %s ip %pIS %d\n",
@@ -1896,35 +1898,36 @@ ksocknal_recv_hello(struct lnet_ni *ni, struct ksock_conn *conn,
        return 0;
 }
 
-static int
-ksocknal_connect(struct ksock_route *route)
+static bool
+ksocknal_connect(struct ksock_conn_cb *conn_cb)
 {
        LIST_HEAD(zombies);
-       struct ksock_peer_ni *peer_ni = route->ksnr_peer;
-        int               type;
-        int               wanted;
-       struct socket     *sock;
+       struct ksock_peer_ni *peer_ni = conn_cb->ksnr_peer;
+       int type;
+       int wanted;
+       struct socket *sock;
        time64_t deadline;
-        int               retry_later = 0;
-        int               rc = 0;
+       bool retry_later = false;
+       int rc = 0;
 
        deadline = ktime_get_seconds() + ksocknal_timeout();
 
        write_lock_bh(&ksocknal_data.ksnd_global_lock);
 
-        LASSERT (route->ksnr_scheduled);
-        LASSERT (!route->ksnr_connecting);
+       LASSERT(conn_cb->ksnr_scheduled);
+       LASSERT(!conn_cb->ksnr_connecting);
 
-        route->ksnr_connecting = 1;
+       conn_cb->ksnr_connecting = 1;
 
        for (;;) {
-               wanted = ksocknal_route_mask() & ~route->ksnr_connected;
+               wanted = ksocknal_conn_cb_mask() & ~conn_cb->ksnr_connected;
 
-               /* stop connecting if peer_ni/route got closed under me, or
-                * route got connected while queued */
-               if (peer_ni->ksnp_closing || route->ksnr_deleted ||
+               /* stop connecting if peer_ni/cb got closed under me, or
+                * conn cb got connected while queued
+                */
+               if (peer_ni->ksnp_closing || conn_cb->ksnr_deleted ||
                    wanted == 0) {
-                       retry_later = 0;
+                       retry_later = false;
                        break;
                }
 
@@ -1932,8 +1935,9 @@ ksocknal_connect(struct ksock_route *route)
                if (peer_ni->ksnp_accepting > 0) {
                        CDEBUG(D_NET,
                               "peer_ni %s(%d) already connecting to me, retry later.\n",
-                              libcfs_nid2str(peer_ni->ksnp_id.nid), peer_ni->ksnp_accepting);
-                       retry_later = 1;
+                              libcfs_nidstr(&peer_ni->ksnp_id.nid),
+                              peer_ni->ksnp_accepting);
+                       retry_later = true;
                }
 
                if (retry_later) /* needs reschedule */
@@ -1943,7 +1947,8 @@ ksocknal_connect(struct ksock_route *route)
                        type = SOCKLND_CONN_ANY;
                } else if ((wanted & BIT(SOCKLND_CONN_CONTROL)) != 0) {
                        type = SOCKLND_CONN_CONTROL;
-               } else if ((wanted & BIT(SOCKLND_CONN_BULK_IN)) != 0) {
+               } else if ((wanted & BIT(SOCKLND_CONN_BULK_IN)) != 0 &&
+                          conn_cb->ksnr_blki_conn_count <= conn_cb->ksnr_blko_conn_count) {
                        type = SOCKLND_CONN_BULK_IN;
                } else {
                        LASSERT ((wanted & BIT(SOCKLND_CONN_BULK_OUT)) != 0);
@@ -1954,98 +1959,105 @@ ksocknal_connect(struct ksock_route *route)
 
                if (ktime_get_seconds() >= deadline) {
                        rc = -ETIMEDOUT;
-                       lnet_connect_console_error(rc, peer_ni->ksnp_id.nid,
-                                                  (struct sockaddr *)
-                                                  &route->ksnr_addr);
+                       lnet_connect_console_error(
+                               rc, &peer_ni->ksnp_id.nid,
+                               (struct sockaddr *)&conn_cb->ksnr_addr);
                        goto failed;
                }
 
-               sock = lnet_connect(peer_ni->ksnp_id.nid,
-                                   route->ksnr_myiface,
-                                   (struct sockaddr *)&route->ksnr_addr,
+               sock = lnet_connect(&peer_ni->ksnp_id.nid,
+                                   conn_cb->ksnr_myiface,
+                                   (struct sockaddr *)&conn_cb->ksnr_addr,
                                    peer_ni->ksnp_ni->ni_net_ns);
                if (IS_ERR(sock)) {
                        rc = PTR_ERR(sock);
                        goto failed;
                }
 
-               rc = ksocknal_create_conn(peer_ni->ksnp_ni, route, sock, type);
+               rc = ksocknal_create_conn(peer_ni->ksnp_ni, conn_cb, sock,
+                                         type);
                if (rc < 0) {
-                       lnet_connect_console_error(rc, peer_ni->ksnp_id.nid,
-                                                  (struct sockaddr *)
-                                                  &route->ksnr_addr);
+                       lnet_connect_console_error(
+                               rc, &peer_ni->ksnp_id.nid,
+                               (struct sockaddr *)&conn_cb->ksnr_addr);
                        goto failed;
                }
 
                /* A +ve RC means I have to retry because I lost the connection
-                * race or I have to renegotiate protocol version */
+                * race or I have to renegotiate protocol version
+                */
                retry_later = (rc != 0);
                if (retry_later)
                        CDEBUG(D_NET, "peer_ni %s: conn race, retry later.\n",
-                              libcfs_nid2str(peer_ni->ksnp_id.nid));
+                              libcfs_nidstr(&peer_ni->ksnp_id.nid));
 
                write_lock_bh(&ksocknal_data.ksnd_global_lock);
        }
 
-        route->ksnr_scheduled = 0;
-        route->ksnr_connecting = 0;
-
-        if (retry_later) {
-                /* re-queue for attention; this frees me up to handle
-                 * the peer_ni's incoming connection request */
-
-                if (rc == EALREADY ||
-                    (rc == 0 && peer_ni->ksnp_accepting > 0)) {
-                        /* We want to introduce a delay before next
-                         * attempt to connect if we lost conn race,
-                         * but the race is resolved quickly usually,
-                         * so min_reconnectms should be good heuristic */
-                       route->ksnr_retry_interval = *ksocknal_tunables.ksnd_min_reconnectms / 1000;
-                       route->ksnr_timeout = ktime_get_seconds() +
-                                             route->ksnr_retry_interval;
-                }
+       conn_cb->ksnr_scheduled = 0;
+       conn_cb->ksnr_connecting = 0;
 
-                ksocknal_launch_connection_locked(route);
-        }
+       if (retry_later) {
+               /* re-queue for attention; this frees me up to handle
+                * the peer_ni's incoming connection request
+                */
+
+               if (rc == EALREADY ||
+                   (rc == 0 && peer_ni->ksnp_accepting > 0)) {
+                       /* We want to introduce a delay before next
+                        * attempt to connect if we lost conn race, but
+                        * the race is resolved quickly usually, so
+                        * min_reconnectms should be good heuristic
+                        */
+                       conn_cb->ksnr_retry_interval =
+                               *ksocknal_tunables.ksnd_min_reconnectms / 1000;
+                       conn_cb->ksnr_timeout = ktime_get_seconds() +
+                                               conn_cb->ksnr_retry_interval;
+               }
+
+               ksocknal_launch_connection_locked(conn_cb);
+       }
 
        write_unlock_bh(&ksocknal_data.ksnd_global_lock);
-        return retry_later;
+       return retry_later;
 
  failed:
        write_lock_bh(&ksocknal_data.ksnd_global_lock);
 
-        route->ksnr_scheduled = 0;
-        route->ksnr_connecting = 0;
+       conn_cb->ksnr_scheduled = 0;
+       conn_cb->ksnr_connecting = 0;
 
        /* This is a retry rather than a new connection */
-       route->ksnr_retry_interval *= 2;
-       route->ksnr_retry_interval =
-               max_t(time64_t, route->ksnr_retry_interval,
+       conn_cb->ksnr_retry_interval *= 2;
+       conn_cb->ksnr_retry_interval =
+               max_t(time64_t, conn_cb->ksnr_retry_interval,
                      *ksocknal_tunables.ksnd_min_reconnectms / 1000);
-       route->ksnr_retry_interval =
-               min_t(time64_t, route->ksnr_retry_interval,
+       conn_cb->ksnr_retry_interval =
+               min_t(time64_t, conn_cb->ksnr_retry_interval,
                      *ksocknal_tunables.ksnd_max_reconnectms / 1000);
 
-       LASSERT(route->ksnr_retry_interval);
-       route->ksnr_timeout = ktime_get_seconds() + route->ksnr_retry_interval;
+       LASSERT(conn_cb->ksnr_retry_interval);
+       conn_cb->ksnr_timeout = ktime_get_seconds() +
+                               conn_cb->ksnr_retry_interval;
 
        if (!list_empty(&peer_ni->ksnp_tx_queue) &&
-            peer_ni->ksnp_accepting == 0 &&
-            ksocknal_find_connecting_route_locked(peer_ni) == NULL) {
+           peer_ni->ksnp_accepting == 0 &&
+           !ksocknal_find_connecting_conn_cb_locked(peer_ni)) {
                struct ksock_conn *conn;
 
-                /* ksnp_tx_queue is queued on a conn on successful
-                 * connection for V1.x and V2.x */
-               if (!list_empty(&peer_ni->ksnp_conns)) {
-                       conn = list_entry(peer_ni->ksnp_conns.next,
-                                         struct ksock_conn, ksnc_list);
-                        LASSERT (conn->ksnc_proto == &ksocknal_protocol_v3x);
-                }
+               /* ksnp_tx_queue is queued on a conn on successful
+                * connection for V1.x and V2.x
+                */
+               conn = list_first_entry_or_null(&peer_ni->ksnp_conns,
+                                               struct ksock_conn, ksnc_list);
+               if (conn)
+                       LASSERT(conn->ksnc_proto == &ksocknal_protocol_v3x);
 
-                /* take all the blocked packets while I've got the lock and
-                 * complete below... */
+               /* take all the blocked packets while I've got the lock and
+                * complete below...
+                */
                list_splice_init(&peer_ni->ksnp_tx_queue, &zombies);
-        }
+       }
 
        write_unlock_bh(&ksocknal_data.ksnd_global_lock);
 
@@ -2063,7 +2075,6 @@ ksocknal_connect(struct ksock_route *route)
 static int
 ksocknal_connd_check_start(time64_t sec, long *timeout)
 {
-       char name[16];
         int rc;
         int total = ksocknal_data.ksnd_connd_starting +
                     ksocknal_data.ksnd_connd_running;
@@ -2101,8 +2112,8 @@ ksocknal_connd_check_start(time64_t sec, long *timeout)
        spin_unlock_bh(&ksocknal_data.ksnd_connd_lock);
 
        /* NB: total is the next id */
-       snprintf(name, sizeof(name), "socknal_cd%02d", total);
-       rc = ksocknal_thread_start(ksocknal_connd, NULL, name);
+       rc = ksocknal_thread_start(ksocknal_connd, NULL,
+                                  "socknal_cd%02d", total);
 
        spin_lock_bh(&ksocknal_data.ksnd_connd_lock);
         if (rc == 0)
@@ -2157,25 +2168,28 @@ ksocknal_connd_check_stop(time64_t sec, long *timeout)
                ksocknal_data.ksnd_connd_connecting + SOCKNAL_CONND_RESV;
 }
 
-/* Go through connd_routes queue looking for a route that we can process
+/* Go through the connd_routes queue looking for a conn_cb that we can process
  * right now, @timeout_p can be updated if we need to come back later */
-static struct ksock_route *
-ksocknal_connd_get_route_locked(signed long *timeout_p)
+static struct ksock_conn_cb *
+ksocknal_connd_get_conn_cb_locked(signed long *timeout_p)
 {
        time64_t now = ktime_get_seconds();
-       struct ksock_route *route;
+       time64_t conn_timeout;
+       struct ksock_conn_cb *conn_cb;
 
        /* connd_routes can contain both pending and ordinary routes */
-       list_for_each_entry(route, &ksocknal_data.ksnd_connd_routes,
-                                ksnr_connd_list) {
+       list_for_each_entry(conn_cb, &ksocknal_data.ksnd_connd_routes,
+                           ksnr_connd_list) {
 
-               if (route->ksnr_retry_interval == 0 ||
-                   now >= route->ksnr_timeout)
-                       return route;
+               conn_timeout = conn_cb->ksnr_timeout;
+
+               if (conn_cb->ksnr_retry_interval == 0 ||
+                   now >= conn_timeout)
+                       return conn_cb;
 
                if (*timeout_p == MAX_SCHEDULE_TIMEOUT ||
-                   *timeout_p > cfs_time_seconds(route->ksnr_timeout - now))
-                       *timeout_p = cfs_time_seconds(route->ksnr_timeout - now);
+                   *timeout_p > cfs_time_seconds(conn_timeout - now))
+                       *timeout_p = cfs_time_seconds(conn_timeout - now);
        }
 
        return NULL;
@@ -2189,7 +2203,7 @@ ksocknal_connd(void *arg)
        wait_queue_entry_t wait;
        int cons_retry = 0;
 
-       init_waitqueue_entry(&wait, current);
+       init_wait(&wait);
 
        spin_lock_bh(connd_lock);
 
@@ -2198,10 +2212,10 @@ ksocknal_connd(void *arg)
        ksocknal_data.ksnd_connd_running++;
 
        while (!ksocknal_data.ksnd_shuttingdown) {
-               struct ksock_route *route = NULL;
+               struct ksock_conn_cb *conn_cb = NULL;
                time64_t sec = ktime_get_real_seconds();
                long timeout = MAX_SCHEDULE_TIMEOUT;
-               int  dropped_lock = 0;
+               bool dropped_lock = false;
 
                if (ksocknal_connd_check_stop(sec, &timeout)) {
                        /* wakeup another one to check stop */
@@ -2209,19 +2223,18 @@ ksocknal_connd(void *arg)
                        break;
                }
 
-                if (ksocknal_connd_check_start(sec, &timeout)) {
-                        /* created new thread */
-                        dropped_lock = 1;
-                }
-
-               if (!list_empty(&ksocknal_data.ksnd_connd_connreqs)) {
-                        /* Connection accepted by the listener */
-                       cr = list_entry(ksocknal_data.ksnd_connd_connreqs.next,
-                                       struct ksock_connreq, ksncr_list);
+               if (ksocknal_connd_check_start(sec, &timeout)) {
+                       /* created new thread */
+                       dropped_lock = true;
+               }
 
+               cr = list_first_entry_or_null(&ksocknal_data.ksnd_connd_connreqs,
+                                             struct ksock_connreq, ksncr_list);
+               if (cr) {
+                       /* Connection accepted by the listener */
                        list_del(&cr->ksncr_list);
                        spin_unlock_bh(connd_lock);
-                       dropped_lock = 1;
+                       dropped_lock = true;
 
                        ksocknal_create_conn(cr->ksncr_ni, NULL,
                                             cr->ksncr_sock, SOCKLND_CONN_NONE);
@@ -2229,33 +2242,34 @@ ksocknal_connd(void *arg)
                        LIBCFS_FREE(cr, sizeof(*cr));
 
                        spin_lock_bh(connd_lock);
-                }
+               }
 
-                /* Only handle an outgoing connection request if there
-                 * is a thread left to handle incoming connections and
-                 * create new connd */
-                if (ksocknal_data.ksnd_connd_connecting + SOCKNAL_CONND_RESV <
-                    ksocknal_data.ksnd_connd_running) {
-                        route = ksocknal_connd_get_route_locked(&timeout);
-                }
-                if (route != NULL) {
-                       list_del(&route->ksnr_connd_list);
-                        ksocknal_data.ksnd_connd_connecting++;
+               /* Only handle an outgoing connection request if there
+                * is a thread left to handle incoming connections and
+                * create new connd
+                */
+               if (ksocknal_data.ksnd_connd_connecting + SOCKNAL_CONND_RESV <
+                   ksocknal_data.ksnd_connd_running)
+                       conn_cb = ksocknal_connd_get_conn_cb_locked(&timeout);
+
+               if (conn_cb) {
+                       list_del(&conn_cb->ksnr_connd_list);
+                       ksocknal_data.ksnd_connd_connecting++;
                        spin_unlock_bh(connd_lock);
-                        dropped_lock = 1;
+                       dropped_lock = true;
 
-                       if (ksocknal_connect(route)) {
+                       if (ksocknal_connect(conn_cb)) {
                                /* consecutive retry */
                                if (cons_retry++ > SOCKNAL_INSANITY_RECONN) {
                                        CWARN("massive consecutive re-connecting to %pIS\n",
-                                             &route->ksnr_addr);
+                                             &conn_cb->ksnr_addr);
                                        cons_retry = 0;
                                }
                        } else {
                                cons_retry = 0;
                        }
 
-                        ksocknal_route_decref(route);
+                       ksocknal_conn_cb_decref(conn_cb);
 
                        spin_lock_bh(connd_lock);
                        ksocknal_data.ksnd_connd_connecting--;
@@ -2272,7 +2286,8 @@ ksocknal_connd(void *arg)
 
                /* Nothing to do for 'timeout'  */
                set_current_state(TASK_INTERRUPTIBLE);
-               add_wait_queue_exclusive(&ksocknal_data.ksnd_connd_waitq, &wait);
+               add_wait_queue_exclusive(&ksocknal_data.ksnd_connd_waitq,
+                                        &wait);
                spin_unlock_bh(connd_lock);
 
                schedule_timeout(timeout);
@@ -2292,16 +2307,15 @@ ksocknal_find_timed_out_conn(struct ksock_peer_ni *peer_ni)
 {
         /* We're called with a shared lock on ksnd_global_lock */
        struct ksock_conn *conn;
-       struct list_head *ctmp;
        struct ksock_tx *tx;
+       struct ksock_sched *sched;
 
-       list_for_each(ctmp, &peer_ni->ksnp_conns) {
+       list_for_each_entry(conn, &peer_ni->ksnp_conns, ksnc_list) {
                int error;
 
-               conn = list_entry(ctmp, struct ksock_conn, ksnc_list);
-
                 /* Don't need the {get,put}connsock dance to deref ksnc_sock */
                 LASSERT (!conn->ksnc_closing);
+               sched = conn->ksnc_scheduler;
 
                error = conn->ksnc_sock->sk->sk_err;
                 if (error != 0) {
@@ -2310,18 +2324,18 @@ ksocknal_find_timed_out_conn(struct ksock_peer_ni *peer_ni)
                        switch (error) {
                        case ECONNRESET:
                                CNETERR("A connection with %s (%pISp) was reset; it may have rebooted.\n",
-                                       libcfs_id2str(peer_ni->ksnp_id),
+                                       libcfs_idstr(&peer_ni->ksnp_id),
                                        &conn->ksnc_peeraddr);
                                break;
                        case ETIMEDOUT:
                                CNETERR("A connection with %s (%pISp) timed out; the network or node may be down.\n",
-                                       libcfs_id2str(peer_ni->ksnp_id),
+                                       libcfs_idstr(&peer_ni->ksnp_id),
                                        &conn->ksnc_peeraddr);
                                break;
                        default:
                                CNETERR("An unexpected network error %d occurred with %s (%pISp\n",
                                        error,
-                                       libcfs_id2str(peer_ni->ksnp_id),
+                                       libcfs_idstr(&peer_ni->ksnp_id),
                                        &conn->ksnc_peeraddr);
                                break;
                        }
@@ -2334,7 +2348,7 @@ ksocknal_find_timed_out_conn(struct ksock_peer_ni *peer_ni)
                        /* Timed out incomplete incoming message */
                        ksocknal_conn_addref(conn);
                        CNETERR("Timeout receiving from %s (%pISp), state %d wanted %d left %d\n",
-                               libcfs_id2str(peer_ni->ksnp_id),
+                               libcfs_idstr(&peer_ni->ksnp_id),
                                &conn->ksnc_peeraddr,
                                conn->ksnc_rx_state,
                                conn->ksnc_rx_nob_wanted,
@@ -2342,6 +2356,7 @@ ksocknal_find_timed_out_conn(struct ksock_peer_ni *peer_ni)
                        return conn;
                }
 
+               spin_lock_bh(&sched->kss_lock);
                if ((!list_empty(&conn->ksnc_tx_queue) ||
                     conn->ksnc_sock->sk->sk_wmem_queued != 0) &&
                    ktime_get_seconds() >= conn->ksnc_tx_deadline) {
@@ -2354,10 +2369,12 @@ ksocknal_find_timed_out_conn(struct ksock_peer_ni *peer_ni)
                                tx->tx_hstatus =
                                        LNET_MSG_STATUS_LOCAL_TIMEOUT;
                        CNETERR("Timeout sending data to %s (%pISp) the network or that node may be down.\n",
-                               libcfs_id2str(peer_ni->ksnp_id),
+                               libcfs_idstr(&peer_ni->ksnp_id),
                                &conn->ksnc_peeraddr);
+                               spin_unlock_bh(&sched->kss_lock);
                                return conn;
                }
+               spin_unlock_bh(&sched->kss_lock);
        }
 
        return (NULL);
@@ -2371,10 +2388,9 @@ ksocknal_flush_stale_txs(struct ksock_peer_ni *peer_ni)
 
        write_lock_bh(&ksocknal_data.ksnd_global_lock);
 
-       while (!list_empty(&peer_ni->ksnp_tx_queue)) {
-               tx = list_entry(peer_ni->ksnp_tx_queue.next,
-                               struct ksock_tx, tx_list);
-
+       while ((tx = list_first_entry_or_null(&peer_ni->ksnp_tx_queue,
+                                             struct ksock_tx,
+                                             tx_list)) != NULL) {
                if (ktime_get_seconds() < tx->tx_deadline)
                        break;
 
@@ -2438,7 +2454,8 @@ __must_hold(&ksocknal_data.ksnd_global_lock)
                return -ENOMEM;
        }
 
-       if (ksocknal_launch_packet(peer_ni->ksnp_ni, tx, peer_ni->ksnp_id) == 0) {
+       if (ksocknal_launch_packet(peer_ni->ksnp_ni, tx, &peer_ni->ksnp_id)
+           == 0) {
                read_lock(&ksocknal_data.ksnd_global_lock);
                return 1;
        }
@@ -2494,20 +2511,16 @@ ksocknal_check_peer_timeouts(int idx)
                /* we can't process stale txs right here because we're
                 * holding only shared lock
                 */
-               if (!list_empty(&peer_ni->ksnp_tx_queue)) {
-                       struct ksock_tx *tx;
-
-                       tx = list_entry(peer_ni->ksnp_tx_queue.next,
-                                       struct ksock_tx, tx_list);
-                       if (ktime_get_seconds() >= tx->tx_deadline) {
-                               ksocknal_peer_addref(peer_ni);
-                               read_unlock(&ksocknal_data.ksnd_global_lock);
+               tx = list_first_entry_or_null(&peer_ni->ksnp_tx_queue,
+                                             struct ksock_tx, tx_list);
+               if (tx && ktime_get_seconds() >= tx->tx_deadline) {
+                       ksocknal_peer_addref(peer_ni);
+                       read_unlock(&ksocknal_data.ksnd_global_lock);
 
-                               ksocknal_flush_stale_txs(peer_ni);
+                       ksocknal_flush_stale_txs(peer_ni);
 
-                               ksocknal_peer_decref(peer_ni);
-                               goto again;
-                       }
+                       ksocknal_peer_decref(peer_ni);
+                       goto again;
                }
 
                if (list_empty(&peer_ni->ksnp_zc_req_list))
@@ -2542,7 +2555,7 @@ ksocknal_check_peer_timeouts(int idx)
                CERROR("Total %d stale ZC_REQs for peer_ni %s detected; the "
                       "oldest(%p) timed out %lld secs ago, "
                       "resid: %d, wmem: %d\n",
-                      n, libcfs_nid2str(peer_ni->ksnp_id.nid), tx_stale,
+                      n, libcfs_nidstr(&peer_ni->ksnp_id.nid), tx_stale,
                       ktime_get_seconds() - deadline,
                       resid, conn->ksnc_sock->sk->sk_wmem_queued);
 
@@ -2566,14 +2579,14 @@ int ksocknal_reaper(void *arg)
        int peer_index = 0;
        time64_t deadline = ktime_get_seconds();
 
-       init_waitqueue_entry(&wait, current);
+       init_wait(&wait);
 
        spin_lock_bh(&ksocknal_data.ksnd_reaper_lock);
 
         while (!ksocknal_data.ksnd_shuttingdown) {
-               if (!list_empty(&ksocknal_data.ksnd_deathrow_conns)) {
-                       conn = list_entry(ksocknal_data.ksnd_deathrow_conns.next,
-                                         struct ksock_conn, ksnc_list);
+               conn = list_first_entry_or_null(&ksocknal_data.ksnd_deathrow_conns,
+                                               struct ksock_conn, ksnc_list);
+               if (conn) {
                        list_del(&conn->ksnc_list);
 
                        spin_unlock_bh(&ksocknal_data.ksnd_reaper_lock);
@@ -2585,9 +2598,9 @@ int ksocknal_reaper(void *arg)
                         continue;
                 }
 
-               if (!list_empty(&ksocknal_data.ksnd_zombie_conns)) {
-                       conn = list_entry(ksocknal_data.ksnd_zombie_conns.next,
-                                         struct ksock_conn, ksnc_list);
+               conn = list_first_entry_or_null(&ksocknal_data.ksnd_zombie_conns,
+                                               struct ksock_conn, ksnc_list);
+               if (conn) {
                        list_del(&conn->ksnc_list);
 
                        spin_unlock_bh(&ksocknal_data.ksnd_reaper_lock);
@@ -2605,9 +2618,9 @@ int ksocknal_reaper(void *arg)
 
                 /* reschedule all the connections that stalled with ENOMEM... */
                 nenomem_conns = 0;
-               while (!list_empty(&enomem_conns)) {
-                       conn = list_entry(enomem_conns.next,
-                                         struct ksock_conn, ksnc_tx_list);
+               while ((conn = list_first_entry_or_null(&enomem_conns,
+                                                       struct ksock_conn,
+                                                       ksnc_tx_list)) != NULL) {
                        list_del(&conn->ksnc_tx_list);
 
                         sched = conn->ksnc_scheduler;