Whamcloud - gitweb
LU-10391 socklnd: factor out key calculation for ksnd_peers
[fs/lustre-release.git] / lnet / klnds / socklnd / socklnd.c
index d9c428a..ad93203 100644 (file)
@@ -36,6 +36,7 @@
  * Author: Eric Barton <eric@bartonsoftware.com>
  */
 
+#include <linux/ethtool.h>
 #include <linux/inetdevice.h>
 #include "socklnd.h"
 #include <linux/sunrpc/addr.h>
@@ -134,6 +135,7 @@ ksocknal_create_conn_cb(struct sockaddr *addr)
        conn_cb->ksnr_ctrl_conn_count = 0;
        conn_cb->ksnr_blki_conn_count = 0;
        conn_cb->ksnr_blko_conn_count = 0;
+       conn_cb->ksnr_max_conns = 0;
 
        return conn_cb;
 }
@@ -219,9 +221,10 @@ struct ksock_peer_ni *
 ksocknal_find_peer_locked(struct lnet_ni *ni, struct lnet_process_id id)
 {
        struct ksock_peer_ni *peer_ni;
+       unsigned long hash = nidhash(id.nid);
 
        hash_for_each_possible(ksocknal_data.ksnd_peers, peer_ni,
-                              ksnp_list, id.nid) {
+                              ksnp_list, hash) {
                LASSERT(!peer_ni->ksnp_closing);
 
                if (peer_ni->ksnp_ni != ni)
@@ -393,6 +396,19 @@ ksocknal_get_conn_count_by_type(struct ksock_conn_cb *conn_cb,
        return count;
 }
 
+static unsigned int
+ksocknal_get_conns_per_peer(struct ksock_peer_ni *peer_ni)
+{
+       struct lnet_ni *ni = peer_ni->ksnp_ni;
+       struct lnet_ioctl_config_socklnd_tunables *tunables;
+
+       LASSERT(ni);
+
+       tunables = &ni->ni_lnd_tunables.lnd_tun_u.lnd_sock;
+
+       return tunables->lnd_conns_per_peer;
+}
+
 static void
 ksocknal_incr_conn_count(struct ksock_conn_cb *conn_cb,
                         int type)
@@ -408,29 +424,25 @@ ksocknal_incr_conn_count(struct ksock_conn_cb *conn_cb,
                break;
        case SOCKLND_CONN_BULK_IN:
                conn_cb->ksnr_blki_conn_count++;
-               if (conn_cb->ksnr_blki_conn_count >=
-                   *ksocknal_tunables.ksnd_conns_per_peer)
+               if (conn_cb->ksnr_blki_conn_count >= conn_cb->ksnr_max_conns)
                        conn_cb->ksnr_connected |= BIT(type);
                break;
        case SOCKLND_CONN_BULK_OUT:
                conn_cb->ksnr_blko_conn_count++;
-               if (conn_cb->ksnr_blko_conn_count >=
-                   *ksocknal_tunables.ksnd_conns_per_peer)
+               if (conn_cb->ksnr_blko_conn_count >= conn_cb->ksnr_max_conns)
                        conn_cb->ksnr_connected |= BIT(type);
                break;
        case SOCKLND_CONN_ANY:
-               if (conn_cb->ksnr_conn_count >=
-                   *ksocknal_tunables.ksnd_conns_per_peer)
+               if (conn_cb->ksnr_conn_count >= conn_cb->ksnr_max_conns)
                        conn_cb->ksnr_connected |= BIT(type);
                break;
        default:
                LBUG();
                break;
-
        }
 
-       CDEBUG(D_NET, "Add conn type %d, ksnr_connected %x conns_per_peer %d\n",
-              type, conn_cb->ksnr_connected, *ksocknal_tunables.ksnd_conns_per_peer);
+       CDEBUG(D_NET, "Add conn type %d, ksnr_connected %x ksnr_max_conns %d\n",
+              type, conn_cb->ksnr_connected, conn_cb->ksnr_max_conns);
 }
 
 static void
@@ -587,11 +599,19 @@ ksocknal_add_peer(struct lnet_ni *ni, struct lnet_process_id id,
                peer_ni = peer2;
        } else {
                /* peer_ni table takes my ref on peer_ni */
-               hash_add(ksocknal_data.ksnd_peers, &peer_ni->ksnp_list, id.nid);
+               hash_add(ksocknal_data.ksnd_peers, &peer_ni->ksnp_list,
+                        nidhash(id.nid));
        }
 
        ksocknal_add_conn_cb_locked(peer_ni, conn_cb);
 
+       /* Remember conns_per_peer setting at the time
+        * of connection initiation. It will define the
+        * max number of conns per type for this conn_cb
+        * while it's in use.
+        */
+       conn_cb->ksnr_max_conns = ksocknal_get_conns_per_peer(peer_ni);
+
        write_unlock_bh(&ksocknal_data.ksnd_global_lock);
 
        return 0;
@@ -634,7 +654,8 @@ ksocknal_del_peer(struct lnet_ni *ni, struct lnet_process_id id, __u32 ip)
        write_lock_bh(&ksocknal_data.ksnd_global_lock);
 
        if (id.nid != LNET_NID_ANY) {
-               lo = hash_min(id.nid, HASH_BITS(ksocknal_data.ksnd_peers));
+               lo = hash_min(nidhash(id.nid),
+                             HASH_BITS(ksocknal_data.ksnd_peers));
                hi = lo;
        } else {
                lo = 0;
@@ -906,7 +927,7 @@ ksocknal_create_conn(struct lnet_ni *ni, struct ksock_conn_cb *conn_cb,
                        /* NB this puts an "empty" peer_ni in the peer_ni
                         * table (which takes my ref) */
                        hash_add(ksocknal_data.ksnd_peers,
-                                &peer_ni->ksnp_list, peerid.nid);
+                                &peer_ni->ksnp_list, nidhash(peerid.nid));
                } else {
                        ksocknal_peer_decref(peer_ni);
                        peer_ni = peer2;
@@ -919,7 +940,7 @@ ksocknal_create_conn(struct lnet_ni *ni, struct ksock_conn_cb *conn_cb,
                /* Am I already connecting to this guy?  Resolve in
                 * favour of higher NID...
                 */
-               if (peerid.nid < ni->ni_nid &&
+               if (peerid.nid < lnet_nid_to_nid4(&ni->ni_nid) &&
                    ksocknal_connecting(peer_ni->ksnp_conn_cb,
                                        ((struct sockaddr *) &conn->ksnc_peeraddr))) {
                        rc = EALREADY;
@@ -988,7 +1009,13 @@ ksocknal_create_conn(struct lnet_ni *ni, struct ksock_conn_cb *conn_cb,
                                continue;
 
                        num_dup++;
-                       if (num_dup < *ksocknal_tunables.ksnd_conns_per_peer)
+                       /* If max conns per type is not registered in conn_cb
+                        * as ksnr_max_conns, use ni's conns_per_peer
+                        */
+                       if ((peer_ni->ksnp_conn_cb &&
+                           num_dup < peer_ni->ksnp_conn_cb->ksnr_max_conns) ||
+                           (!peer_ni->ksnp_conn_cb &&
+                           num_dup < ksocknal_get_conns_per_peer(peer_ni)))
                                continue;
 
                        /* Reply on a passive connection attempt so the peer_ni
@@ -1212,7 +1239,7 @@ ksocknal_close_conn_locked(struct ksock_conn *conn, int error)
                 * of the given type got created
                 */
                if (ksocknal_get_conn_count_by_type(conn_cb, conn->ksnc_type) ==
-                   *ksocknal_tunables.ksnd_conns_per_peer)
+                   conn_cb->ksnr_max_conns)
                        LASSERT((conn_cb->ksnr_connected &
                                BIT(conn->ksnc_type)) != 0);
 
@@ -1520,7 +1547,8 @@ ksocknal_close_matching_conns(struct lnet_process_id id, __u32 ipaddr)
        write_lock_bh(&ksocknal_data.ksnd_global_lock);
 
        if (id.nid != LNET_NID_ANY) {
-               lo = hash_min(id.nid, HASH_BITS(ksocknal_data.ksnd_peers));
+               lo = hash_min(nidhash(id.nid),
+                             HASH_BITS(ksocknal_data.ksnd_peers));
                hi = lo;
        } else {
                lo = 0;
@@ -1614,7 +1642,8 @@ ksocknal_push(struct lnet_ni *ni, struct lnet_process_id id)
        int rc = -ENOENT;
 
        if (id.nid != LNET_NID_ANY) {
-               lo = hash_min(id.nid, HASH_BITS(ksocknal_data.ksnd_peers));
+               lo = hash_min(nidhash(id.nid),
+                             HASH_BITS(ksocknal_data.ksnd_peers));
                hi = lo;
        } else {
                lo = 0;
@@ -1769,15 +1798,16 @@ ksocknal_ctl(struct lnet_ni *ni, unsigned int cmd, void *arg)
                 return ksocknal_close_matching_conns (id,
                                                       data->ioc_u32[0]);
 
-        case IOC_LIBCFS_REGISTER_MYNID:
-                /* Ignore if this is a noop */
-                if (data->ioc_nid == ni->ni_nid)
-                        return 0;
+       case IOC_LIBCFS_REGISTER_MYNID:
+               /* Ignore if this is a noop */
+               if (nid_is_nid4(&ni->ni_nid) &&
+                   data->ioc_nid == lnet_nid_to_nid4(&ni->ni_nid))
+                       return 0;
 
-                CERROR("obsolete IOC_LIBCFS_REGISTER_MYNID: %s(%s)\n",
-                       libcfs_nid2str(data->ioc_nid),
-                       libcfs_nid2str(ni->ni_nid));
-                return -EINVAL;
+               CERROR("obsolete IOC_LIBCFS_REGISTER_MYNID: %s(%s)\n",
+                      libcfs_nid2str(data->ioc_nid),
+                      libcfs_nidstr(&ni->ni_nid));
+               return -EINVAL;
 
         case IOC_LIBCFS_PUSH_CONNECTION:
                 id.nid = data->ioc_nid;
@@ -1817,6 +1847,78 @@ ksocknal_free_buffers (void)
        }
 }
 
+static int ksocknal_get_link_status(struct net_device *dev)
+{
+       int ret = -1;
+
+       LASSERT(dev);
+
+       if (!netif_running(dev))
+               ret = 0;
+       /* Some devices may not be providing link settings */
+       else if (dev->ethtool_ops->get_link)
+               ret = dev->ethtool_ops->get_link(dev);
+
+       return ret;
+}
+
+static int
+ksocknal_handle_link_state_change(struct net_device *dev,
+                                 unsigned char operstate)
+{
+       struct lnet_ni *ni;
+       struct ksock_net *net;
+       struct ksock_net *cnxt;
+       int ifindex;
+       unsigned char link_down = !(operstate == IF_OPER_UP);
+
+       ifindex = dev->ifindex;
+
+       if (!ksocknal_data.ksnd_nnets)
+               goto out;
+
+       list_for_each_entry_safe(net, cnxt, &ksocknal_data.ksnd_nets,
+                                ksnn_list) {
+               if (net->ksnn_interface.ksni_index != ifindex)
+                       continue;
+               ni = net->ksnn_ni;
+               if (link_down)
+                       atomic_set(&ni->ni_fatal_error_on, link_down);
+               else
+                       atomic_set(&ni->ni_fatal_error_on,
+                                  (ksocknal_get_link_status(dev) == 0));
+       }
+out:
+       return 0;
+}
+
+
+/************************************
+ * Net device notifier event handler
+ ************************************/
+static int ksocknal_device_event(struct notifier_block *unused,
+                                unsigned long event, void *ptr)
+{
+       struct net_device *dev = netdev_notifier_info_to_dev(ptr);
+       unsigned char operstate;
+
+       operstate = dev->operstate;
+
+       switch (event) {
+       case NETDEV_UP:
+       case NETDEV_DOWN:
+       case NETDEV_CHANGE:
+               ksocknal_handle_link_state_change(dev, operstate);
+               break;
+       }
+
+       return NOTIFY_OK;
+}
+
+static struct notifier_block ksocknal_notifier_block = {
+       .notifier_call = ksocknal_device_event,
+};
+
 static void
 ksocknal_base_shutdown(void)
 {
@@ -1828,6 +1930,9 @@ ksocknal_base_shutdown(void)
               libcfs_kmem_read());
        LASSERT (ksocknal_data.ksnd_nnets == 0);
 
+       if (ksocknal_data.ksnd_init == SOCKNAL_INIT_ALL)
+               unregister_netdevice_notifier(&ksocknal_notifier_block);
+
        switch (ksocknal_data.ksnd_init) {
        default:
                LASSERT(0);
@@ -1970,15 +2075,13 @@ ksocknal_base_startup(void)
         }
 
         for (i = 0; i < *ksocknal_tunables.ksnd_nconnds; i++) {
-               char name[16];
                spin_lock_bh(&ksocknal_data.ksnd_connd_lock);
                ksocknal_data.ksnd_connd_starting++;
                spin_unlock_bh(&ksocknal_data.ksnd_connd_lock);
 
-
-               snprintf(name, sizeof(name), "socknal_cd%02d", i);
                rc = ksocknal_thread_start(ksocknal_connd,
-                                          (void *)((uintptr_t)i), name);
+                                          (void *)((uintptr_t)i),
+                                          "socknal_cd%02d", i);
                if (rc != 0) {
                        spin_lock_bh(&ksocknal_data.ksnd_connd_lock);
                        ksocknal_data.ksnd_connd_starting--;
@@ -1994,6 +2097,8 @@ ksocknal_base_startup(void)
                 goto failed;
         }
 
+       register_netdevice_notifier(&ksocknal_notifier_block);
+
         /* flag everything initialised */
         ksocknal_data.ksnd_init = SOCKNAL_INIT_ALL;
 
@@ -2144,14 +2249,12 @@ ksocknal_start_schedulers(struct ksock_sched *sched)
 
        for (i = 0; i < nthrs; i++) {
                long id;
-               char name[20];
 
                id = KSOCK_THREAD_ID(sched->kss_cpt, sched->kss_nthreads + i);
-               snprintf(name, sizeof(name), "socknal_sd%02d_%02d",
-                        sched->kss_cpt, (int)KSOCK_THREAD_SID(id));
-
-               rc = ksocknal_thread_start(ksocknal_scheduler,
-                                          (void *)id, name);
+               rc = ksocknal_thread_start(ksocknal_scheduler, (void *)id,
+                                          "socknal_sd%02d_%02d",
+                                          sched->kss_cpt,
+                                          (int)KSOCK_THREAD_SID(id));
                if (rc == 0)
                        continue;
 
@@ -2195,7 +2298,6 @@ int
 ksocknal_startup(struct lnet_ni *ni)
 {
        struct ksock_net *net;
-       struct lnet_ioctl_config_lnd_cmn_tunables *net_tunables;
        struct ksock_interface *ksi = NULL;
        struct lnet_inetdev *ifaces = NULL;
        struct sockaddr_in *sa;
@@ -2213,27 +2315,8 @@ ksocknal_startup(struct lnet_ni *ni)
                goto fail_0;
        net->ksnn_incarnation = ktime_get_real_ns();
        ni->ni_data = net;
-       net_tunables = &ni->ni_net->net_tunables;
-       if (net_tunables->lct_peer_timeout == -1)
-               net_tunables->lct_peer_timeout =
-                       *ksocknal_tunables.ksnd_peertimeout;
-
-       if (net_tunables->lct_max_tx_credits == -1)
-               net_tunables->lct_max_tx_credits =
-                       *ksocknal_tunables.ksnd_credits;
 
-       if (net_tunables->lct_peer_tx_credits == -1)
-               net_tunables->lct_peer_tx_credits =
-                       *ksocknal_tunables.ksnd_peertxcredits;
-
-       if (net_tunables->lct_peer_tx_credits >
-           net_tunables->lct_max_tx_credits)
-               net_tunables->lct_peer_tx_credits =
-                       net_tunables->lct_max_tx_credits;
-
-       if (net_tunables->lct_peer_rtr_credits == -1)
-               net_tunables->lct_peer_rtr_credits =
-                       *ksocknal_tunables.ksnd_peerrtrcredits;
+       ksocknal_tunables_setup(ni);
 
        rc = lnet_inet_enumerate(&ifaces, ni->ni_net_ns);
        if (rc < 0)
@@ -2271,11 +2354,10 @@ ksocknal_startup(struct lnet_ni *ni)
 
        LASSERT(ksi);
        LASSERT(ksi->ksni_addr.ss_family == AF_INET);
-       ni->ni_nid = LNET_MKNID(
-               LNET_NIDNET(ni->ni_nid),
-               ntohl(((struct sockaddr_in *)
-                      &ksi->ksni_addr)->sin_addr.s_addr));
+       ni->ni_nid.nid_addr[0] =
+               ((struct sockaddr_in *)&ksi->ksni_addr)->sin_addr.s_addr;
        list_add(&net->ksnn_list, &ksocknal_data.ksnd_nets);
+       net->ksnn_ni = ni;
        ksocknal_data.ksnd_nnets++;
 
        return 0;
@@ -2289,7 +2371,6 @@ fail_0:
        return -ENETDOWN;
 }
 
-
 static void __exit ksocklnd_exit(void)
 {
        lnet_unregister_lnd(&the_ksocklnd);