2 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
4 * Copyright (c) 2011, 2013, Intel Corporation.
6 * This file is part of Portals
7 * http://sourceforge.net/projects/sandiaportals/
9 * Portals is free software; you can redistribute it and/or
10 * modify it under the terms of version 2 of the GNU General Public
11 * License as published by the Free Software Foundation.
13 * Portals is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License
19 * along with Portals; if not, write to the Free Software
20 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
24 #define DEBUG_SUBSYSTEM S_LNET
25 #include <libcfs/libcfs.h>
26 #include <lnet/lib-lnet.h>
28 /* This is really lnet_proc.c. You might need to update sanity test 215
29 * if any file format is changed. */
/* Handle of the registered sysctl table; NULL while nothing is registered. */
31 static struct ctl_table_header *lnet_table_header = NULL;
/*
 * Encoding of the proc read position (*ppos).
 *
 * LNET_PROC_POS_MAKE packs four fields into one loff_t, from the most
 * significant to the least significant bits:
 *   CPT index | table version | hash index | hash offset
 * The highest bit of the loff_t is left unused (see the NB below), which is
 * why LNET_PROC_HOFF_BITS subtracts one extra bit.
 * The LNET_PROC_*_GET macros extract the individual fields again.
 */
33 #define LNET_LOFFT_BITS (sizeof(loff_t) * 8)
35 * NB: max allowed LNET_CPT_BITS is 8 on 64-bit system and 2 on 32-bit system
37 #define LNET_PROC_CPT_BITS (LNET_CPT_BITS + 1)
38 /* change version, 16 bits or 8 bits */
39 #define LNET_PROC_VER_BITS MAX(((MIN(LNET_LOFFT_BITS, 64)) / 4), 8)
41 #define LNET_PROC_HASH_BITS LNET_PEER_HASH_BITS
43 * bits for peer hash offset
44 * NB: we don't use the highest bit of *ppos because it's signed
46 #define LNET_PROC_HOFF_BITS (LNET_LOFFT_BITS - \
47 LNET_PROC_CPT_BITS - \
48 LNET_PROC_VER_BITS - \
49 LNET_PROC_HASH_BITS - 1)
50 /* bits for hash index + position */
51 #define LNET_PROC_HPOS_BITS (LNET_PROC_HASH_BITS + LNET_PROC_HOFF_BITS)
52 /* bits for peer hash table + hash version */
53 #define LNET_PROC_VPOS_BITS (LNET_PROC_HPOS_BITS + LNET_PROC_VER_BITS)
/* Masks selecting the low N bits of each field, N being the field width. */
55 #define LNET_PROC_CPT_MASK ((1ULL << LNET_PROC_CPT_BITS) - 1)
56 #define LNET_PROC_VER_MASK ((1ULL << LNET_PROC_VER_BITS) - 1)
57 #define LNET_PROC_HASH_MASK ((1ULL << LNET_PROC_HASH_BITS) - 1)
58 #define LNET_PROC_HOFF_MASK ((1ULL << LNET_PROC_HOFF_BITS) - 1)
/* Field extractors: shift the field down to bit 0, mask it, return an int. */
60 #define LNET_PROC_CPT_GET(pos) \
61 (int)(((pos) >> LNET_PROC_VPOS_BITS) & LNET_PROC_CPT_MASK)
63 #define LNET_PROC_VER_GET(pos) \
64 (int)(((pos) >> LNET_PROC_HPOS_BITS) & LNET_PROC_VER_MASK)
66 #define LNET_PROC_HASH_GET(pos) \
67 (int)(((pos) >> LNET_PROC_HOFF_BITS) & LNET_PROC_HASH_MASK)
69 #define LNET_PROC_HOFF_GET(pos) \
70 (int)((pos) & LNET_PROC_HOFF_MASK)
/* Build a position from its four fields; each field is masked to its width. */
72 #define LNET_PROC_POS_MAKE(cpt, ver, hash, off) \
73 (((((loff_t)(cpt)) & LNET_PROC_CPT_MASK) << LNET_PROC_VPOS_BITS) | \
74 ((((loff_t)(ver)) & LNET_PROC_VER_MASK) << LNET_PROC_HPOS_BITS) | \
75 ((((loff_t)(hash)) & LNET_PROC_HASH_MASK) << LNET_PROC_HOFF_BITS) | \
76 ((off) & LNET_PROC_HOFF_MASK))
/* Truncate a version counter to the width that fits into a position. */
78 #define LNET_PROC_VERSION(v) ((unsigned int)((v) & LNET_PROC_VER_MASK))
/*
 * Format the LNet counters as one line of text for a proc read.
 *
 * Visible behaviour: allocates an lnet_counters_t and a 256-byte scratch
 * string, snapshots the counters with lnet_counters_get(), formats them as
 * space-separated numbers with snprintf() and passes the result, together
 * with the user buffer and nob, to cfs_trace_copyout_string().  Both
 * allocations are freed before the function ends.
 *
 * NOTE(review): lnet_counters_reset() is also called here; the condition
 * guarding it (presumably the write path) and the return statements are not
 * visible in this excerpt.
 */
80 static int __proc_lnet_stats(void *data, int write,
81 loff_t pos, void __user *buffer, int nob)
84 lnet_counters_t *ctrs;
87 const int tmpsiz = 256; /* 7 %u and 4 LPU64 */
90 lnet_counters_reset();
96 LIBCFS_ALLOC(ctrs, sizeof(*ctrs));
100 LIBCFS_ALLOC(tmpstr, tmpsiz);
101 if (tmpstr == NULL) {
/* do not leak the counters buffer when the scratch string is unavailable */
102 LIBCFS_FREE(ctrs, sizeof(*ctrs));
106 lnet_counters_get(ctrs);
108 len = snprintf(tmpstr, tmpsiz,
109 "%u %u %u %u %u %u %u "LPU64" "LPU64" "
111 ctrs->msgs_alloc, ctrs->msgs_max,
113 ctrs->send_count, ctrs->recv_count,
114 ctrs->route_count, ctrs->drop_count,
115 ctrs->send_length, ctrs->recv_length,
116 ctrs->route_length, ctrs->drop_length);
/* compare pos against the smaller of the snprintf result and the stored length */
118 if (pos >= min_t(int, len, strlen(tmpstr)))
121 rc = cfs_trace_copyout_string(buffer, nob,
124 LIBCFS_FREE(tmpstr, tmpsiz);
125 LIBCFS_FREE(ctrs, sizeof(*ctrs));
/*
 * sysctl proc_handler wrapper: forwards table->data, the write flag, the
 * position, the user buffer and its length to lprocfs_call_handler().
 * NOTE(review): the final argument of the call is cut off in this excerpt;
 * presumably it is __proc_lnet_stats - confirm against the full file.
 */
130 proc_lnet_stats(struct ctl_table *table, int write, void __user *buffer,
131 size_t *lenp, loff_t *ppos)
133 return lprocfs_call_handler(table->data, write, ppos, buffer, lenp,
/*
 * sysctl proc_handler that lists LNet routes.
 *
 * The read position *ppos carries a hash offset and a table version (see
 * LNET_PROC_HOFF_GET and LNET_PROC_VER_GET).  Text is built in a 256-byte
 * scratch buffer and copied to user space with copy_to_user().
 *
 * Visible output:
 *  - a Routing enabled/disabled line followed by a column header
 *    (net, hops, priority, state, router), after which the current
 *    ln_remote_nets_version is stored into *ppos;
 *  - or one line describing a route found by walking the lists in
 *    the_lnet.ln_remote_nets_hash.
 * If the version kept in *ppos no longer matches ln_remote_nets_version the
 * scratch buffer is freed.
 *
 * NOTE(review): the conditions selecting between these paths, the locking,
 * the skip logic inside the list walk and all return statements are missing
 * from this excerpt.
 */
138 proc_lnet_routes(struct ctl_table *table, int write, void __user *buffer,
139 size_t *lenp, loff_t *ppos)
141 const int tmpsiz = 256;
149 CLASSERT(sizeof(loff_t) >= 4);
151 off = LNET_PROC_HOFF_GET(*ppos);
152 ver = LNET_PROC_VER_GET(*ppos);
159 LIBCFS_ALLOC(tmpstr, tmpsiz);
163 s = tmpstr; /* points to current position in tmpstr[] */
166 s += snprintf(s, tmpstr + tmpsiz - s, "Routing %s\n",
167 the_lnet.ln_routing ? "enabled" : "disabled");
168 LASSERT (tmpstr + tmpsiz - s > 0);
170 s += snprintf(s, tmpstr + tmpsiz - s, "%-8s %4s %8s %7s %s\n",
171 "net", "hops", "priority", "state", "router");
172 LASSERT (tmpstr + tmpsiz - s > 0);
/* record the current table version in *ppos so later reads can compare it */
175 ver = (unsigned int)the_lnet.ln_remote_nets_version;
177 *ppos = LNET_PROC_POS_MAKE(0, ver, 0, off);
181 lnet_route_t *route = NULL;
182 lnet_remotenet_t *rnet = NULL;
184 struct list_head *rn_list;
/* version recorded in *ppos differs from the live one: drop the scratch buffer */
189 if (ver != LNET_PROC_VERSION(the_lnet.ln_remote_nets_version)) {
191 LIBCFS_FREE(tmpstr, tmpsiz);
/* scan the hash buckets until a route has been selected */
195 for (i = 0; i < LNET_REMOTE_NETS_HASH_SIZE && route == NULL;
197 rn_list = &the_lnet.ln_remote_nets_hash[i];
201 while (n != rn_list && route == NULL) {
202 rnet = list_entry(n, lnet_remotenet_t,
205 r = rnet->lrn_routes.next;
207 while (r != &rnet->lrn_routes) {
209 list_entry(r, lnet_route_t,
/* copy the fields to print into locals before formatting */
225 __u32 net = rnet->lrn_net;
226 unsigned int hops = route->lr_hops;
227 unsigned int priority = route->lr_priority;
228 lnet_nid_t nid = route->lr_gateway->lp_nid;
229 int alive = lnet_is_route_alive(route);
231 s += snprintf(s, tmpstr + tmpsiz - s,
232 "%-8s %4u %8u %7s %s\n",
233 libcfs_net2str(net), hops,
235 alive ? "up" : "down",
236 libcfs_nid2str(nid));
237 LASSERT(tmpstr + tmpsiz - s > 0);
243 len = s - tmpstr; /* how many bytes were written */
245 if (len > *lenp) { /* linux-supplied buffer is too small */
247 } else if (len > 0) { /* wrote something */
248 if (copy_to_user(buffer, tmpstr, len))
252 *ppos = LNET_PROC_POS_MAKE(0, ver, 0, off);
256 LIBCFS_FREE(tmpstr, tmpsiz);
/*
 * sysctl proc_handler that lists LNet routers (gateway peers).
 *
 * Uses the same position scheme as the routes handler: *ppos carries an
 * offset and a version, here compared against the_lnet.ln_routers_version.
 * Text is built in a 256-byte scratch buffer and copied out with
 * copy_to_user().
 *
 * Visible output:
 *  - a column header (ref, rtr_ref, alive_cnt, state, last_ping, ping_sent,
 *    deadline, down_ni, router);
 *  - or one line for a peer taken from the list the_lnet.ln_routers.  Two
 *    format variants exist: one prints NA in the deadline column, the other
 *    prints the seconds between now and lp_ping_deadline.
 *
 * NOTE(review): the conditions choosing between these paths and variants,
 * the locking and the return statements are not visible in this excerpt.
 */
265 proc_lnet_routers(struct ctl_table *table, int write, void __user *buffer,
266 size_t *lenp, loff_t *ppos)
271 const int tmpsiz = 256;
276 off = LNET_PROC_HOFF_GET(*ppos);
277 ver = LNET_PROC_VER_GET(*ppos);
284 LIBCFS_ALLOC(tmpstr, tmpsiz);
288 s = tmpstr; /* points to current position in tmpstr[] */
291 s += snprintf(s, tmpstr + tmpsiz - s,
292 "%-4s %7s %9s %6s %12s %9s %8s %7s %s\n",
293 "ref", "rtr_ref", "alive_cnt", "state",
294 "last_ping", "ping_sent", "deadline",
295 "down_ni", "router");
296 LASSERT(tmpstr + tmpsiz - s > 0);
/* record the current router-list version in *ppos for later comparison */
299 ver = (unsigned int)the_lnet.ln_routers_version;
301 *ppos = LNET_PROC_POS_MAKE(0, ver, 0, off);
304 struct lnet_peer *peer = NULL;
/* version recorded in *ppos differs from the live one: drop the scratch buffer */
309 if (ver != LNET_PROC_VERSION(the_lnet.ln_routers_version)) {
312 LIBCFS_FREE(tmpstr, tmpsiz);
316 r = the_lnet.ln_routers.next;
318 while (r != &the_lnet.ln_routers) {
319 lnet_peer_t *lp = list_entry(r, lnet_peer_t,
/* copy the fields to print into locals before formatting */
332 lnet_nid_t nid = peer->lp_nid;
333 cfs_time_t now = cfs_time_current();
334 cfs_time_t deadline = peer->lp_ping_deadline;
335 int nrefs = peer->lp_refcount;
336 int nrtrrefs = peer->lp_rtr_refcount;
337 int alive_cnt = peer->lp_alive_count;
338 int alive = peer->lp_alive;
339 int pingsent = !peer->lp_ping_notsent;
340 int last_ping = cfs_duration_sec(cfs_time_sub(now,
341 peer->lp_ping_timestamp));
/* down_ni is only looked up when the peer advertises the NI status feature */
345 if ((peer->lp_ping_feats &
346 LNET_PING_FEAT_NI_STATUS) != 0) {
347 list_for_each_entry(rtr, &peer->lp_routes,
349 /* downis on any route should be the
350 * number of downis on the gateway */
351 if (rtr->lr_downis != 0) {
352 down_ni = rtr->lr_downis;
359 s += snprintf(s, tmpstr + tmpsiz - s,
360 "%-4d %7d %9d %6s %12d %9d %8s %7d %s\n",
361 nrefs, nrtrrefs, alive_cnt,
362 alive ? "up" : "down", last_ping,
363 pingsent, "NA", down_ni,
364 libcfs_nid2str(nid));
366 s += snprintf(s, tmpstr + tmpsiz - s,
367 "%-4d %7d %9d %6s %12d %9d %8lu %7d %s\n",
368 nrefs, nrtrrefs, alive_cnt,
369 alive ? "up" : "down", last_ping,
371 cfs_duration_sec(cfs_time_sub(deadline, now)),
372 down_ni, libcfs_nid2str(nid));
373 LASSERT (tmpstr + tmpsiz - s > 0);
379 len = s - tmpstr; /* how many bytes were written */
381 if (len > *lenp) { /* linux-supplied buffer is too small */
383 } else if (len > 0) { /* wrote something */
384 if (copy_to_user(buffer, tmpstr, len))
388 *ppos = LNET_PROC_POS_MAKE(0, ver, 0, off);
392 LIBCFS_FREE(tmpstr, tmpsiz);
/*
 * sysctl proc_handler that lists LNet peers.
 *
 * The read position *ppos is decoded into four fields: CPT index, table
 * version, hash bucket index and offset inside the bucket.  The same four
 * fields are packed back into *ppos with LNET_PROC_POS_MAKE near the end.
 * Text is built in a 256-byte scratch buffer and copied out with
 * copy_to_user().
 *
 * Visible output:
 *  - a column header (nid, refs, state, last, max, rtr, min, tx, min, queue);
 *  - or one line for a peer found by walking ptable->pt_hash of the peer
 *    table the_lnet.ln_peer_tables[cpt].  The aliveness column stays NA
 *    unless the peer is a router or has aliveness checking enabled.
 * lnet_net_unlock(cpt) is called before the peer line is formatted and on
 * the paths where no peer was selected or the version check failed.
 *
 * NOTE(review): several guards are missing from this excerpt, including the
 * one in front of the assignment to ver right before the version comparison,
 * the matching lnet_net_lock call, the handling of cpt values at or above
 * LNET_CPT_NUMBER and all return statements.
 */
401 proc_lnet_peers(struct ctl_table *table, int write, void __user *buffer,
402 size_t *lenp, loff_t *ppos)
404 const int tmpsiz = 256;
405 struct lnet_peer_table *ptable;
408 int cpt = LNET_PROC_CPT_GET(*ppos);
409 int ver = LNET_PROC_VER_GET(*ppos);
410 int hash = LNET_PROC_HASH_GET(*ppos);
411 int hoff = LNET_PROC_HOFF_GET(*ppos);
415 CLASSERT(LNET_PROC_HASH_BITS >= LNET_PEER_HASH_BITS);
421 if (cpt >= LNET_CPT_NUMBER) {
426 LIBCFS_ALLOC(tmpstr, tmpsiz);
430 s = tmpstr; /* points to current position in tmpstr[] */
433 s += snprintf(s, tmpstr + tmpsiz - s,
434 "%-24s %4s %5s %5s %5s %5s %5s %5s %5s %s\n",
435 "nid", "refs", "state", "last", "max",
436 "rtr", "min", "tx", "min", "queue");
437 LASSERT (tmpstr + tmpsiz - s > 0);
441 struct lnet_peer *peer;
450 ptable = the_lnet.ln_peer_tables[cpt];
452 ver = LNET_PROC_VERSION(ptable->pt_version);
/* version mismatch: release the lock and the scratch buffer */
454 if (ver != LNET_PROC_VERSION(ptable->pt_version)) {
455 lnet_net_unlock(cpt);
456 LIBCFS_FREE(tmpstr, tmpsiz);
/* walk the hash buckets starting at the bucket decoded from *ppos */
460 while (hash < LNET_PEER_HASH_SIZE) {
462 p = ptable->pt_hash[hash].next;
464 while (p != &ptable->pt_hash[hash]) {
465 lnet_peer_t *lp = list_entry(p, lnet_peer_t,
470 /* minor optimization: start from idx+1
471 * on next iteration if we've just
472 * drained lp_hashlist */
473 if (lp->lp_hashlist.next ==
474 &ptable->pt_hash[hash]) {
485 p = lp->lp_hashlist.next;
/* copy the fields to print into locals; the lock is dropped before formatting */
497 lnet_nid_t nid = peer->lp_nid;
498 int nrefs = peer->lp_refcount;
500 char *aliveness = "NA";
501 int maxcr = peer->lp_ni->ni_peertxcredits;
502 int txcr = peer->lp_txcredits;
503 int mintxcr = peer->lp_mintxcredits;
504 int rtrcr = peer->lp_rtrcredits;
505 int minrtrcr = peer->lp_minrtrcredits;
506 int txqnob = peer->lp_txqnob;
508 if (lnet_isrouter(peer) ||
509 lnet_peer_aliveness_enabled(peer))
510 aliveness = peer->lp_alive ? "up" : "down";
512 if (lnet_peer_aliveness_enabled(peer)) {
513 cfs_time_t now = cfs_time_current();
514 cfs_duration_t delta;
516 delta = cfs_time_sub(now, peer->lp_last_alive);
517 lastalive = cfs_duration_sec(delta);
519 /* No need to mess up peers contents with
520 * arbitrarily long integers - it suffices to
521 * know that lastalive is more than 10000s old
523 if (lastalive >= 10000)
527 lnet_net_unlock(cpt);
529 s += snprintf(s, tmpstr + tmpsiz - s,
530 "%-24s %4d %5s %5d %5d %5d %5d %5d %5d %d\n",
531 libcfs_nid2str(nid), nrefs, aliveness,
532 lastalive, maxcr, rtrcr, minrtrcr, txcr,
534 LASSERT (tmpstr + tmpsiz - s > 0);
536 } else { /* peer is NULL */
537 lnet_net_unlock(cpt);
540 if (hash == LNET_PEER_HASH_SIZE) {
544 if (peer == NULL && cpt < LNET_CPT_NUMBER)
549 len = s - tmpstr; /* how many bytes were written */
551 if (len > *lenp) { /* linux-supplied buffer is too small */
553 } else if (len > 0) { /* wrote something */
554 if (copy_to_user(buffer, tmpstr, len))
557 *ppos = LNET_PROC_POS_MAKE(cpt, ver, hash, hoff);
560 LIBCFS_FREE(tmpstr, tmpsiz);
/*
 * Format the router buffer pool statistics for a proc read.
 *
 * Visible behaviour: allocates a scratch string of
 * 64 * (LNET_NRBPOOLS + 1) * LNET_CPT_NUMBER bytes, writes a column header
 * (pages, count, credits, min) and, when the_lnet.ln_rtrpools is not NULL,
 * one line per pool index and per-CPT pool instance with rbp_nbuffers,
 * rbp_credits and rbp_mincredits.  Each pool index is printed while holding
 * lnet_net_lock(LNET_LOCK_EX).  The text is passed to
 * cfs_trace_copyout_string() and the scratch string is freed.
 *
 * NOTE(review): the format strings, the first value printed per line, the
 * computation of len and the return statements are missing from this excerpt.
 */
568 static int __proc_lnet_buffers(void *data, int write,
569 loff_t pos, void __user *buffer, int nob)
581 /* (4 %d) * 4 * LNET_CPT_NUMBER */
582 tmpsiz = 64 * (LNET_NRBPOOLS + 1) * LNET_CPT_NUMBER;
583 LIBCFS_ALLOC(tmpstr, tmpsiz);
587 s = tmpstr; /* points to current position in tmpstr[] */
589 s += snprintf(s, tmpstr + tmpsiz - s,
591 "pages", "count", "credits", "min");
592 LASSERT (tmpstr + tmpsiz - s > 0);
594 if (the_lnet.ln_rtrpools == NULL)
595 goto out; /* I'm not a router */
597 for (idx = 0; idx < LNET_NRBPOOLS; idx++) {
598 lnet_rtrbufpool_t *rbp;
600 lnet_net_lock(LNET_LOCK_EX);
/* rbp iterates over the per-CPT pool arrays; idx selects the pool in each */
601 cfs_percpt_for_each(rbp, i, the_lnet.ln_rtrpools) {
602 s += snprintf(s, tmpstr + tmpsiz - s,
605 rbp[idx].rbp_nbuffers,
606 rbp[idx].rbp_credits,
607 rbp[idx].rbp_mincredits);
608 LASSERT(tmpstr + tmpsiz - s > 0);
610 lnet_net_unlock(LNET_LOCK_EX);
616 if (pos >= min_t(int, len, strlen(tmpstr)))
619 rc = cfs_trace_copyout_string(buffer, nob,
622 LIBCFS_FREE(tmpstr, tmpsiz);
/*
 * sysctl proc_handler wrapper: hands the request to lprocfs_call_handler()
 * with __proc_lnet_buffers as the worker that produces the text.
 */
627 proc_lnet_buffers(struct ctl_table *table, int write, void __user *buffer,
628 size_t *lenp, loff_t *ppos)
630 return lprocfs_call_handler(table->data, write, ppos, buffer, lenp,
631 __proc_lnet_buffers);
/*
 * sysctl proc_handler that lists the local network interfaces (NIs).
 *
 * Text is built in a scratch buffer of 128 * LNET_CPT_NUMBER bytes and
 * copied out with copy_to_user().
 *
 * Visible output:
 *  - a column header (nid, status, alive, refs, peer, rtr, max, tx, min);
 *  - or, for an NI taken from the list the_lnet.ln_nis, one line per TX
 *    queue partition of that NI.  The status column is up when
 *    ni_status->ns_status equals LNET_NI_STATUS_UP and down otherwise.
 *    last_alive is computed from ni_last_alive only when routing is enabled.
 * The local skip is initialised to *ppos - 1.
 *
 * NOTE(review): the path selection, the use of skip inside the list walk,
 * the locking, the special value used for the loopback NI and the return
 * statements are missing from this excerpt.
 */
635 proc_lnet_nis(struct ctl_table *table, int write, void __user *buffer,
636 size_t *lenp, loff_t *ppos)
638 int tmpsiz = 128 * LNET_CPT_NUMBER;
649 LIBCFS_ALLOC(tmpstr, tmpsiz);
653 s = tmpstr; /* points to current position in tmpstr[] */
656 s += snprintf(s, tmpstr + tmpsiz - s,
657 "%-24s %6s %5s %4s %4s %4s %5s %5s %5s\n",
658 "nid", "status", "alive", "refs", "peer",
659 "rtr", "max", "tx", "min");
660 LASSERT (tmpstr + tmpsiz - s > 0);
663 lnet_ni_t *ni = NULL;
664 int skip = *ppos - 1;
668 n = the_lnet.ln_nis.next;
670 while (n != &the_lnet.ln_nis) {
671 lnet_ni_t *a_ni = list_entry(n, lnet_ni_t, ni_list);
683 struct lnet_tx_queue *tq;
685 long now = cfs_time_current_sec();
690 if (the_lnet.ln_routing)
691 last_alive = now - ni->ni_last_alive;
693 /* @lo forever alive */
694 if (ni->ni_lnd->lnd_type == LOLND)
698 LASSERT(ni->ni_status != NULL);
699 stat = (ni->ni_status->ns_status ==
700 LNET_NI_STATUS_UP) ? "up" : "down";
703 /* we actually output credits information for
704 * TX queue of each partition */
705 cfs_percpt_for_each(tq, i, ni->ni_tx_queues) {
/* search ni_cpts for partition i; j reaches ni_ncpts when it is not listed */
706 for (j = 0; ni->ni_cpts != NULL &&
707 j < ni->ni_ncpts; j++) {
708 if (i == ni->ni_cpts[j])
712 if (j == ni->ni_ncpts)
718 s += snprintf(s, tmpstr + tmpsiz - s,
719 "%-24s %6s %5d %4d %4d %4d %5d %5d %5d\n",
720 libcfs_nid2str(ni->ni_nid), stat,
721 last_alive, *ni->ni_refs[i],
722 ni->ni_peertxcredits,
723 ni->ni_peerrtrcredits,
725 tq->tq_credits, tq->tq_credits_min);
729 LASSERT(tmpstr + tmpsiz - s > 0);
735 len = s - tmpstr; /* how many bytes were written */
737 if (len > *lenp) { /* linux-supplied buffer is too small */
739 } else if (len > 0) { /* wrote something */
740 if (copy_to_user(buffer, tmpstr, len))
746 LIBCFS_FREE(tmpstr, tmpsiz);
/*
 * Description of one portal rotor setting.
 * NOTE(review): the member declarations are not visible in this excerpt; the
 * initialisers of portal_rotors use the members pr_value, pr_name and pr_desc.
 */
754 struct lnet_portal_rotors {
/*
 * Table of the supported portal rotor settings: LNET_PTL_ROTOR_OFF,
 * LNET_PTL_ROTOR_ON, LNET_PTL_ROTOR_RR_RT and LNET_PTL_ROTOR_HASH_RT, each
 * with a name and a human readable description.
 * The lookups in __proc_lnet_portal_rotor stop at an entry whose pr_value is
 * negative or whose pr_name is NULL.
 * NOTE(review): that terminating entry and most pr_name initialisers are not
 * visible in this excerpt.
 */
760 static struct lnet_portal_rotors portal_rotors[] = {
762 .pr_value = LNET_PTL_ROTOR_OFF,
764 .pr_desc = "Turn off message rotor for wildcard portals"
767 .pr_value = LNET_PTL_ROTOR_ON,
769 .pr_desc = "round-robin dispatch all PUT messages for "
773 .pr_value = LNET_PTL_ROTOR_RR_RT,
775 .pr_desc = "round-robin dispatch routed PUT message for "
779 .pr_value = LNET_PTL_ROTOR_HASH_RT,
780 .pr_name = "HASH_RT",
781 .pr_desc = "dispatch routed PUT message by hashing source "
782 "NID for wildcard portals"
/*
 * Read or change the portal_rotor setting through proc.
 *
 * A 128-byte buffer is allocated for both directions and freed at the end.
 *
 * Read side (visible part): looks up the portal_rotors entry whose pr_value
 * equals the current portal_rotor, asserts that it was found, formats its
 * name and description into a small brace-delimited text block and passes
 * it to cfs_trace_copyout_string().
 *
 * Write side (visible part): copies the user text in with
 * cfs_trace_copyin_string(), trims white space with cfs_trimwhite() and
 * compares it case-insensitively against each pr_name.  Only
 * strlen(pr_name) characters are compared, so the input merely has to start
 * with a known name.  On a match portal_rotor is set to that entry's
 * pr_value.
 *
 * NOTE(review): the branch on the write flag, the error handling and the
 * return statements are missing from this excerpt.
 */
791 static int __proc_lnet_portal_rotor(void *data, int write,
792 loff_t pos, void __user *buffer, int nob)
794 const int buf_len = 128;
800 LIBCFS_ALLOC(buf, buf_len);
807 for (i = 0; portal_rotors[i].pr_value >= 0; i++) {
808 if (portal_rotors[i].pr_value == portal_rotor)
812 LASSERT(portal_rotors[i].pr_value == portal_rotor);
815 rc = snprintf(buf, buf_len,
816 "{\n\tportals: all\n"
817 "\trotor: %s\n\tdescription: %s\n}",
818 portal_rotors[i].pr_name,
819 portal_rotors[i].pr_desc);
821 if (pos >= min_t(int, rc, buf_len)) {
824 rc = cfs_trace_copyout_string(buffer, nob,
830 rc = cfs_trace_copyin_string(buf, buf_len, buffer, nob);
834 tmp = cfs_trimwhite(buf);
838 for (i = 0; portal_rotors[i].pr_name != NULL; i++) {
/* prefix match: only the length of the table name is compared */
839 if (strncasecmp(portal_rotors[i].pr_name, tmp,
840 strlen(portal_rotors[i].pr_name)) == 0) {
841 portal_rotor = portal_rotors[i].pr_value;
848 LIBCFS_FREE(buf, buf_len);
/*
 * sysctl proc_handler wrapper: hands the request to lprocfs_call_handler()
 * with __proc_lnet_portal_rotor as the worker for both reads and writes.
 */
853 proc_lnet_portal_rotor(struct ctl_table *table, int write, void __user *buffer,
854 size_t *lenp, loff_t *ppos)
856 return lprocfs_call_handler(table->data, write, ppos, buffer, lenp,
857 __proc_lnet_portal_rotor);
/*
 * sysctl entries exported by LNet.  Each entry binds a proc name to one of
 * the proc_lnet_* handlers defined in this file: stats, routes, routers,
 * peers, buffers, nis and portal_rotor.
 * NOTE(review): the procname lines of the stats, peers and nis entries, the
 * mode fields and the terminating entry are not visible in this excerpt.
 */
861 static struct ctl_table lnet_table[] = {
863 * NB No .strategy entries have been provided since sysctl(8) prefers
864 * to go via /proc for portability.
870 .proc_handler = &proc_lnet_stats,
874 .procname = "routes",
876 .proc_handler = &proc_lnet_routes,
880 .procname = "routers",
882 .proc_handler = &proc_lnet_routers,
888 .proc_handler = &proc_lnet_peers,
892 .procname = "buffers",
894 .proc_handler = &proc_lnet_buffers,
900 .proc_handler = &proc_lnet_nis,
904 .procname = "portal_rotor",
906 .proc_handler = &proc_lnet_portal_rotor,
/*
 * Root table passed to register_sysctl_table().
 * NOTE(review): its entries are not visible in this excerpt; presumably it
 * nests lnet_table as a child directory - confirm against the full file.
 */
911 static struct ctl_table top_table[] = {
/*
 * Registration and removal of the sysctl tree.
 * NOTE(review): the headers of the enclosing functions are not visible in
 * this excerpt; presumably these are the bodies of the module init and
 * fini helpers.
 */
/* register only once: skip when a header is already held */
927 if (lnet_table_header == NULL)
928 lnet_table_header = register_sysctl_table(top_table);
/* unregister only when something was registered, then forget the handle */
936 if (lnet_table_header != NULL)
937 unregister_sysctl_table(lnet_table_header);
939 lnet_table_header = NULL;