4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
20 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
21 * CA 95054 USA or visit www.sun.com if you need additional information or
27 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
28 * Use is subject to license terms.
31 * This file is part of Lustre, http://www.lustre.org/
32 * Lustre is a trademark of Sun Microsystems, Inc.
34 * lnet/selftest/conctl.c
36 * Author: Liang Zhen <liangzhen@clusterfs.com>
41 #include <libcfs/libcfsutil.h>
42 #include <lnet/lnetctl.h>
43 #include <lnet/lnetst.h>
/* Sentinel session id; lst_reset_rpcent() and lst_alloc_rpcent() store it in
 * every result entry before the entry is handed to an ioctl. */
46 lst_sid_t LST_INVALID_SID = {LNET_NID_ANY, -1};
/* Session id; its address is passed to lst_new_session_ioctl() by
 * jt_lst_new_session(). */
47 static lst_sid_t session_id;
/* Key copied into the ioctl argument blocks.  The jt_lst_* handlers test it
 * against 0 and then report that env LST_SESSION is missing or not valid. */
48 static int session_key;
/* Per-call transaction statistics: cleared by lst_ioctl() and passed to the
 * kernel as the second ioctl buffer. */
49 static lstcon_trans_stat_t trans_stat;
/* Node of a singly linked list of strings; lstr_next chains the nodes.
 * NOTE(review): code in this file also uses members lstr_sz and lstr_str and
 * the type name lstr_t - presumably declared in the remainder of this
 * typedef, which is not shown here. */
51 typedef struct list_string {
52 struct list_string *lstr_next;
/* Local offsetof(): byte offset of 'memb' inside 'typ', obtained by taking
 * the member's address in a structure placed at address 0.  This file also
 * applies it to an indexed trailing array (e.g. lstr_str[sz]) to size
 * variable-length allocations. */
58 # define offsetof(typ,memb) ((unsigned long)((char *)&(((typ *)0)->memb)))
/* Bookkeeping for lstr_t allocations.  free_lstr() subtracts lstr_sz from
 * alloc_nob.  NOTE(review): the matching increments and every use of
 * alloc_count are not visible here - confirm against the allocator. */
61 static int alloc_count = 0;
62 static int alloc_nob = 0;
/* Body of the lstr_t allocator.  NOTE(review): the header line is not shown;
 * callers in this file invoke it as alloc_lstr(sz) - confirm the name.
 * A single malloc() covers the node header plus 'sz' bytes of lstr_str. */
67 lstr_t *lstr = malloc(offsetof(lstr_t, lstr_str[sz]));
/* Diagnostic for a failed allocation. */
70 fprintf(stderr, "Can't allocate lstr\n");
/* The new node starts out holding an empty string. */
77 lstr->lstr_str[0] = 0;
/* Dispose of one lstr_t node.
 * lstr: node to dispose of; its recorded size (lstr_sz) is deducted from the
 *       alloc_nob byte counter.
 * NOTE(review): the call that actually releases the memory is not visible
 * here - presumably free(lstr). */
83 free_lstr(lstr_t *lstr)
86 alloc_nob -= lstr->lstr_sz;
/* Dispose of a whole list of lstr_t nodes.
 * list: address of the list head.  Nodes are taken from the front until the
 *       head is NULL, so *list is NULL when the loop ends. */
91 free_lstrs(lstr_t **list)
95 while ((lstr = *list) != NULL) {
/* Unlink the front node before it is disposed of. */
96 *list = lstr->lstr_next;
/* Create strings of the form <prefix><number><postfix> and link them in
 * front of *list.
 * list:    head of the list that receives the new nodes
 * prefix:  text placed before the number
 * postfix: text placed after the number
 * lo, hi, stride: numeric range.  NOTE(review): the loop stepping from lo to
 *          hi is not visible here - confirm its bounds and stride handling. */
102 new_lstrs(lstr_t **list, char *prefix, char *postfix,
103 int lo, int hi, int stride)
105 int n1 = strlen(prefix);
106 int n2 = strlen(postfix);
/* Room for both affixes, up to 20 characters of digits, and one more byte. */
107 int sz = n1 + 20 + n2 + 1;
110 lstr_t *n = alloc_lstr(sz);
/* NOTE(review): 'lo' is declared int but formatted with %u, and the bound
 * given to snprintf() is sz - 1 although sz bytes were requested. */
112 snprintf(n->lstr_str, sz - 1, "%s%u%s",
113 prefix, lo, postfix);
/* The new node's successor is the current head of the list. */
115 n->lstr_next = *list;
/* Expand the first bracketed numeric expression found in l->lstr_str.
 * Items between '[' and ']' are separated by ',' and may take the forms
 * "N", "LO-HI" or "LO-HI/STRIDE"; each matching item is turned into strings
 * by new_lstrs(), with l->lstr_str as prefix and b2 as postfix.
 * list: receives the resulting nodes
 * l:    node holding the string to expand
 * NOTE(review): the lines that split the string at '[' and ']' and that
 * compute the return value are not visible here. */
123 expand_lstr(lstr_t **list, lstr_t *l)
125 int nob = strlen(l->lstr_str);
135 b1 = strchr(l->lstr_str, '[');
/* Here the node itself is linked in front of *list (presumably the case in
 * which no '[' was found - confirm). */
137 l->lstr_next = *list;
142 b2 = strchr(b1, ']');
/* A missing ']' and an empty "[]" are both caught by this test. */
143 if (b2 == NULL || b2 == b1 + 1)
151 sep = strchr(expr, ',');
/* Single number: %n must report that nob characters were consumed. */
157 if (sscanf(expr, "%u%n", &x, &n) >= 1 && n == nob) {
159 new_lstrs(list, l->lstr_str, b2, x, x, 1);
/* Range LO-HI, expanded with a stride of 1. */
164 if (sscanf(expr, "%u-%u%n", &x, &y, &n) >= 2 && n == nob &&
167 new_lstrs(list, l->lstr_str, b2, x, y, 1);
/* Range LO-HI/STRIDE. */
172 if (sscanf(expr, "%u-%u/%u%n", &x, &y, &z, &n) >= 3 && n == nob &&
175 new_lstrs(list, l->lstr_str, b2, x, y, z);
/* Continue with the next comma-separated item, if any. */
181 } while ((expr = sep) != NULL);
/* Expand every bracket expression in 'str' by running expand_lstr() over a
 * work list until a pass no longer expands anything.
 * str:  expression to expand; it is copied, not modified
 * head: output list.  NOTE(review): the store into *head is not visible here.
 * A failed expansion is reported as a syntax error in 'str' on stderr. */
189 expand_strs(char *str, lstr_t **head)
/* Seed the work list with a private copy of the input, NUL included. */
197 l = alloc_lstr(strlen(str) + 1);
198 memcpy(l->lstr_str, str, strlen(str) + 1);
206 while ((l = list) != NULL) {
209 rc = expand_lstr(&nlist, l);
211 fprintf(stderr, "Syntax error in \"%s\"\n", str);
219 /* re-order onto 'list' */
220 while ((l = nlist) != NULL) {
221 nlist = l->lstr_next;
/* Another pass is made only while something was expanded and rc > 0. */
226 } while (expanded && rc > 0);
233 while ((l = list) != NULL) {
/* Convert a NID expression into an array of process ids.
 * str:    expression, expanded with expand_strs()
 * countp: count of ids (lst_get_node_count() reads the node count back
 *         through this pointer)
 * idspp:  receives a malloc()ed array of lnet_process_id_t
 * Failures reported on stderr: "Out of memory" and "Invalid nid: ...". */
242 lst_parse_nids(char *str, int *countp, lnet_process_id_t **idspp)
250 rc = expand_strs(str, &head);
260 *idspp = malloc(c * sizeof(lnet_process_id_t));
261 if (*idspp == NULL) {
262 fprintf(stderr, "Out of memory\n");
269 while ((l = head) != NULL) {
/* libcfs_str2nid() yields LNET_NID_ANY for a string it cannot parse, which
 * is treated as an invalid NID here. */
273 (*idspp)[i].nid = libcfs_str2nid(l->lstr_str);
274 if ((*idspp)[i].nid == LNET_NID_ANY) {
275 fprintf(stderr, "Invalid nid: %s\n",
/* Every parsed id gets the fixed pid LUSTRE_LNET_PID. */
280 (*idspp)[i].pid = LUSTRE_LNET_PID;
/* Map an LST_NODE_* state value to a printable string (callers print the
 * result with %s).  LST_NODE_ACTIVE, LST_NODE_BUSY and LST_NODE_DOWN are
 * tested explicitly.
 * state: node state value */
297 lst_node_state2str(int state)
299 if (state == LST_NODE_ACTIVE)
301 if (state == LST_NODE_BUSY)
303 if (state == LST_NODE_DOWN)
/* Translate a state name into its LST_NODE_* value.
 * str: one of "active", "busy", "down", "unknown" or "invalid", compared
 *      without regard to case.
 * "invalid" yields the OR of the UNKNOWN, DOWN and BUSY bits, i.e. every
 * state listed here except ACTIVE.
 * NOTE(review): the value returned for an unrecognised name is not visible
 * here; jt_lst_update_group() rejects results <= 0. */
310 lst_node_str2state(char *str)
312 if (strcasecmp(str, "active") == 0)
313 return LST_NODE_ACTIVE;
314 if (strcasecmp(str, "busy") == 0)
315 return LST_NODE_BUSY;
316 if (strcasecmp(str, "down") == 0)
317 return LST_NODE_DOWN;
318 if (strcasecmp(str, "unknown") == 0)
319 return LST_NODE_UNKNOWN;
320 if (strcasecmp(str, "invalid") == 0)
321 return (LST_NODE_UNKNOWN | LST_NODE_DOWN | LST_NODE_BUSY);
/* Map an LST_TEST_* type value to its name; LST_TEST_PING and LST_TEST_BULK
 * are the types tested for.
 * type: test type value
 * NOTE(review): the returned strings are not visible here; the reverse
 * mapping lst_test_name2type() uses "ping" and "brw". */
327 lst_test_type2name(int type)
329 if (type == LST_TEST_PING)
331 if (type == LST_TEST_BULK)
/* Translate a test name into its LST_TEST_* value.
 * name: "ping" or "brw", compared without regard to case
 * Returns LST_TEST_PING for "ping" and LST_TEST_BULK for "brw".
 * NOTE(review): the value returned for any other name is not visible here. */
338 lst_test_name2type(char *name)
340 if (strcasecmp(name, "ping") == 0)
341 return LST_TEST_PING;
342 if (strcasecmp(name, "brw") == 0)
343 return LST_TEST_BULK;
/* Print the help text of one command by delegating to Parser_printhelp().
 * cmd: command name; callers pass argv[0] */
349 lst_print_usage(char *cmd)
351 Parser_printhelp(cmd);
/* Report a failed command on stderr.
 * sub:        name of the object the command acted on; inserted into the
 *             "Can't find ..." and "... already exists" messages
 * def_format: printf-style fallback format, printed together with the
 *             variadic arguments through vfprintf()
 * NOTE(review): the conditions that select each fixed message are not
 * visible here - presumably a switch on errno; confirm. */
355 lst_print_error(char *sub, const char *def_format, ...)
359 /* local error returned from kernel */
362 fprintf(stderr, "No session exists\n");
365 fprintf(stderr, "Session is shutting down\n");
368 fprintf(stderr, "Unmatched session key or not root\n");
371 fprintf(stderr, "Can't find %s in current session\n", sub);
374 fprintf(stderr, "Invalid parameters list in command line\n");
377 fprintf(stderr, "Bad parameter address\n");
380 fprintf(stderr, "%s already exists\n", sub);
/* Fallback: the caller-supplied format and arguments. */
383 va_start(ap, def_format);
384 vfprintf(stderr, def_format, ap);
/* Empty a list of lstcon_rpc_ent_t result entries.
 * head: list head; entries are unlinked from the front until it is empty.
 * NOTE(review): the release of each unlinked entry is not visible here -
 * presumably free(ent). */
392 lst_free_rpcent(cfs_list_t *head)
394 lstcon_rpc_ent_t *ent;
396 while (!cfs_list_empty(head)) {
397 ent = cfs_list_entry(head->next, lstcon_rpc_ent_t, rpe_link);
399 cfs_list_del(&ent->rpe_link);
/* Return every entry on a result list to its "no result yet" state so the
 * list can be reused for another ioctl.
 * head: list of lstcon_rpc_ent_t entries */
405 lst_reset_rpcent(cfs_list_t *head)
407 lstcon_rpc_ent_t *ent;
409 cfs_list_for_each_entry_typed(ent, head, lstcon_rpc_ent_t, rpe_link) {
/* Invalid session id, wildcard peer, and both error codes cleared. */
410 ent->rpe_sid = LST_INVALID_SID;
411 ent->rpe_peer.nid = LNET_NID_ANY;
412 ent->rpe_peer.pid = LNET_PID_ANY;
413 ent->rpe_rpc_errno = ent->rpe_fwk_errno = 0;
/* Fill 'head' with 'count' freshly allocated, zeroed result entries.
 * head:   list that receives the entries
 * count:  number of entries to create
 * offset: number of rpe_payload bytes reserved behind each entry's header
 * Callers treat a non-zero result as out of memory. */
418 lst_alloc_rpcent(cfs_list_t *head, int count, int offset)
420 lstcon_rpc_ent_t *ent;
423 for (i = 0; i < count; i++) {
/* Header and payload come from one malloc(). */
424 ent = malloc(offsetof(lstcon_rpc_ent_t, rpe_payload[offset]));
/* Entries already on the list are released through lst_free_rpcent()
 * (presumably when the malloc above fails - the test is not visible). */
426 lst_free_rpcent(head);
430 memset(ent, 0, offsetof(lstcon_rpc_ent_t, rpe_payload[offset]));
/* Same "no result yet" markers that lst_reset_rpcent() applies. */
432 ent->rpe_sid = LST_INVALID_SID;
433 ent->rpe_peer.nid = LNET_NID_ANY;
434 ent->rpe_peer.pid = LNET_PID_ANY;
435 cfs_list_add(&ent->rpe_link, head);
/* Print one stderr line for each result entry that carries an error.
 * head:   list of lstcon_rpc_ent_t results
 * optstr: label naming the operation, printed at the start of each line
 * An RPC error (rpe_rpc_errno) is tested before a framework error
 * (rpe_fwk_errno); both are rendered with strerror(). */
442 lst_print_transerr(cfs_list_t *head, char *optstr)
444 lstcon_rpc_ent_t *ent;
446 cfs_list_for_each_entry_typed(ent, head, lstcon_rpc_ent_t, rpe_link) {
/* Entries with neither error set have nothing to report. */
447 if (ent->rpe_rpc_errno == 0 && ent->rpe_fwk_errno == 0)
450 if (ent->rpe_rpc_errno != 0) {
451 fprintf(stderr, "%s RPC failed on %s: %s\n",
452 optstr, libcfs_id2str(ent->rpe_peer),
453 strerror(ent->rpe_rpc_errno));
457 fprintf(stderr, "%s failed on %s: %s\n",
458 optstr, libcfs_id2str(ent->rpe_peer),
459 strerror(ent->rpe_fwk_errno));
/* Forward declarations for ioctl helpers.  lst_info_batch_ioctl() and
 * lst_info_group_ioctl() are called by lst_get_node_count() ahead of the
 * place where lst_info_group_ioctl() is defined in this file. */
463 int lst_info_batch_ioctl(char *batch, int test, int server,
464 lstcon_test_batch_ent_t *entp, int *idxp,
465 int *ndentp, lstcon_node_ent_t *dentsp);
467 int lst_info_group_ioctl(char *name, lstcon_ndlist_ent_t *gent,
468 int *idx, int *count, lstcon_node_ent_t *dents);
470 int lst_query_batch_ioctl(char *batch, int test, int server,
471 int timeout, cfs_list_t *head);
/* Issue one selftest ioctl (IOC_LIBCFS_LNETST on LNET_DEV_ID).
 * opc: selftest opcode, stored in ioc_u32[0]
 * buf: command-specific argument block, passed as buffer 1
 * len: size of 'buf' in bytes
 * The global trans_stat is passed as buffer 2 and is zeroed before the call;
 * afterwards its trs_rpc_errno and trs_fwk_errno fields are inspected.
 * NOTE(review): the return statements are not visible here. */
474 lst_ioctl(unsigned int opc, void *buf, int len)
476 struct libcfs_ioctl_data data;
479 LIBCFS_IOC_INIT (data);
480 data.ioc_u32[0] = opc;
481 data.ioc_plen1 = len;
482 data.ioc_pbuf1 = (char *)buf;
483 data.ioc_plen2 = sizeof(trans_stat);
484 data.ioc_pbuf2 = (char *)&trans_stat;
/* Clear the results of any previous call. */
486 memset(&trans_stat, 0, sizeof(trans_stat));
488 rc = l_ioctl(LNET_DEV_ID, IOC_LIBCFS_LNETST, &data);
490 /* local error, no valid RPC result */
/* An RPC error is tested ahead of a framework error. */
495 if (trans_stat.trs_rpc_errno != 0)
498 /* Framework error */
499 if (trans_stat.trs_fwk_errno != 0)
/* Pack the arguments of LSTIO_SESSION_NEW and issue the ioctl.
 * name:    session name; its strlen() is sent as the name length
 * timeout: session timeout value
 * force:   force flag
 * sid:     address handed to the kernel as the session id pointer
 * Returns the result of lst_ioctl(). */
506 lst_new_session_ioctl (char *name, int timeout, int force, lst_sid_t *sid)
508 lstio_session_new_args_t args = {0};
510 args.lstio_ses_key = session_key;
511 args.lstio_ses_timeout = timeout;
512 args.lstio_ses_force = force;
513 args.lstio_ses_idp = sid;
514 args.lstio_ses_nmlen = strlen(name);
515 args.lstio_ses_namep = name;
517 return lst_ioctl (LSTIO_SESSION_NEW, &args, sizeof(args));
/* Command handler: create a new session.
 * Options: --timeout/-t <value>, --force/-f.
 * The session name is the single remaining argument; with no argument a
 * name of the form user@host is built.  On success a summary line is
 * printed on stdout.
 * argc, argv: command line of the sub-command */
521 jt_lst_new_session(int argc, char **argv)
523 char buf[LST_NAME_SIZE];
531 static struct option session_opts[] =
533 {"timeout", required_argument, 0, 't' },
534 {"force", no_argument, 0, 'f' },
/* A zero session key means env LST_SESSION was missing or not valid. */
538 if (session_key == 0) {
540 "Can't find env LST_SESSION or value is not valid\n");
546 c = getopt_long(argc, argv, "ft:",
547 session_opts, &optidx);
/* NOTE(review): atoi() cannot distinguish "0" from non-numeric input. */
557 timeout = atoi(optarg);
560 lst_print_usage(argv[0]);
566 fprintf(stderr, "Invalid timeout value\n");
/* Exactly one argument left: it is the session name. */
570 if (optind == argc - 1) {
571 name = argv[optind ++];
572 if (strlen(name) >= LST_NAME_SIZE) {
573 fprintf(stderr, "Name size is limited to %d\n",
/* No argument left: derive the name from the user and the host. */
578 } else if (optind == argc) {
579 char user[LST_NAME_SIZE];
580 char host[LST_NAME_SIZE];
581 struct passwd *pw = getpwuid(getuid());
/* The user part is either the numeric uid or the passwd entry's name. */
584 snprintf(user, sizeof(user), "%d", (int)getuid());
586 snprintf(user, sizeof(user), "%s", pw->pw_name);
/* NOTE(review): POSIX leaves it unspecified whether a truncated host name
 * is NUL-terminated - confirm that host is always terminated. */
588 rc = gethostname(host, sizeof(host));
590 snprintf(host, sizeof(host), "unknown_host");
/* user and host may each fill LST_NAME_SIZE - 1 bytes, so the combined
 * name can be truncated by snprintf() here. */
592 snprintf(buf, LST_NAME_SIZE, "%s@%s", user, host);
596 lst_print_usage(argv[0]);
600 rc = lst_new_session_ioctl(name, timeout, force, &session_id);
603 lst_print_error("session", "Failed to create session: %s\n",
608 fprintf(stdout, "SESSION: %s TIMEOUT: %d FORCE: %s\n",
609 name, timeout, force ? "Yes": "No");
/* Pack the arguments of LSTIO_SESSION_INFO and issue the ioctl.
 * name:   buffer handed to the kernel as the session name pointer
 * len:    size of 'name', sent as the name length
 * key:    handed to the kernel as the key pointer
 * sid:    handed to the kernel as the session id pointer
 * ndinfo: handed to the kernel as the node-list summary pointer
 * Returns the result of lst_ioctl(). */
615 lst_session_info_ioctl(char *name, int len, int *key,
616 lst_sid_t *sid, lstcon_ndlist_ent_t *ndinfo)
618 lstio_session_info_args_t args = {0};
620 args.lstio_ses_idp = sid;
621 args.lstio_ses_keyp = key;
622 args.lstio_ses_ndinfo = ndinfo;
623 args.lstio_ses_nmlen = len;
624 args.lstio_ses_namep = name;
626 return lst_ioctl(LSTIO_SESSION_INFO, &args, sizeof(args));
/* Command handler: query the current session and print its name, id
 * (stamp@nid), key and node count on stdout.
 * argc, argv: command line of the sub-command */
630 jt_lst_show_session(int argc, char **argv)
632 lstcon_ndlist_ent_t ndinfo;
634 char name[LST_NAME_SIZE];
638 rc = lst_session_info_ioctl(name, LST_NAME_SIZE, &key, &sid, &ndinfo);
641 lst_print_error("session", "Failed to show session: %s\n",
646 fprintf(stdout, "%s ID: "LPU64"@%s, KEY: %d NODES: %d\n",
647 name, sid.ses_stamp, libcfs_nid2str(sid.ses_nid),
648 key, ndinfo.nle_nnode);
/* Issue LSTIO_SESSION_END for the session identified by session_key.
 * Returns the result of lst_ioctl(). */
654 lst_end_session_ioctl(void)
656 lstio_session_end_args_t args = {0};
658 args.lstio_ses_key = session_key;
659 return lst_ioctl (LSTIO_SESSION_END, &args, sizeof(args));
/* Command handler: end the current session.
 * Prints "session is ended" on stdout; otherwise reports the failure,
 * including the RPC and framework failure counts taken from trans_stat.
 * argc, argv: command line of the sub-command */
663 jt_lst_end_session(int argc, char **argv)
/* A zero session key means env LST_SESSION was missing or not valid. */
667 if (session_key == 0) {
669 "Can't find env LST_SESSION or value is not valid\n");
673 rc = lst_end_session_ioctl();
676 fprintf(stdout, "session is ended\n");
681 lst_print_error("session", "Failed to end session: %s\n",
/* trans_stat was filled in by lst_ioctl() during the call above. */
686 if (trans_stat.trs_rpc_errno != 0) {
688 "[RPC] Failed to send %d session RPCs: %s\n",
689 lstcon_rpc_stat_failure(&trans_stat, 0),
690 strerror(trans_stat.trs_rpc_errno));
693 if (trans_stat.trs_fwk_errno != 0) {
695 "[FWK] Failed to end session on %d nodes: %s\n",
696 lstcon_sesop_stat_failure(&trans_stat, 0),
697 strerror(trans_stat.trs_fwk_errno));
/* Pack the arguments of LSTIO_DEBUG (the "ping" operation) and issue it.
 * str:     target name, or NULL, in which case a name length of 0 is sent
 * type:    LST_OPC_* target type
 * timeout: timeout value
 * count:   number of entries in 'ids'
 * ids:     explicit process ids
 * head:    result list handed to the kernel
 * Returns the result of lst_ioctl(). */
704 lst_ping_ioctl(char *str, int type, int timeout,
705 int count, lnet_process_id_t *ids, cfs_list_t *head)
707 lstio_debug_args_t args = {0};
709 args.lstio_dbg_key = session_key;
710 args.lstio_dbg_type = type;
711 args.lstio_dbg_flags = 0;
712 args.lstio_dbg_timeout = timeout;
713 args.lstio_dbg_nmlen = (str == NULL) ? 0: strlen(str);
714 args.lstio_dbg_namep = str;
715 args.lstio_dbg_count = count;
716 args.lstio_dbg_idsp = ids;
717 args.lstio_dbg_resultp = head;
719 return lst_ioctl (LSTIO_DEBUG, &args, sizeof(args));
/* Determine how many nodes a target contains.
 * type:   LST_OPC_* value selecting how 'str' is interpreted
 * str:    batch name, group name or NID expression, depending on 'type'
 * countp: receives the node count (nle_nnode of the selected node list)
 * idspp:  passed on to lst_parse_nids() when a NID expression is parsed
 * NOTE(review): the case labels for the group and nodes branches and the
 * error returns are not visible here. */
723 lst_get_node_count(int type, char *str, int *countp, lnet_process_id_t **idspp)
725 char buf[LST_NAME_SIZE];
726 lstcon_test_batch_ent_t ent;
/* Results are read from the client node list unless a branch re-points it. */
727 lstcon_ndlist_ent_t *entp = &ent.tbe_cli_nle;
733 case LST_OPC_SESSION:
734 rc = lst_session_info_ioctl(buf, LST_NAME_SIZE,
/* Server side of a batch: select the server node list, then run the same
 * batch query as the client case that follows directly. */
738 case LST_OPC_BATCHSRV:
739 entp = &ent.tbe_srv_nle;
740 case LST_OPC_BATCHCLI:
741 rc = lst_info_batch_ioctl(str, 0, 0, &ent, NULL, NULL, NULL);
745 rc = lst_info_group_ioctl(str, entp, NULL, NULL, NULL);
/* A negative parse result is mapped to -1, anything else to 0. */
749 rc = lst_parse_nids(str, &entp->nle_nnode, idspp) < 0 ? -1 : 0;
758 *countp = entp->nle_nnode;
/* Command handler: ping the nodes of a target and print each node's state.
 * Options: --session/-s, --server/-v, --batch/-b <arg>, --group/-g <arg>,
 * --nodes/-n <arg>, --timeout/-t <value>.
 * A target type must have been selected, the timeout must be positive and
 * no extra arguments may remain; otherwise the usage text is printed.
 * argc, argv: command line of the sub-command */
764 jt_lst_ping(int argc, char **argv)
767 lnet_process_id_t *ids = NULL;
768 lstcon_rpc_ent_t *ent = NULL;
778 static struct option ping_opts[] =
780 {"session", no_argument, 0, 's' },
781 {"server", no_argument, 0, 'v' },
782 {"batch", required_argument, 0, 'b' },
783 {"group", required_argument, 0, 'g' },
784 {"nodes", required_argument, 0, 'n' },
785 {"timeout", required_argument, 0, 't' },
/* A zero session key means env LST_SESSION was missing or not valid. */
789 if (session_key == 0) {
791 "Can't find env LST_SESSION or value is not valid\n");
797 c = getopt_long(argc, argv, "g:b:n:t:sv",
805 type = LST_OPC_SESSION;
809 type = LST_OPC_GROUP;
814 type = LST_OPC_BATCHCLI;
819 type = LST_OPC_NODES;
/* NOTE(review): atoi() cannot distinguish "0" from non-numeric input; the
 * timeout <= 0 test below rejects both. */
824 timeout = atoi(optarg);
832 lst_print_usage(argv[0]);
837 if (type == 0 || timeout <= 0 || optind != argc) {
838 lst_print_usage(argv[0]);
/* The server flag turns a batch target into its server side. */
842 if (type == LST_OPC_BATCHCLI && server)
843 type = LST_OPC_BATCHSRV;
845 rc = lst_get_node_count(type, str, &count, &ids);
847 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
848 (str == NULL) ? "session" : str, strerror(errno));
852 CFS_INIT_LIST_HEAD(&head);
/* Each result entry reserves LST_NAME_SIZE payload bytes; the payload is
 * printed below as the remote session name. */
854 rc = lst_alloc_rpcent(&head, count, LST_NAME_SIZE);
856 fprintf(stderr, "Out of memory\n");
861 fprintf(stdout, "Target %s is empty\n",
862 (str == NULL) ? "session" : str);
866 rc = lst_ping_ioctl(str, type, timeout, count, ids, &head);
867 if (rc == -1) { /* local failure */
868 lst_print_error("debug", "Failed to ping %s: %s\n",
869 (str == NULL) ? "session" : str,
875 /* ignore RPC errors and framework errors */
876 cfs_list_for_each_entry_typed(ent, &head, lstcon_rpc_ent_t, rpe_link) {
/* The session name is shown only for ACTIVE or BUSY nodes: "Unknown" when
 * the RPC failed, "<NULL>" for any other state. */
877 fprintf(stdout, "\t%s: %s [session: %s id: %s]\n",
878 libcfs_id2str(ent->rpe_peer),
879 lst_node_state2str(ent->rpe_state),
880 (ent->rpe_state == LST_NODE_ACTIVE ||
881 ent->rpe_state == LST_NODE_BUSY)?
882 (ent->rpe_rpc_errno == 0 ?
883 &ent->rpe_payload[0] : "Unknown") :
884 "<NULL>", libcfs_nid2str(ent->rpe_sid.ses_nid));
888 lst_free_rpcent(&head);
/* Pack the arguments of LSTIO_NODES_ADD and issue the ioctl.
 * name:  group name; its strlen() is sent as the name length
 * count: number of entries in 'ids'
 * ids:   process ids to add
 * The result list pointer 'resultp' comes from a parameter whose declaration
 * line is not shown here.
 * Returns the result of lst_ioctl(). */
898 lst_add_nodes_ioctl (char *name, int count, lnet_process_id_t *ids,
901 lstio_group_nodes_args_t args = {0};
903 args.lstio_grp_key = session_key;
904 args.lstio_grp_nmlen = strlen(name);
905 args.lstio_grp_namep = name;
906 args.lstio_grp_count = count;
907 args.lstio_grp_idsp = ids;
908 args.lstio_grp_resultp = resultp;
910 return lst_ioctl(LSTIO_NODES_ADD, &args, sizeof(args));
/* Pack the arguments of LSTIO_GROUP_ADD and issue the ioctl.
 * name: group name; its strlen() is sent as the name length
 * Returns the result of lst_ioctl(). */
914 lst_add_group_ioctl (char *name)
916 lstio_group_add_args_t args = {0};
918 args.lstio_grp_key = session_key;
919 args.lstio_grp_nmlen = strlen(name);
920 args.lstio_grp_namep = name;
922 return lst_ioctl(LSTIO_GROUP_ADD, &args, sizeof(args));
/* Command handler: create a group and add nodes to it.
 * The group is created first; every argument from argv[2] onwards is then
 * parsed as a NID expression and its nodes are added to the group.
 * argc, argv: command line of the sub-command
 * NOTE(review): 'ids' is allocated by lst_parse_nids() on every iteration;
 * its release is not visible here - confirm it is freed. */
926 jt_lst_add_group(int argc, char **argv)
929 lnet_process_id_t *ids;
/* A zero session key means env LST_SESSION was missing or not valid. */
935 if (session_key == 0) {
937 "Can't find env LST_SESSION or value is not valid\n");
942 lst_print_usage(argv[0]);
947 if (strlen(name) >= LST_NAME_SIZE) {
948 fprintf(stderr, "Name length is limited to %d\n",
953 rc = lst_add_group_ioctl(name);
955 lst_print_error("group", "Failed to add group %s: %s\n",
956 name, strerror(errno));
960 CFS_INIT_LIST_HEAD(&head);
962 for (i = 2; i < argc; i++) {
963 /* parse address list */
964 rc = lst_parse_nids(argv[i], &count, &ids);
966 fprintf(stderr, "Ignore invalid id list %s\n",
/* No payload is needed for these result entries (offset 0). */
974 rc = lst_alloc_rpcent(&head, count, 0);
976 fprintf(stderr, "Out of memory\n");
980 rc = lst_add_nodes_ioctl(name, count, ids, &head);
985 lst_free_rpcent(&head);
/* NOTE(review): this message reads like a success report but is written to
 * stderr - confirm that is intended. */
986 fprintf(stderr, "%s are added to session\n", argv[i]);
991 lst_free_rpcent(&head);
992 lst_print_error("group", "Failed to add nodes %s: %s\n",
993 argv[i], strerror(errno));
/* NOTE(review): the label printed with per-node errors says
 * "create session" although this command adds nodes to a group. */
997 lst_print_transerr(&head, "create session");
998 lst_free_rpcent(&head);
/* Pack the arguments of LSTIO_GROUP_DEL and issue the ioctl.
 * name: group name; its strlen() is sent as the name length
 * Returns the result of lst_ioctl(). */
1005 lst_del_group_ioctl (char *name)
1007 lstio_group_del_args_t args = {0};
1009 args.lstio_grp_key = session_key;
1010 args.lstio_grp_nmlen = strlen(name);
1011 args.lstio_grp_namep = name;
1013 return lst_ioctl(LSTIO_GROUP_DEL, &args, sizeof(args));
/* Command handler: delete the group named by argv[1].
 * Prints "Group is deleted" on stdout; otherwise reports the failure,
 * including the RPC and framework failure counts taken from trans_stat.
 * argc, argv: command line of the sub-command */
1017 jt_lst_del_group(int argc, char **argv)
/* A zero session key means env LST_SESSION was missing or not valid. */
1021 if (session_key == 0) {
1023 "Can't find env LST_SESSION or value is not valid\n");
1028 lst_print_usage(argv[0]);
1032 rc = lst_del_group_ioctl(argv[1]);
1034 fprintf(stdout, "Group is deleted\n");
1039 lst_print_error("group", "Failed to delete group: %s\n",
1044 fprintf(stderr, "Group is deleted with some errors\n");
/* NOTE(review): both detail messages below speak of ending a session
 * although this command deletes a group - confirm the wording. */
1046 if (trans_stat.trs_rpc_errno != 0) {
1047 fprintf(stderr, "[RPC] Failed to send %d end session RPCs: %s\n",
1048 lstcon_rpc_stat_failure(&trans_stat, 0),
1049 strerror(trans_stat.trs_rpc_errno));
1052 if (trans_stat.trs_fwk_errno != 0) {
1054 "[FWK] Failed to end session on %d nodes: %s\n",
1055 lstcon_sesop_stat_failure(&trans_stat, 0),
1056 strerror(trans_stat.trs_fwk_errno));
/* Pack the arguments of LSTIO_GROUP_UPDATE and issue the ioctl.
 * opc:     LST_GROUP_* operation code
 * name:    group name; its strlen() is sent as the name length
 * clean:   state mask, sent in lstio_grp_args
 * count:   number of entries in 'ids'
 * ids:     process ids the operation applies to
 * resultp: result list handed to the kernel
 * Returns the result of lst_ioctl(). */
1063 lst_update_group_ioctl(int opc, char *name, int clean, int count,
1064 lnet_process_id_t *ids, cfs_list_t *resultp)
1066 lstio_group_update_args_t args = {0};
1068 args.lstio_grp_key = session_key;
1069 args.lstio_grp_opc = opc;
1070 args.lstio_grp_args = clean;
1071 args.lstio_grp_nmlen = strlen(name);
1072 args.lstio_grp_namep = name;
1073 args.lstio_grp_count = count;
1074 args.lstio_grp_idsp = ids;
1075 args.lstio_grp_resultp = resultp;
1077 return lst_ioctl(LSTIO_GROUP_UPDATE, &args, sizeof(args));
/* Command handler: update a group.
 * Options: --refresh/-f, --clean/-c <state>, --remove/-r <arg>.
 * The operations set opc to LST_GROUP_REFRESH, LST_GROUP_CLEAN or
 * LST_GROUP_RMND.  The group name is the single remaining argument.
 * argc, argv: command line of the sub-command */
1081 jt_lst_update_group(int argc, char **argv)
1084 lnet_process_id_t *ids = NULL;
1094 static struct option update_group_opts[] =
1096 {"refresh", no_argument, 0, 'f' },
1097 {"clean", required_argument, 0, 'c' },
1098 {"remove", required_argument, 0, 'r' },
/* A zero session key means env LST_SESSION was missing or not valid. */
1102 if (session_key == 0) {
1104 "Can't find env LST_SESSION or value is not valid\n");
1109 c = getopt_long(argc, argv, "fc:r:",
1110 update_group_opts, &optidx);
1112 /* Detect the end of the options. */
1119 lst_print_usage(argv[0]);
1122 opc = LST_GROUP_REFRESH;
1127 lst_print_usage(argv[0]);
1130 opc = LST_GROUP_RMND;
/* The clean argument is a state name; it is rejected when an operation was
 * already chosen or when the name does not map to a positive state value. */
1135 clean = lst_node_str2state(optarg);
1136 if (opc != 0 || clean <= 0) {
1137 lst_print_usage(argv[0]);
1140 opc = LST_GROUP_CLEAN;
1144 lst_print_usage(argv[0]);
1149 /* no OPC or group is specified */
1150 if (opc == 0 || optind != argc - 1) {
1151 lst_print_usage(argv[0]);
1157 CFS_INIT_LIST_HEAD(&head);
/* Remove and refresh need one result entry per node: remove counts the
 * nodes of the NID expression 'str', refresh those of the group 'grp'. */
1159 if (opc == LST_GROUP_RMND || opc == LST_GROUP_REFRESH) {
1160 rc = lst_get_node_count(opc == LST_GROUP_RMND ? LST_OPC_NODES :
1162 opc == LST_GROUP_RMND ? str : grp,
1166 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
1167 opc == LST_GROUP_RMND ? str : grp,
1172 rc = lst_alloc_rpcent(&head, count, 0);
1174 fprintf(stderr, "Out of memory\n");
1181 rc = lst_update_group_ioctl(opc, grp, clean, count, ids, &head);
1187 lst_free_rpcent(&head);
1192 lst_free_rpcent(&head);
1193 lst_print_error("group", "Failed to update group: %s\n",
/* Per-node errors are listed before the result list is released. */
1198 lst_print_transerr(&head, "Updating group");
1200 lst_free_rpcent(&head);
/* Pack the arguments of LSTIO_GROUP_LIST and issue the ioctl.
 * len:  size of the 'name' buffer, sent as the name length
 * name: buffer handed to the kernel as the group name pointer
 * idx:  index of the group to look up
 * Returns the result of lst_ioctl(). */
1206 lst_list_group_ioctl(int len, char *name, int idx)
1208 lstio_group_list_args_t args = {0};
1210 args.lstio_grp_key = session_key;
1211 args.lstio_grp_idx = idx;
1212 args.lstio_grp_nmlen = len;
1213 args.lstio_grp_namep = name;
1215 return lst_ioctl(LSTIO_GROUP_LIST, &args, sizeof(args));
/* Pack the arguments of LSTIO_GROUP_INFO and issue the ioctl.
 * name:  group name; its strlen() is sent as the name length
 * gent:  handed to the kernel as the group summary pointer
 * idx:   handed to the kernel as the index pointer; callers pass NULL when
 *        only the summary is wanted
 * count: handed to the kernel as the node-entry count pointer, or NULL
 * dents: handed to the kernel as the node-entry array pointer, or NULL
 * Returns the result of lst_ioctl(). */
1219 lst_info_group_ioctl(char *name, lstcon_ndlist_ent_t *gent,
1220 int *idx, int *count, lstcon_node_ent_t *dents)
1222 lstio_group_info_args_t args = {0};
1224 args.lstio_grp_key = session_key;
1225 args.lstio_grp_nmlen = strlen(name);
1226 args.lstio_grp_namep = name;
1227 args.lstio_grp_entp = gent;
1228 args.lstio_grp_idxp = idx;
1229 args.lstio_grp_ndentp = count;
1230 args.lstio_grp_dentsp = dents;
1232 return lst_ioctl(LSTIO_GROUP_INFO, &args, sizeof(args));
/* Print the names of all groups, numbered from 1, followed by the total.
 * Groups are fetched by increasing index; errno == ENOENT is tested to tell
 * the end of the list apart from a real failure. */
1236 lst_list_group_all(void)
1238 char name[LST_NAME_SIZE];
1242 /* no group is specified, list name of all groups */
1243 for (i = 0; ; i++) {
1244 rc = lst_list_group_ioctl(LST_NAME_SIZE, name, i);
1246 fprintf(stdout, "%d) %s\n", i + 1, name);
1250 if (errno == ENOENT)
1253 lst_print_error("group", "Failed to list group: %s\n",
1258 fprintf(stdout, "Total %d groups\n", i);
/* Column header for the per-group node summary printed by
 * jt_lst_list_group(); the five columns match the five counters it prints. */
1263 #define LST_NODES_TITLE "\tACTIVE\tBUSY\tDOWN\tUNKNOWN\tTOTAL\n"
/* Command handler: list groups.
 * Options: --active/-a, --busy/-b, --down/-d, --unknown/-u, --all/-l.
 * With no group argument the names of all groups are listed.  Otherwise,
 * for each named group, either a one-line summary of node counts is printed
 * or the nodes matching the selected states are listed.
 * argc, argv: command line of the sub-command */
1266 jt_lst_list_group(int argc, char **argv)
1268 lstcon_ndlist_ent_t gent;
1269 lstcon_node_ent_t *dents;
1284 static struct option list_group_opts[] =
1286 {"active", no_argument, 0, 'a' },
1287 {"busy", no_argument, 0, 'b' },
1288 {"down", no_argument, 0, 'd' },
1289 {"unknown", no_argument, 0, 'u' },
1290 {"all", no_argument, 0, 'l' },
/* A zero session key means env LST_SESSION was missing or not valid. */
1294 if (session_key == 0) {
1296 "Can't find env LST_SESSION or value is not valid\n");
1301 c = getopt_long(argc, argv, "abdul",
1302 list_group_opts, &optidx);
/* Selecting a state also switches on the verbose (per-node) listing. */
1309 verbose = active = 1;
1321 verbose = unknown = 1;
1328 lst_print_usage(argv[0]);
1333 if (optind == argc) {
1334 /* no group is specified, list name of all groups */
1335 rc = lst_list_group_all();
1341 fprintf(stdout, LST_NODES_TITLE);
1343 /* list nodes in specified groups */
1344 for (i = optind; i < argc; i++) {
/* First query: summary only, no node entries requested. */
1345 rc = lst_info_group_ioctl(argv[i], &gent, NULL, NULL, NULL);
1347 if (errno == ENOENT) {
/* NOTE(review): this format has no conversion, while the sibling call
 * further down uses "Failed to list group: %s\n" - confirm whether an
 * argument is passed on the continuation line and align the two. */
1352 lst_print_error("group", "Failed to list group\n",
1358 fprintf(stdout, "\t%d\t%d\t%d\t%d\t%d\t%s\n",
1359 gent.nle_nactive, gent.nle_nbusy,
1360 gent.nle_ndown, gent.nle_nunknown,
1361 gent.nle_nnode, argv[i]);
1365 fprintf(stdout, "Group [ %s ]\n", argv[i]);
1367 if (gent.nle_nnode == 0) {
1368 fprintf(stdout, "No nodes found [ %s ]\n", argv[i]);
/* Second query: fetch one entry per node reported by the summary. */
1372 count = gent.nle_nnode;
1374 dents = malloc(count * sizeof(lstcon_node_ent_t));
1375 if (dents == NULL) {
1376 fprintf(stderr, "Failed to malloc: %s\n",
1382 rc = lst_info_group_ioctl(argv[i], &gent, &index, &count, dents);
1384 lst_print_error("group", "Failed to list group: %s\n",
/* 'c', used for the getopt result above, is reused here as a counter for
 * the "Total" line below. */
1390 for (j = 0, c = 0; j < count; j++) {
1392 ((active && dents[j].nde_state == LST_NODE_ACTIVE) ||
1393 (busy && dents[j].nde_state == LST_NODE_BUSY) ||
1394 (down && dents[j].nde_state == LST_NODE_DOWN) ||
1395 (unknown && dents[j].nde_state == LST_NODE_UNKNOWN))) {
1397 fprintf(stdout, "\t%s: %s\n",
1398 libcfs_id2str(dents[j].nde_id),
1399 lst_node_state2str(dents[j].nde_state));
1404 fprintf(stdout, "Total %d nodes [ %s ]\n", c, argv[i]);
/* Pack the arguments of LSTIO_STAT_QUERY and issue the ioctl.
 * name:    target name; its strlen() is sent as the name length
 * count:   number of entries in 'idsp'
 * idsp:    explicit process ids
 * timeout: timeout value
 * resultp: result list handed to the kernel
 * Returns the result of lst_ioctl(). */
1413 lst_stat_ioctl (char *name, int count, lnet_process_id_t *idsp,
1414 int timeout, cfs_list_t *resultp)
1416 lstio_stat_args_t args = {0};
1418 args.lstio_sta_key = session_key;
1419 args.lstio_sta_timeout = timeout;
1420 args.lstio_sta_nmlen = strlen(name);
1421 args.lstio_sta_namep = name;
1422 args.lstio_sta_count = count;
1423 args.lstio_sta_idsp = idsp;
1424 args.lstio_sta_resultp = resultp;
1426 return lst_ioctl (LSTIO_STAT_QUERY, &args, sizeof(args));
/* Members of the per-target stat request descriptor.  NOTE(review): the
 * opening line and the srp_name / srp_count members used elsewhere in this
 * file are not shown here. */
/* Links the descriptor into the caller's list of targets. */
1430 cfs_list_t srp_link;
/* Explicit process ids, set when the target is parsed as a NID expression. */
1433 lnet_process_id_t *srp_ids;
/* Two result lists; jt_lst_stat() queries into srp_result[idx] and resets
 * srp_result[1 - idx]. */
1434 cfs_list_t srp_result[2];
1435 } lst_stat_req_param_t;
/* Release a stat request descriptor: both result lists are emptied with
 * lst_free_rpcent() and srp_ids is handled when it is non-NULL.
 * srp: descriptor to release
 * NOTE(review): the release of srp_ids and of srp itself is not visible
 * here. */
1438 lst_stat_req_param_free(lst_stat_req_param_t *srp)
1442 for (i = 0; i < 2; i++)
1443 lst_free_rpcent(&srp->srp_result[i]);
1445 if (srp->srp_ids != NULL)
/* Build the stat request descriptor for one target.
 * name:     target; tried as a group name first and, when that fails with
 *           ENOENT, as a NID expression.  The pointer is stored, not copied.
 * srpp:     output pointer for the new descriptor (the store is not visible
 *           here)
 * save_old: non-zero allocates both result lists so that an earlier sample
 *           can be kept; zero allocates only the first
 * Failures are reported on stderr and the partial descriptor is released
 * with lst_stat_req_param_free(). */
1452 lst_stat_req_param_alloc(char *name, lst_stat_req_param_t **srpp, int save_old)
1454 lst_stat_req_param_t *srp = NULL;
1455 int count = save_old ? 2 : 1;
1459 srp = malloc(sizeof(*srp));
1463 memset(srp, 0, sizeof(*srp));
1464 CFS_INIT_LIST_HEAD(&srp->srp_result[0]);
1465 CFS_INIT_LIST_HEAD(&srp->srp_result[1]);
1467 rc = lst_get_node_count(LST_OPC_GROUP, name,
1468 &srp->srp_count, NULL);
/* Not a known group: fall back to parsing 'name' as a list of NIDs. */
1469 if (rc != 0 && errno == ENOENT) {
1470 rc = lst_get_node_count(LST_OPC_NODES, name,
1471 &srp->srp_ids, &srp->srp_ids);
1476 "Failed to get count of nodes from %s: %s\n",
1477 name, strerror(errno));
1478 lst_stat_req_param_free(srp);
1483 srp->srp_name = name;
/* Each result entry carries three counter blocks back to back: sfw, srpc
 * and lnet counters. */
1485 for (i = 0; i < count; i++) {
1486 rc = lst_alloc_rpcent(&srp->srp_result[i], srp->srp_count,
1487 sizeof(sfw_counters_t) +
1488 sizeof(srpc_counters_t) +
1489 sizeof(lnet_counters_t));
1491 fprintf(stderr, "Out of memory\n");
1501 lst_stat_req_param_free(srp);
1509 } lst_srpc_stat_result;
/* Selectors for the average, minimum and maximum statistic.
 * NOTE(review): the values 0, 1 and 2 equal the literals that
 * lst_print_lnet_stat() passes as the third argument of
 * lst_lnet_stat_value() - presumably the same selector; confirm. */
1511 #define LST_LNET_AVG 0
1512 #define LST_LNET_MIN 1
1513 #define LST_LNET_MAX 2
/* Aggregated LNet statistics over all nodes of one target.  There are four
 * groups (send rate, receive rate, send bandwidth, receive bandwidth), each
 * holding avg, min, max and total in that order.  lst_cal_lnet_stat()
 * computes the bandwidth ("perf") values by dividing byte deltas by
 * 1024 * 1024 and by the interval, and the rate values by dividing message
 * count deltas by the interval. */
1516 float lnet_avg_sndrate;
1517 float lnet_min_sndrate;
1518 float lnet_max_sndrate;
1519 float lnet_total_sndrate;
1521 float lnet_avg_rcvrate;
1522 float lnet_min_rcvrate;
1523 float lnet_max_rcvrate;
1524 float lnet_total_rcvrate;
1526 float lnet_avg_sndperf;
1527 float lnet_min_sndperf;
1528 float lnet_max_sndperf;
1529 float lnet_total_sndperf;
1531 float lnet_avg_rcvperf;
1532 float lnet_min_rcvperf;
1533 float lnet_max_rcvperf;
1534 float lnet_total_rcvperf;
/* Number of samples folded into the totals; divisor for the averages. */
1536 int lnet_stat_count;
1537 } lst_lnet_stat_result_t;
/* Accumulator shared by lst_print_stat() (which zeroes it),
 * lst_cal_lnet_stat() (which updates it) and lst_print_lnet_stat() (which
 * reads it). */
1539 lst_lnet_stat_result_t lnet_stat_result;
/* Fetch one value from lnet_stat_result (callers print it with a float
 * format).
 * bw:   non-zero selects the bandwidth ("perf") fields, zero the rate fields
 * send: direction selector
 * off:  statistic selector; callers pass 0, 1 or 2
 * NOTE(review): the code applying 'send' and 'off' to the base pointer is
 * not visible here; it presumably relies on the field order of
 * lst_lnet_stat_result_t - confirm before reordering that struct. */
1542 lst_lnet_stat_value(int bw, int send, int off)
1546 p = bw ? &lnet_stat_result.lnet_avg_sndperf :
1547 &lnet_stat_result.lnet_avg_sndrate;
/* Compute *df = *tv1 - *tv2.
 * tv1: minuend
 * tv2: subtrahend
 * df:  receives the difference
 * When tv1's microsecond part is the smaller one, a second is borrowed so
 * that df->tv_usec stays non-negative. */
1558 lst_timeval_diff(struct timeval *tv1,
1559 struct timeval *tv2, struct timeval *df)
1561 if (tv1->tv_usec >= tv2->tv_usec) {
1562 df->tv_sec = tv1->tv_sec - tv2->tv_sec;
1563 df->tv_usec = tv1->tv_usec - tv2->tv_usec;
/* Borrow one second (1000000 microseconds). */
1567 df->tv_sec = tv1->tv_sec - 1 - tv2->tv_sec;
1568 df->tv_usec = tv1->tv_usec + 1000000 - tv2->tv_usec;
/* Fold one node's counter delta into the global lnet_stat_result.
 * delta:    length of the sampling interval; used as a divisor
 * lnet_new: counters of the current sample
 * lnet_old: counters of the previous sample
 * For each of send/receive bandwidth and send/receive rate the total, min
 * and max are updated; the averages are then recomputed from the totals.
 * NOTE(review): a minimum of 0 doubles as "not set yet", so a real sample
 * of 0 is replaced by the next sample.  A delta of 0 is not guarded against
 * in the visible code. */
1574 lst_cal_lnet_stat(float delta, lnet_counters_t *lnet_new,
1575 lnet_counters_t *lnet_old)
/* Send bandwidth: byte delta divided by 1024 * 1024 and by the interval. */
1580 perf = (float)(lnet_new->send_length -
1581 lnet_old->send_length) / (1024 * 1024) / delta;
1582 lnet_stat_result.lnet_total_sndperf += perf;
1584 if (lnet_stat_result.lnet_min_sndperf > perf ||
1585 lnet_stat_result.lnet_min_sndperf == 0)
1586 lnet_stat_result.lnet_min_sndperf = perf;
1588 if (lnet_stat_result.lnet_max_sndperf < perf)
1589 lnet_stat_result.lnet_max_sndperf = perf;
/* Receive bandwidth. */
1591 perf = (float)(lnet_new->recv_length -
1592 lnet_old->recv_length) / (1024 * 1024) / delta;
1593 lnet_stat_result.lnet_total_rcvperf += perf;
1595 if (lnet_stat_result.lnet_min_rcvperf > perf ||
1596 lnet_stat_result.lnet_min_rcvperf == 0)
1597 lnet_stat_result.lnet_min_rcvperf = perf;
1599 if (lnet_stat_result.lnet_max_rcvperf < perf)
1600 lnet_stat_result.lnet_max_rcvperf = perf;
/* Send rate: message count delta divided by the interval. */
1602 rate = (lnet_new->send_count - lnet_old->send_count) / delta;
1603 lnet_stat_result.lnet_total_sndrate += rate;
1605 if (lnet_stat_result.lnet_min_sndrate > rate ||
1606 lnet_stat_result.lnet_min_sndrate == 0)
1607 lnet_stat_result.lnet_min_sndrate = rate;
1609 if (lnet_stat_result.lnet_max_sndrate < rate)
1610 lnet_stat_result.lnet_max_sndrate = rate;
/* Receive rate. */
1612 rate = (lnet_new->recv_count - lnet_old->recv_count) / delta;
1613 lnet_stat_result.lnet_total_rcvrate += rate;
1615 if (lnet_stat_result.lnet_min_rcvrate > rate ||
1616 lnet_stat_result.lnet_min_rcvrate == 0)
1617 lnet_stat_result.lnet_min_rcvrate = rate;
1619 if (lnet_stat_result.lnet_max_rcvrate < rate)
1620 lnet_stat_result.lnet_max_rcvrate = rate;
/* One more sample; refresh the four averages. */
1622 lnet_stat_result.lnet_stat_count ++;
1624 lnet_stat_result.lnet_avg_sndrate = lnet_stat_result.lnet_total_sndrate /
1625 lnet_stat_result.lnet_stat_count;
1626 lnet_stat_result.lnet_avg_rcvrate = lnet_stat_result.lnet_total_rcvrate /
1627 lnet_stat_result.lnet_stat_count;
1629 lnet_stat_result.lnet_avg_sndperf = lnet_stat_result.lnet_total_sndperf /
1630 lnet_stat_result.lnet_stat_count;
1631 lnet_stat_result.lnet_avg_rcvperf = lnet_stat_result.lnet_total_rcvperf /
1632 lnet_stat_result.lnet_stat_count;
/* Print the accumulated LNet statistics of one target on stdout.
 * name: target name shown in the section header
 * bwrt: 1 = bandwidth only, 2 = rates only
 * rdwr: 1 = receive only, 2 = send only
 * type: bit mask - 1 prints the average, 2 the minimum, 4 the maximum
 * The sample count is tested against 0 first.  The outer loop index i picks
 * rates (0) or bandwidth, the inner index j picks the 'R' (0) or 'W' line. */
1637 lst_print_lnet_stat(char *name, int bwrt, int rdwr, int type)
1646 if (lnet_stat_result.lnet_stat_count == 0)
1649 if (bwrt == 1) /* bw only */
1652 if (bwrt == 2) /* rates only */
1655 if (rdwr == 1) /* recv only */
1658 if (rdwr == 2) /* send only */
1661 for (i = start1; i <= end1; i++) {
1662 fprintf(stdout, "[LNet %s of %s]\n",
1663 i == 0 ? "Rates" : "Bandwidth", name);
1665 for (j = start2; j <= end2; j++) {
1666 fprintf(stdout, "[%c] ", j == 0 ? 'R' : 'W');
/* Rates are printed without decimals, bandwidth with two. */
1668 if ((type & 1) != 0) {
1669 fprintf(stdout, i == 0 ? "Avg: %-8.0f RPC/s " :
1670 "Avg: %-8.2f MB/s ",
1671 lst_lnet_stat_value(i, j, 0));
1674 if ((type & 2) != 0) {
1675 fprintf(stdout, i == 0 ? "Min: %-8.0f RPC/s " :
1676 "Min: %-8.2f MB/s ",
1677 lst_lnet_stat_value(i, j, 1));
1680 if ((type & 4) != 0) {
1681 fprintf(stdout, i == 0 ? "Max: %-8.0f RPC/s" :
1683 lst_lnet_stat_value(i, j, 2));
1686 fprintf(stdout, "\n");
/* Compare the newest sample of every node with the previous one and print
 * the resulting statistics.
 * name:    target name, forwarded to lst_print_lnet_stat()
 * resultp: array of two result lists; resultp[idx] holds the new sample and
 *          resultp[1 - idx] the old one
 * idx:     index of the list holding the new sample
 * lnet:    non-zero selects the LNet statistics; the other case is marked
 *          TODO in the code
 * bwrt, rdwr, type: output selectors forwarded to lst_print_lnet_stat()
 * Entries are moved pairwise onto two temporary lists while they are
 * processed and spliced back afterwards. */
1692 lst_print_stat(char *name, cfs_list_t *resultp,
1693 int idx, int lnet, int bwrt, int rdwr, int type)
1696 lstcon_rpc_ent_t *new;
1697 lstcon_rpc_ent_t *old;
1698 sfw_counters_t *sfwk_new;
1699 sfw_counters_t *sfwk_old;
1700 srpc_counters_t *srpc_new;
1701 srpc_counters_t *srpc_old;
1702 lnet_counters_t *lnet_new;
1703 lnet_counters_t *lnet_old;
1707 CFS_INIT_LIST_HEAD(&tmp[0]);
1708 CFS_INIT_LIST_HEAD(&tmp[1]);
/* Start every report from a clean accumulator. */
1710 memset(&lnet_stat_result, 0, sizeof(lnet_stat_result));
1712 while (!cfs_list_empty(&resultp[idx])) {
/* The old list ran out before the new one: the node set has changed. */
1713 if (cfs_list_empty(&resultp[1 - idx])) {
1714 fprintf(stderr, "Group is changed, re-run stat\n");
1718 new = cfs_list_entry(resultp[idx].next, lstcon_rpc_ent_t,
1720 old = cfs_list_entry(resultp[1 - idx].next, lstcon_rpc_ent_t,
1723 /* first time get stats result, can't calculate diff */
1724 if (new->rpe_peer.nid == LNET_NID_ANY)
1727 if (new->rpe_peer.nid != old->rpe_peer.nid ||
1728 new->rpe_peer.pid != old->rpe_peer.pid) {
1729 /* Something wrong. i.e, somebody change the group */
/* Park both entries on the temporary lists, preserving their order. */
1733 cfs_list_del(&new->rpe_link);
1734 cfs_list_add_tail(&new->rpe_link, &tmp[idx]);
1736 cfs_list_del(&old->rpe_link);
1737 cfs_list_add_tail(&old->rpe_link, &tmp[1 - idx]);
/* A pair with an RPC or framework error on either side is tested for here. */
1739 if (new->rpe_rpc_errno != 0 || new->rpe_fwk_errno != 0 ||
1740 old->rpe_rpc_errno != 0 || old->rpe_fwk_errno != 0) {
/* The payload holds sfw, srpc and lnet counters back to back, matching the
 * size reserved by lst_stat_req_param_alloc(). */
1745 sfwk_new = (sfw_counters_t *)&new->rpe_payload[0];
1746 sfwk_old = (sfw_counters_t *)&old->rpe_payload[0];
1748 srpc_new = (srpc_counters_t *)((char *)sfwk_new + sizeof(*sfwk_new));
1749 srpc_old = (srpc_counters_t *)((char *)sfwk_old + sizeof(*sfwk_old));
1751 lnet_new = (lnet_counters_t *)((char *)srpc_new + sizeof(*srpc_new));
1752 lnet_old = (lnet_counters_t *)((char *)srpc_old + sizeof(*srpc_old));
1754 /* Prior to version 2.3, the running_ms field was a counter for
1755 * the number of running tests. We are looking at this value
1756 * to determine if it is a millisecond timestamp (>= 2.3) or a
1757 * test counter (< 2.3). The number 500 is being used for this
1758 * barrier as the test counter should never get this high, and
1759 * the timestamp should never get this low. */
1761 if (sfwk_new->running_ms > 500) {
1762 /* use the timestamp from the remote node, not our
1763 * rpe_stamp from when we copied up the data out of
1766 delta = (float) (sfwk_new->running_ms -
1767 sfwk_old->running_ms) / 1000;
1771 lst_timeval_diff(&new->rpe_stamp, &old->rpe_stamp, &tv);
1772 delta = tv.tv_sec + (float)tv.tv_usec / 1000000;
1775 if (!lnet) /* TODO */
1778 lst_cal_lnet_stat(delta, lnet_new, lnet_old);
/* Hand the processed entries back to the caller's lists. */
1781 cfs_list_splice(&tmp[idx], &resultp[idx]);
1782 cfs_list_splice(&tmp[1 - idx], &resultp[1 - idx]);
1785 fprintf(stdout, "Failed to stat on %d nodes\n", errcount);
1787 if (!lnet) /* TODO */
1790 lst_print_lnet_stat(name, bwrt, rdwr, type);
/* Command handler: periodically query and print statistics of one or more
 * targets (group names or NID expressions given as arguments).
 * Options: --timeout/-t, --delay/-d, --count, --lnet/-l, --rpc/-c, --bw/-b,
 * --rate/-a, --read/-r, --write/-w, --avg/-g, --min/-n, --max/-x.
 * Each round waits until 'delay' seconds have passed since the last round,
 * queries every target into one of its two result lists, prints the
 * difference against the other list and then resets that other list.
 * argc, argv: command line of the sub-command */
1794 jt_lst_stat(int argc, char **argv)
1797 lst_stat_req_param_t *srp;
1800 int timeout = 5; /* default timeout, 5 sec */
1801 int delay = 5; /* default delay, 5 sec */
1802 int count = -1; /* run forever */
1803 int lnet = 1; /* lnet stat by default */
1811 static struct option stat_opts[] =
1813 {"timeout" , required_argument, 0, 't' },
1814 {"delay" , required_argument, 0, 'd' },
1815 {"count" , required_argument, 0, 'o' },
1816 {"lnet" , no_argument, 0, 'l' },
1817 {"rpc" , no_argument, 0, 'c' },
1818 {"bw" , no_argument, 0, 'b' },
1819 {"rate" , no_argument, 0, 'a' },
1820 {"read" , no_argument, 0, 'r' },
1821 {"write" , no_argument, 0, 'w' },
1822 {"avg" , no_argument, 0, 'g' },
1823 {"min" , no_argument, 0, 'n' },
1824 {"max" , no_argument, 0, 'x' },
/* A zero session key means env LST_SESSION was missing or not valid. */
1828 if (session_key == 0) {
1830 "Can't find env LST_SESSION or value is not valid\n");
/* NOTE(review): 'o' is absent from the short option string, so the count
 * can only be given in its long form - confirm this is intended. */
1835 c = getopt_long(argc, argv, "t:d:lcbarwgnx", stat_opts, &optidx);
/* NOTE(review): atoi() cannot distinguish "0" from non-numeric input. */
1842 timeout = atoi(optarg);
1845 delay = atoi(optarg);
1848 count = atoi(optarg);
1891 lst_print_usage(argv[0]);
/* At least one target argument is required. */
1896 if (optind == argc) {
1897 lst_print_usage(argv[0]);
1901 if (timeout <= 0 || delay <= 0) {
1902 fprintf(stderr, "Invalid timeout or delay value\n");
1907 fprintf(stderr, "Invalid count value\n");
1911 /* extra count to get first data point */
1915 CFS_INIT_LIST_HEAD(&head);
/* One descriptor per target, each with both result lists allocated. */
1917 while (optind < argc) {
1918 rc = lst_stat_req_param_alloc(argv[optind++], &srp, 1);
1922 cfs_list_add_tail(&srp->srp_link, &head);
/* Pace the rounds: sleep for whatever remains of 'delay'. */
1926 time_t now = time(NULL);
1928 if (now - last < delay) {
1929 sleep(delay - now + last);
1935 cfs_list_for_each_entry_typed(srp, &head, lst_stat_req_param_t,
1937 rc = lst_stat_ioctl(srp->srp_name,
1938 srp->srp_count, srp->srp_ids,
1939 timeout, &srp->srp_result[idx]);
1941 lst_print_error("stat", "Failed to stat %s: %s\n",
1942 srp->srp_name, strerror(errno));
1946 lst_print_stat(srp->srp_name, srp->srp_result,
1947 idx, lnet, bwrt, rdwr, type);
/* The other list is cleared so it can receive a later sample. */
1949 lst_reset_rpcent(&srp->srp_result[1 - idx]);
1956 } while (count == -1 || count > 0);
/* Release every descriptor. */
1959 while (!cfs_list_empty(&head)) {
1960 srp = cfs_list_entry(head.next, lst_stat_req_param_t, srp_link);
1962 cfs_list_del(&srp->srp_link);
1963 lst_stat_req_param_free(srp);
/*
 * Handler for the "lst show_error" command.
 *
 * For every name given on the command line, fetches counters with
 * lst_stat_ioctl and reports, per peer, the session (brw/ping) error counts
 * and the RPC error/dropped/expired counts, followed by a per-name total of
 * error nodes. Accepts a single flag option, --session / -s.
 *
 * \param argc  number of entries in argv
 * \param argv  command name followed by options and target names
 */
1970 jt_lst_show_error(int argc, char **argv)
1973 lst_stat_req_param_t *srp;
1974 lstcon_rpc_ent_t *ent;
1975 sfw_counters_t *sfwk;
1976 srpc_counters_t *srpc;
1977 lnet_counters_t *lnet;
1984 static struct option show_error_opts[] =
1986 {"session", no_argument, 0, 's' },
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
1990 if (session_key == 0) {
1992 "Can't find env LST_SESSION or value is not valid\n");
1997 c = getopt_long(argc, argv, "s", show_error_opts, &optidx);
2008 lst_print_usage(argv[0]);
/* At least one target name must follow the options. */
2013 if (optind == argc) {
2014 lst_print_usage(argv[0]);
2018 CFS_INIT_LIST_HEAD(&head);
/* Allocate one request parameter per remaining argument and queue it. */
2020 while (optind < argc) {
2021 rc = lst_stat_req_param_alloc(argv[optind++], &srp, 0);
2025 cfs_list_add_tail(&srp->srp_link, &head);
2028 cfs_list_for_each_entry_typed(srp, &head, lst_stat_req_param_t,
/* Fixed timeout of 10; results always land in slot 0. */
2030 rc = lst_stat_ioctl(srp->srp_name, srp->srp_count,
2031 srp->srp_ids, 10, &srp->srp_result[0]);
2034 lst_print_error(srp->srp_name, "Failed to show errors of %s: %s\n",
2035 srp->srp_name, strerror(errno));
2039 fprintf(stdout, "%s:\n", srp->srp_name);
2043 cfs_list_for_each_entry_typed(ent, &srp->srp_result[0],
2044 lstcon_rpc_ent_t, rpe_link) {
/* Peers whose RPC or framework call failed are reported on stderr. */
2045 if (ent->rpe_rpc_errno != 0) {
2047 fprintf(stderr, "RPC failure, can't show error on %s\n",
2048 libcfs_id2str(ent->rpe_peer));
2052 if (ent->rpe_fwk_errno != 0) {
2054 fprintf(stderr, "Framework failure, can't show error on %s\n",
2055 libcfs_id2str(ent->rpe_peer));
/*
 * The payload is read as three counter structures laid out back to
 * back: sfw_counters_t, then srpc_counters_t, then lnet_counters_t.
 */
2059 sfwk = (sfw_counters_t *)&ent->rpe_payload[0];
2060 srpc = (srpc_counters_t *)((char *)sfwk + sizeof(*sfwk));
2061 lnet = (lnet_counters_t *)((char *)srpc + sizeof(*srpc));
2063 if (srpc->errors == 0 &&
2064 sfwk->brw_errors == 0 && sfwk->ping_errors == 0)
2068 sfwk->brw_errors == 0 && sfwk->ping_errors == 0)
/* The line ends with ' ' when RPC details follow, '\n' otherwise. */
2073 fprintf(stderr, "%s: [Session %d brw errors, %d ping errors]%c",
2074 libcfs_id2str(ent->rpe_peer),
2075 sfwk->brw_errors, sfwk->ping_errors,
2076 show_rpc ? ' ' : '\n');
2081 fprintf(stderr, "[RPC: %d errors, %d dropped, %d expired]\n",
2082 srpc->errors, srpc->rpcs_dropped, srpc->rpcs_expired);
2085 fprintf(stdout, "Total %d error nodes in %s\n", ecount, srp->srp_name);
/* Unlink and free every queued request parameter. */
2088 while (!cfs_list_empty(&head)) {
2089 srp = cfs_list_entry(head.next, lst_stat_req_param_t, srp_link);
2091 cfs_list_del(&srp->srp_link);
2092 lst_stat_req_param_free(srp);
/*
 * Issue the LSTIO_BATCH_ADD ioctl for the batch called \a name.
 *
 * The argument block is zero-initialised, then filled with the current
 * session key and the name (pointer plus strlen() length).
 *
 * \param name  NUL-terminated batch name; must not be NULL (strlen is called)
 * \return      whatever lst_ioctl() returns
 */
2099 lst_add_batch_ioctl (char *name)
2101 lstio_batch_add_args_t args = {0};
2103 args.lstio_bat_key = session_key;
2104 args.lstio_bat_nmlen = strlen(name);
2105 args.lstio_bat_namep = name;
2107 return lst_ioctl (LSTIO_BATCH_ADD, &args, sizeof(args));
/*
 * Handler for the "lst add_batch" command.
 *
 * Requires a valid session key, rejects names whose length is
 * LST_NAME_SIZE or more, then creates the batch with lst_add_batch_ioctl.
 *
 * \param argc  number of entries in argv
 * \param argv  command name followed by the batch name
 */
2111 jt_lst_add_batch(int argc, char **argv)
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
2116 if (session_key == 0) {
2118 "Can't find env LST_SESSION or value is not valid\n");
2123 lst_print_usage(argv[0]);
/* The name must be strictly shorter than LST_NAME_SIZE. */
2128 if (strlen(name) >= LST_NAME_SIZE) {
2129 fprintf(stderr, "Name length is limited to %d\n",
2134 rc = lst_add_batch_ioctl(name);
2138 lst_print_error("batch", "Failed to create batch: %s\n",
/*
 * Issue the LSTIO_BATCH_START ioctl for the batch called \a name.
 *
 * \param name     NUL-terminated batch name; must not be NULL
 * \param timeout  stored in lstio_bat_timeout
 * \param resultp  list head passed to the ioctl as lstio_bat_resultp
 * \return         whatever lst_ioctl() returns
 */
2145 lst_start_batch_ioctl (char *name, int timeout, cfs_list_t *resultp)
2147 lstio_batch_run_args_t args = {0};
2149 args.lstio_bat_key = session_key;
2150 args.lstio_bat_timeout = timeout;
2151 args.lstio_bat_nmlen = strlen(name);
2152 args.lstio_bat_namep = name;
2153 args.lstio_bat_resultp = resultp;
2155 return lst_ioctl(LSTIO_BATCH_START, &args, sizeof(args));
/*
 * Handler for the "lst run" command: starts a batch.
 *
 * Accepts --timeout / -t with a value. With no positional argument the
 * batch name is LST_DEFAULT_BATCH; with exactly one it is that argument.
 * The client node count of the batch sizes the result list handed to
 * lst_start_batch_ioctl.
 *
 * \param argc  number of entries in argv
 * \param argv  command name followed by options and an optional batch name
 */
2159 jt_lst_start_batch(int argc, char **argv)
2169 static struct option start_batch_opts[] =
2171 {"timeout", required_argument, 0, 't' },
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
2175 if (session_key == 0) {
2177 "Can't find env LST_SESSION or value is not valid\n");
2182 c = getopt_long(argc, argv, "t:",
2183 start_batch_opts, &optidx);
2185 /* Detect the end of the options. */
2191 timeout = atoi(optarg);
2194 lst_print_usage(argv[0]);
/* No name: default batch. One name: use it. */
2199 if (optind == argc) {
2200 batch = LST_DEFAULT_BATCH;
2202 } else if (optind == argc - 1) {
2203 batch = argv[optind];
2206 lst_print_usage(argv[0]);
/* Node count of the batch determines how many result entries to allocate. */
2210 rc = lst_get_node_count(LST_OPC_BATCHCLI, batch, &count, NULL);
2212 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
2213 batch, strerror(errno));
2217 CFS_INIT_LIST_HEAD(&head);
2219 rc = lst_alloc_rpcent(&head, count, 0);
2221 fprintf(stderr, "Out of memory\n");
2225 rc = lst_start_batch_ioctl(batch, timeout, &head);
/* Each outcome below releases the result list with lst_free_rpcent. */
2228 fprintf(stdout, "%s is running now\n", batch);
2229 lst_free_rpcent(&head);
2234 lst_print_error("batch", "Failed to start batch: %s\n",
2236 lst_free_rpcent(&head);
2240 lst_print_transerr(&head, "Run batch");
2242 lst_free_rpcent(&head);
/*
 * Issue the LSTIO_BATCH_STOP ioctl for the batch called \a name.
 *
 * \param name     NUL-terminated batch name; must not be NULL
 * \param force    stored in lstio_bat_force
 * \param resultp  list head passed to the ioctl as lstio_bat_resultp
 * \return         whatever lst_ioctl() returns
 */
2248 lst_stop_batch_ioctl(char *name, int force, cfs_list_t *resultp)
2250 lstio_batch_stop_args_t args = {0};
2252 args.lstio_bat_key = session_key;
2253 args.lstio_bat_force = force;
2254 args.lstio_bat_nmlen = strlen(name);
2255 args.lstio_bat_namep = name;
2256 args.lstio_bat_resultp = resultp;
2258 return lst_ioctl(LSTIO_BATCH_STOP, &args, sizeof(args));
/*
 * Handler for the "lst stop" command: stops a batch.
 *
 * Accepts the flag --force / -f. With no positional argument the batch name
 * is LST_DEFAULT_BATCH; with exactly one it is that argument. After the
 * stop request the batch state is queried and the run/failure counters in
 * trans_stat decide between "in stopping" and "Batch is stopped".
 *
 * \param argc  number of entries in argv
 * \param argv  command name followed by options and an optional batch name
 */
2262 jt_lst_stop_batch(int argc, char **argv)
2272 static struct option stop_batch_opts[] =
2274 {"force", no_argument, 0, 'f' },
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
2278 if (session_key == 0) {
2280 "Can't find env LST_SESSION or value is not valid\n");
2285 c = getopt_long(argc, argv, "f",
2286 stop_batch_opts, &optidx);
2288 /* Detect the end of the options. */
2297 lst_print_usage(argv[0]);
/* No name: default batch. One name: use it. */
2302 if (optind == argc) {
2303 batch = LST_DEFAULT_BATCH;
2305 } else if (optind == argc - 1) {
2306 batch = argv[optind];
2309 lst_print_usage(argv[0]);
/* Node count of the batch determines how many result entries to allocate. */
2313 rc = lst_get_node_count(LST_OPC_BATCHCLI, batch, &count, NULL);
2315 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
2316 batch, strerror(errno));
2320 CFS_INIT_LIST_HEAD(&head);
2322 rc = lst_alloc_rpcent(&head, count, 0);
2324 fprintf(stderr, "Out of memory\n");
2328 rc = lst_stop_batch_ioctl(batch, force, &head);
/*
 * Reuse the same result list to query the batch: test index 0,
 * server == 0 (client side), timeout 30.
 */
2333 lst_reset_rpcent(&head);
2335 rc = lst_query_batch_ioctl(batch, 0, 0, 30, &head);
/* No running and no failed entries in trans_stat. */
2339 if (lstcon_tsbqry_stat_run(&trans_stat, 0) == 0 &&
2340 lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0)
2343 fprintf(stdout, "%d batch in stopping\n",
2344 lstcon_tsbqry_stat_run(&trans_stat, 0));
/* Each outcome below releases the result list with lst_free_rpcent. */
2348 fprintf(stdout, "Batch is stopped\n");
2349 lst_free_rpcent(&head);
2354 lst_print_error("batch", "Failed to stop batch: %s\n",
2356 lst_free_rpcent(&head);
2360 lst_print_transerr(&head, "stop batch");
2362 lst_free_rpcent(&head);
/*
 * Issue the LSTIO_BATCH_LIST ioctl for the batch at position \a index.
 *
 * \param len    stored in lstio_bat_nmlen; callers pass the size of \a name
 * \param name   buffer passed as lstio_bat_namep (presumably filled with the
 *               batch name by the ioctl -- confirm against the kernel side)
 * \param index  stored in lstio_bat_idx
 * \return       whatever lst_ioctl() returns
 */
2368 lst_list_batch_ioctl(int len, char *name, int index)
2370 lstio_batch_list_args_t args = {0};
2372 args.lstio_bat_key = session_key;
2373 args.lstio_bat_idx = index;
2374 args.lstio_bat_nmlen = len;
2375 args.lstio_bat_namep = name;
2377 return lst_ioctl(LSTIO_BATCH_LIST, &args, sizeof(args));
/*
 * Issue the LSTIO_BATCH_INFO ioctl for a batch or one of its tests.
 *
 * Callers in this file pass either \a entp alone (summary) or
 * \a idxp / \a ndentp / \a dentsp (node listing), with the others NULL.
 *
 * \param batch   NUL-terminated batch name; must not be NULL
 * \param test    stored in lstio_bat_testidx
 * \param server  stored in lstio_bat_server
 * \param entp    stored in lstio_bat_entp
 * \param idxp    stored in lstio_bat_idxp
 * \param ndentp  stored in lstio_bat_ndentp
 * \param dentsp  stored in lstio_bat_dentsp
 * \return        whatever lst_ioctl() returns
 */
2381 lst_info_batch_ioctl(char *batch, int test, int server,
2382 lstcon_test_batch_ent_t *entp, int *idxp,
2383 int *ndentp, lstcon_node_ent_t *dentsp)
2385 lstio_batch_info_args_t args = {0};
2387 args.lstio_bat_key = session_key;
2388 args.lstio_bat_nmlen = strlen(batch);
2389 args.lstio_bat_namep = batch;
2390 args.lstio_bat_server = server;
2391 args.lstio_bat_testidx = test;
2392 args.lstio_bat_entp = entp;
2393 args.lstio_bat_idxp = idxp;
2394 args.lstio_bat_ndentp = ndentp;
2395 args.lstio_bat_dentsp = dentsp;
2397 return lst_ioctl(LSTIO_BATCH_INFO, &args, sizeof(args));
/*
 * Print the name of every batch, numbered from 1, followed by the total.
 *
 * Walks batch indices upward from 0 with lst_list_batch_ioctl, using a
 * local buffer of LST_NAME_SIZE bytes for each name.
 */
2401 lst_list_batch_all(void)
2403 char name[LST_NAME_SIZE];
/* No loop condition: the exit is decided inside the body. */
2407 for (i = 0; ; i++) {
2408 rc = lst_list_batch_ioctl(LST_NAME_SIZE, name, i);
2410 fprintf(stdout, "%d) %s\n", i + 1, name);
/* ENOENT presumably marks the end of the list -- confirm. */
2414 if (errno == ENOENT)
2417 lst_print_error("batch", "Failed to list batch: %s\n",
2422 fprintf(stdout, "Total %d batches\n", i);
/*
 * Print the nodes of a batch or test, one per line with their state,
 * followed by a total.
 *
 * \param batch    batch name
 * \param test     test index; values > 0 select "test" wording in errors
 * \param server   forwarded to lst_info_batch_ioctl
 * \param count    number of node entries to allocate and request
 * \param active   when zero, nodes in state LST_NODE_ACTIVE match the
 *                 filter below
 * \param invalid  when zero, nodes in state LST_NODE_BUSY, LST_NODE_DOWN
 *                 or LST_NODE_UNKNOWN match the filter below
 */
2428 lst_list_tsb_nodes(char *batch, int test, int server,
2429 int count, int active, int invalid)
2431 lstcon_node_ent_t *dents;
2440 /* verbose list, show nodes in batch or test */
/* NOTE(review): the allocation-failure message goes to stdout, not stderr. */
2441 dents = malloc(count * sizeof(lstcon_node_ent_t));
2442 if (dents == NULL) {
2443 fprintf(stdout, "Can't allocate memory\n");
/* count is passed by address, so the ioctl may update it. */
2447 rc = lst_info_batch_ioctl(batch, test, server,
2448 NULL, &index, &count, dents);
2451 lst_print_error((test > 0) ? "test" : "batch",
2452 (test > 0) ? "Failed to query test: %s\n" :
2453 "Failed to query batch: %s\n",
/* Entries matching this filter are presumably skipped -- confirm. */
2458 for (i = 0, c = 0; i < count; i++) {
2459 if ((!active && dents[i].nde_state == LST_NODE_ACTIVE) ||
2460 (!invalid && (dents[i].nde_state == LST_NODE_BUSY ||
2461 dents[i].nde_state == LST_NODE_DOWN ||
2462 dents[i].nde_state == LST_NODE_UNKNOWN)))
2465 fprintf(stdout, "\t%s: %s\n",
2466 libcfs_id2str(dents[i].nde_id),
2467 lst_node_state2str(dents[i].nde_state));
2471 fprintf(stdout, "Total %d nodes\n", c);
/*
 * Handler for the "lst list_batch" command.
 *
 * With no positional argument, lists all batches. With exactly one batch
 * name, shows either a summary of the batch/test (counts of active, busy,
 * down, unknown and total nodes for client and server) or, in verbose
 * mode, the individual nodes via lst_list_tsb_nodes.
 *
 * Options (see list_batch_opts): --test takes a value; --invalid,
 * --active, --all and --server are flags.
 *
 * \param argc  number of entries in argv
 * \param argv  command name followed by options and an optional batch name
 */
2478 jt_lst_list_batch(int argc, char **argv)
2480 lstcon_test_batch_ent_t ent;
2483 int verbose = 0; /* list nodes in batch or test */
2492 static struct option list_batch_opts[] =
2494 {"test", required_argument, 0, 't' },
2495 {"invalid", no_argument, 0, 'i' },
2496 {"active", no_argument, 0, 'a' },
2497 {"all", no_argument, 0, 'l' },
2498 {"server", no_argument, 0, 's' },
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
2502 if (session_key == 0) {
2504 "Can't find env LST_SESSION or value is not valid\n");
2509 c = getopt_long(argc, argv, "ailst:",
2510 list_batch_opts, &optidx);
/* Selecting active and/or invalid nodes also turns on verbose output. */
2517 verbose = active = 1;
2520 verbose = invalid = 1;
2523 verbose = active = invalid = 1;
2529 test = atoi(optarg);
2533 lst_print_usage(argv[0]);
2538 if (optind == argc) {
2539 /* list all batches */
2540 rc = lst_list_batch_all();
/* Test ids are 1-based; reject zero or negative ids. */
2544 if (ntest == 1 && test <= 0) {
2545 fprintf(stderr, "Invalid test id, test id starts from 1\n");
/* Exactly one batch name is expected from here on. */
2549 if (optind != argc - 1) {
2550 lst_print_usage(argv[0]);
2554 batch = argv[optind];
2557 /* show detail of specified batch or test */
2558 rc = lst_info_batch_ioctl(batch, test, server,
2559 &ent, NULL, NULL, NULL);
2561 lst_print_error((test > 0) ? "test" : "batch",
2562 (test > 0) ? "Failed to query test: %s\n" :
2563 "Failed to query batch: %s\n",
2569 /* list nodes in test or batch */
/* The node count comes from the server or client summary in 'ent'. */
2570 rc = lst_list_tsb_nodes(batch, test, server,
2571 server ? ent.tbe_srv_nle.nle_nnode :
2572 ent.tbe_cli_nle.nle_nnode,
2577 /* only show number of hosts in batch or test */
2579 fprintf(stdout, "Batch: %s Tests: %d State: %d\n",
2580 batch, ent.u.tbe_batch.bae_ntest,
2581 ent.u.tbe_batch.bae_state);
2582 ntest = ent.u.tbe_batch.bae_ntest;
2583 test = 1; /* starting from test 1 */
2587 "\tTest %d(%s) (loop: %d, concurrency: %d)\n",
2588 test, lst_test_type2name(ent.u.tbe_test.tse_type),
2589 ent.u.tbe_test.tse_loop,
2590 ent.u.tbe_test.tse_concur);
/* Column order: active, busy, down, unknown, total. */
2595 fprintf(stdout, LST_NODES_TITLE);
2596 fprintf(stdout, "client\t%d\t%d\t%d\t%d\t%d\n"
2597 "server\t%d\t%d\t%d\t%d\t%d\n",
2598 ent.tbe_cli_nle.nle_nactive,
2599 ent.tbe_cli_nle.nle_nbusy,
2600 ent.tbe_cli_nle.nle_ndown,
2601 ent.tbe_cli_nle.nle_nunknown,
2602 ent.tbe_cli_nle.nle_nnode,
2603 ent.tbe_srv_nle.nle_nactive,
2604 ent.tbe_srv_nle.nle_nbusy,
2605 ent.tbe_srv_nle.nle_ndown,
2606 ent.tbe_srv_nle.nle_nunknown,
2607 ent.tbe_srv_nle.nle_nnode);
/*
 * Issue the LSTIO_BATCH_QUERY ioctl for a batch or one of its tests.
 *
 * \param batch    NUL-terminated batch name; must not be NULL
 * \param test     stored in lstio_bat_testidx
 * \param server   logically negated into lstio_bat_client, so 0 selects
 *                 the client side
 * \param timeout  stored in lstio_bat_timeout
 * \param head     list head passed to the ioctl as lstio_bat_resultp
 * \return         whatever lst_ioctl() returns
 */
2616 lst_query_batch_ioctl(char *batch, int test, int server,
2617 int timeout, cfs_list_t *head)
2619 lstio_batch_query_args_t args = {0};
2621 args.lstio_bat_key = session_key;
2622 args.lstio_bat_testidx = test;
2623 args.lstio_bat_client = !(server);
2624 args.lstio_bat_timeout = timeout;
2625 args.lstio_bat_nmlen = strlen(batch);
2626 args.lstio_bat_namep = batch;
2627 args.lstio_bat_resultp = head;
2629 return lst_ioctl(LSTIO_BATCH_QUERY, &args, sizeof(args));
/*
 * Print one line per query result entry: peer id, node state, and either
 * the RPC error text or "Running"/"Idle".
 *
 * \param head    list of lstcon_rpc_ent_t linked through rpe_link
 * \param active  non-zero: entries with rpe_priv[0] == 0 match the filter
 * \param idle    non-zero: entries with rpe_priv[0] != 0 match the filter
 * \param error   non-zero: entries with rpe_fwk_errno == 0 match the filter
 */
2633 lst_print_tsb_verbose(cfs_list_t *head,
2634 int active, int idle, int error)
2636 lstcon_rpc_ent_t *ent;
2638 cfs_list_for_each_entry_typed(ent, head, lstcon_rpc_ent_t, rpe_link) {
/* Entries matching any of the three filters are presumably skipped -- confirm. */
2639 if (ent->rpe_priv[0] == 0 && active)
2642 if (ent->rpe_priv[0] != 0 && idle)
2645 if (ent->rpe_fwk_errno == 0 && error)
/* An RPC errno takes precedence; otherwise rpe_priv[0] > 0 means running. */
2648 fprintf(stdout, "%s [%s]: %s\n",
2649 libcfs_id2str(ent->rpe_peer),
2650 lst_node_state2str(ent->rpe_state),
2651 ent->rpe_rpc_errno != 0 ?
2652 strerror(ent->rpe_rpc_errno) :
2653 (ent->rpe_priv[0] > 0 ? "Running" : "Idle"));
/*
 * Handler for the "lst query" command: reports the state of a batch or of
 * one of its tests, up to 'loop' times.
 *
 * Options (see query_batch_opts): --timeout (-o), --delay (-d), --loop (-c)
 * and --test (-t) take a value; --server, --active, --idle, --error and
 * --all are flags. Defaults: timeout 5 s, delay 5 s, loop 1. With no
 * positional argument the batch name is LST_DEFAULT_BATCH.
 *
 * \param argc  number of entries in argv
 * \param argv  command name followed by options and an optional batch name
 */
2658 jt_lst_query_batch(int argc, char **argv)
2660 lstcon_test_batch_ent_t ent;
2667 int timeout = 5; /* default 5 seconds */
2668 int delay = 5; /* default 5 seconds */
2669 int loop = 1; /* default 1 loop */
2679 static struct option query_batch_opts[] =
2681 {"timeout", required_argument, 0, 'o' },
2682 {"delay", required_argument, 0, 'd' },
2683 {"loop", required_argument, 0, 'c' },
2684 {"test", required_argument, 0, 't' },
2685 {"server", no_argument, 0, 's' },
2686 {"active", no_argument, 0, 'a' },
2687 {"idle", no_argument, 0, 'i' },
2688 {"error", no_argument, 0, 'e' },
2689 {"all", no_argument, 0, 'l' },
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
2693 if (session_key == 0) {
2695 "Can't find env LST_SESSION or value is not valid\n");
2700 c = getopt_long(argc, argv, "o:d:c:t:saiel",
2701 query_batch_opts, &optidx);
2703 /* Detect the end of the options. */
2709 timeout = atoi(optarg);
2712 delay = atoi(optarg);
2715 loop = atoi(optarg);
2718 test = atoi(optarg);
/* Filter selections also turn on verbose output. */
2724 active = verbose = 1;
2730 error = verbose = 1;
2736 lst_print_usage(argv[0]);
/* test may be 0; timeout, delay and loop must be strictly positive. */
2741 if (test < 0 || timeout <= 0 || delay <= 0 || loop <= 0) {
2742 lst_print_usage(argv[0]);
/* No name: default batch. One name: use it. */
2746 if (optind == argc) {
2747 batch = LST_DEFAULT_BATCH;
2749 } else if (optind == argc - 1) {
2750 batch = argv[optind];
2753 lst_print_usage(argv[0]);
2758 CFS_INIT_LIST_HEAD(&head);
/* Fetch the batch/test summary to learn how many nodes will be queried. */
2761 rc = lst_info_batch_ioctl(batch, test, server,
2762 &ent, NULL, NULL, NULL);
2764 fprintf(stderr, "Failed to query %s [%d]: %s\n",
2765 batch, test, strerror(errno));
2769 count = server ? ent.tbe_srv_nle.nle_nnode :
2770 ent.tbe_cli_nle.nle_nnode;
2772 fprintf(stdout, "Batch or test is empty\n");
2777 rc = lst_alloc_rpcent(&head, count, 0);
2779 fprintf(stderr, "Out of memory\n");
2783 for (i = 0; i < loop; i++) {
/* Sleep for whatever is left of the delay interval since 'last'. */
2784 time_t now = time(NULL);
2786 if (now - last < delay) {
2787 sleep(delay - now + last);
2793 rc = lst_query_batch_ioctl(batch, test,
2794 server, timeout, &head);
2796 fprintf(stderr, "Failed to query batch: %s\n",
2803 lst_print_tsb_verbose(&head, active, idle, error);
/*
 * Summary line built from the file-level trans_stat counters
 * (presumably refreshed by the ioctl above -- confirm).
 */
2807 fprintf(stdout, "%s [%d] ", batch, test);
2809 if (lstcon_rpc_stat_failure(&trans_stat, 0) != 0) {
2810 fprintf(stdout, "%d of %d nodes are unknown, ",
2811 lstcon_rpc_stat_failure(&trans_stat, 0),
2812 lstcon_rpc_stat_total(&trans_stat, 0));
/* No RPC failures, nothing running, no query failures. */
2815 if (lstcon_rpc_stat_failure(&trans_stat, 0) == 0 &&
2816 lstcon_tsbqry_stat_run(&trans_stat, 0) == 0 &&
2817 lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0) {
2818 fprintf(stdout, "is stopped\n");
/* No RPC failures, nothing idle, no query failures. */
2822 if (lstcon_rpc_stat_failure(&trans_stat, 0) == 0 &&
2823 lstcon_tsbqry_stat_idle(&trans_stat, 0) == 0 &&
2824 lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0) {
2825 fprintf(stdout, "is running\n");
/* The idle count is reported under the label "stopped". */
2829 fprintf(stdout, "stopped: %d , running: %d, failed: %d\n",
2830 lstcon_tsbqry_stat_idle(&trans_stat, 0),
2831 lstcon_tsbqry_stat_run(&trans_stat, 0),
2832 lstcon_tsbqry_stat_failure(&trans_stat, 0));
2835 lst_free_rpcent(&head);
/*
 * Parse a distribution string into \a dist and \a span.
 *
 * The string is split at the first ':' and the text after it is converted
 * with atoi() into *span. The add_test usage text gives the form as "#:#".
 *
 * \param dstr  distribution string
 * \param dist  output; presumably receives the value before ':' -- confirm
 * \param span  output; receives the value after ':'
 */
2841 lst_parse_distribute(char *dstr, int *dist, int *span)
/* dstr is re-pointed at the ':' separator (NULL if there is none). */
2847 dstr = strchr(dstr, ':');
2851 *span = atoi(dstr + 1);
/*
 * Fill \a bulk from the bulk-test arguments in \a argv.
 *
 * Defaults: size 4096, operation LST_BRW_READ, flags LST_BRW_CHECK_NONE.
 * Recognised arguments (matched case-insensitively):
 *   check=|c= full|simple   sets blk_flags
 *   size=|s=  N[k|K|m|M]    sets blk_size, with optional 1024 or
 *                           1024 * 1024 multiplier
 *   read|r, write|w         sets blk_opc
 *
 * \param argc  number of entries in argv
 * \param argv  argument strings
 * \param bulk  structure to fill
 */
2859 lst_get_bulk_param(int argc, char **argv, lst_test_bulk_param_t *bulk)
2866 bulk->blk_size = 4096;
2867 bulk->blk_opc = LST_BRW_READ;
2868 bulk->blk_flags = LST_BRW_CHECK_NONE;
/* strcasestr(...) == argv[i] is a case-insensitive "starts with" test. */
2871 if (strcasestr(argv[i], "check=") == argv[i] ||
2872 strcasestr(argv[i], "c=") == argv[i]) {
2873 tok = strchr(argv[i], '=') + 1;
2875 if (strcasecmp(tok, "full") == 0) {
2876 bulk->blk_flags = LST_BRW_CHECK_FULL;
2877 } else if (strcasecmp(tok, "simple") == 0) {
2878 bulk->blk_flags = LST_BRW_CHECK_SIMPLE;
/* NOTE(review): "Unknow" in the message below looks like a typo for "Unknown". */
2880 fprintf(stderr, "Unknow flag %s\n", tok);
2884 } else if (strcasestr(argv[i], "size=") == argv[i] ||
2885 strcasestr(argv[i], "s=") == argv[i]) {
2886 tok = strchr(argv[i], '=') + 1;
/* Base 0 lets strtol accept decimal, octal (0...) and hex (0x...). */
2888 bulk->blk_size = strtol(tok, &end, 0);
2889 if (bulk->blk_size <= 0) {
2890 fprintf(stderr, "Invalid size %s\n", tok);
/* 'end' points at the first unparsed character: the optional unit suffix. */
2897 if (*end == 'k' || *end == 'K')
2898 bulk->blk_size *= 1024;
2899 else if (*end == 'm' || *end == 'M')
2900 bulk->blk_size *= 1024 * 1024;
/* Upper bound on the scaled size. */
2902 if (bulk->blk_size > CFS_PAGE_SIZE * LNET_MAX_IOV) {
2903 fprintf(stderr, "Size exceed limitation: %d bytes\n",
2908 } else if (strcasecmp(argv[i], "read") == 0 ||
2909 strcasecmp(argv[i], "r") == 0) {
2910 bulk->blk_opc = LST_BRW_READ;
2912 } else if (strcasecmp(argv[i], "write") == 0 ||
2913 strcasecmp(argv[i], "w") == 0) {
2914 bulk->blk_opc = LST_BRW_WRITE;
/* NOTE(review): "Unknow" in the message below looks like a typo for "Unknown". */
2917 fprintf(stderr, "Unknow parameter: %s\n", argv[i]);
/*
 * Translate a test name into its type and build the matching parameter
 * block.
 *
 * The name is mapped with lst_test_name2type. On the path that needs bulk
 * parameters, a lst_test_bulk_param_t is allocated, zeroed and filled by
 * lst_get_bulk_param, and *plen is set to its size.
 *
 * \param test   test name
 * \param argc   number of entries in argv
 * \param argv   test-specific arguments
 * \param param  output; presumably receives the allocated block -- confirm
 * \param plen   output; receives the size of the parameter block
 */
2928 lst_get_test_param(char *test, int argc, char **argv, void **param, int *plen)
2930 lst_test_bulk_param_t *bulk = NULL;
2933 type = lst_test_name2type(test);
/* NOTE(review): "Unknow" in the message below looks like a typo for "Unknown". */
2935 fprintf(stderr, "Unknow test name %s\n", test);
2944 bulk = malloc(sizeof(*bulk));
2946 fprintf(stderr, "Out of memory\n");
2950 memset(bulk, 0, sizeof(*bulk));
2952 if (lst_get_bulk_param(argc, argv, bulk) != 0) {
2958 *plen = sizeof(*bulk);
2966 /* TODO: parse more parameter */
/*
 * Issue the LSTIO_TEST_ADD ioctl to add a test to a batch.
 *
 * Every argument is copied into the matching lstio_tes_* field; the three
 * names are passed as pointer plus strlen() length, and lstio_tes_oneside
 * is always 0.
 *
 * \param batch    batch name; must not be NULL
 * \param type     test type
 * \param loop     loop count
 * \param concur   concurrency
 * \param dist     distribution value
 * \param span     span value
 * \param sgrp     source group name; must not be NULL
 * \param dgrp     destination group name; must not be NULL
 * \param param    test parameter block
 * \param plen     length of \a param
 * \param retp     passed as lstio_tes_retp
 * \param resultp  list head passed as lstio_tes_resultp
 * \return         whatever lst_ioctl() returns
 */
2971 lst_add_test_ioctl(char *batch, int type, int loop, int concur,
2972 int dist, int span, char *sgrp, char *dgrp,
2973 void *param, int plen, int *retp, cfs_list_t *resultp)
2975 lstio_test_args_t args = {0};
2977 args.lstio_tes_key = session_key;
2978 args.lstio_tes_bat_nmlen = strlen(batch);
2979 args.lstio_tes_bat_name = batch;
2980 args.lstio_tes_type = type;
2981 args.lstio_tes_oneside = 0;
2982 args.lstio_tes_loop = loop;
2983 args.lstio_tes_concur = concur;
2984 args.lstio_tes_dist = dist;
2985 args.lstio_tes_span = span;
2986 args.lstio_tes_sgrp_nmlen = strlen(sgrp);
2987 args.lstio_tes_sgrp_name = sgrp;
2988 args.lstio_tes_dgrp_nmlen = strlen(dgrp);
2989 args.lstio_tes_dgrp_name = dgrp;
2990 args.lstio_tes_param_len = plen;
2991 args.lstio_tes_param = param;
2992 args.lstio_tes_retp = retp;
2993 args.lstio_tes_resultp = resultp;
2995 return lst_ioctl(LSTIO_TEST_ADD, &args, sizeof(args));
/*
 * Handler for the "lst add_test" command: adds a test to a batch.
 *
 * Options (see add_test_opts), all taking a value: --batch, --concurrency,
 * --distribute, --from, --to, --loop. A test name plus both the 'from' and
 * 'to' groups are mandatory. The result list is sized to the larger of the
 * two groups' node counts.
 *
 * \param argc  number of entries in argv
 * \param argv  command name, options, test name and test arguments
 */
2999 jt_lst_add_test(int argc, char **argv)
3021 static struct option add_test_opts[] =
3023 {"batch", required_argument, 0, 'b' },
3024 {"concurrency", required_argument, 0, 'c' },
3025 {"distribute", required_argument, 0, 'd' },
3026 {"from", required_argument, 0, 'f' },
3027 {"to", required_argument, 0, 't' },
3028 {"loop", required_argument, 0, 'l' },
/* A session key of 0 is reported as a missing or invalid LST_SESSION. */
3032 if (session_key == 0) {
3034 "Can't find env LST_SESSION or value is not valid\n");
3039 c = getopt_long(argc, argv, "b:c:d:f:l:t:",
3040 add_test_opts, &optidx);
3042 /* Detect the end of the options. */
3051 concur = atoi(optarg);
3060 loop = atoi(optarg);
3066 lst_print_usage(argv[0]);
/* A test name and both groups are required. */
3071 if (optind == argc || from == NULL || to == NULL) {
3072 lst_print_usage(argv[0]);
/* Concurrency must lie in 1..LST_MAX_CONCUR. */
3076 if (concur <= 0 || concur > LST_MAX_CONCUR) {
3077 fprintf(stderr, "Invalid concurrency of test: %d\n", concur);
3082 batch = LST_DEFAULT_BATCH;
3085 rc = lst_parse_distribute(dstr, &dist, &span);
3087 fprintf(stderr, "Invalid distribution: %s\n", dstr);
/* The first positional argument is the test name. */
3092 test = argv[optind++];
/*
 * NOTE(review): the fourth argument below reads as a mis-encoded
 * "&param" (HTML-entity damage). Restore it before building.
 */
3097 type = lst_get_test_param(test, argc, argv, ¶m, &plen);
3099 fprintf(stderr, "Failed to add test (%s)\n", test);
3103 CFS_INIT_LIST_HEAD(&head);
3105 rc = lst_get_node_count(LST_OPC_GROUP, from, &fcount, NULL);
3107 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
3108 from, strerror(errno));
3112 rc = lst_get_node_count(LST_OPC_GROUP, to, &tcount, NULL);
3114 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
3115 to, strerror(errno));
/* One result entry per node of the larger group. */
3119 rc = lst_alloc_rpcent(&head, fcount > tcount ? fcount : tcount, 0);
3121 fprintf(stderr, "Out of memory\n");
3125 rc = lst_add_test_ioctl(batch, type, loop, concur,
3126 dist, span, from, to, param, plen, &ret, &head);
3129 fprintf(stdout, "Test was added successfully\n");
3131 fprintf(stdout, "Server group contains userland test "
3132 "nodes, old version of tcplnd can't accept "
3133 "connection request\n");
3140 lst_print_error("test", "Failed to add test: %s\n",
3145 lst_print_transerr(&head, "add test");
3147 lst_free_rpcent(&head);
/*
 * Command table for the "lst" utility, handed to Parser_init() and
 * Parser_execarg(). Each entry holds the command name, its handler, a
 * third field (NULL or 0 here) and the usage text.
 */
3155 static command_t lst_cmdlist[] = {
3156 {"new_session", jt_lst_new_session, NULL,
3157 "Usage: lst new_session [--timeout TIME] [--force] [NAME]" },
3158 {"end_session", jt_lst_end_session, NULL,
3159 "Usage: lst end_session" },
3160 {"show_session", jt_lst_show_session, NULL,
3161 "Usage: lst show_session" },
3162 {"ping", jt_lst_ping , NULL,
3163 "Usage: lst ping [--group NAME] [--batch NAME] [--session] [--nodes IDS]" },
/*
 * NOTE(review): the usage text below says "lst group" although the command
 * is registered as "add_group" -- likely should read "lst add_group".
 */
3164 {"add_group", jt_lst_add_group, NULL,
3165 "Usage: lst group NAME IDs [IDs]..." },
3166 {"del_group", jt_lst_del_group, NULL,
3167 "Usage: lst del_group NAME" },
3168 {"update_group", jt_lst_update_group, NULL,
3169 "Usage: lst update_group NAME [--clean] [--refresh] [--remove IDs]" },
3170 {"list_group", jt_lst_list_group, NULL,
3171 "Usage: lst list_group [--active] [--busy] [--down] [--unknown] GROUP ..." },
/* NOTE(review): jt_lst_stat also declares --lnet and --rpc, not listed here. */
3172 {"stat", jt_lst_stat, NULL,
3173 "Usage: lst stat [--bw] [--rate] [--read] [--write] [--max] [--min] [--avg] "
3174 " [--timeout #] [--delay #] [--count #] GROUP [GROUP]" },
3175 {"show_error", jt_lst_show_error, NULL,
3176 "Usage: lst show_error NAME | IDS ..." },
3177 {"add_batch", jt_lst_add_batch, NULL,
3178 "Usage: lst add_batch NAME" },
3179 {"run", jt_lst_start_batch, NULL,
3180 "Usage: lst run [--timeout TIME] [NAME]" },
/*
 * NOTE(review): jt_lst_stop_batch falls back to LST_DEFAULT_BATCH when no
 * name is given, so BATCH_NAME is optional in practice.
 */
3181 {"stop", jt_lst_stop_batch, NULL,
3182 "Usage: lst stop [--force] BATCH_NAME" },
/*
 * NOTE(review): jt_lst_list_batch lists all batches when NAME is omitted
 * and also declares --active, --invalid and --all.
 */
3183 {"list_batch", jt_lst_list_batch, NULL,
3184 "Usage: lst list_batch NAME [--test ID] [--server]" },
/*
 * NOTE(review): jt_lst_query_batch also declares --delay, --loop, --active,
 * --idle, --error and --all, and defaults NAME to LST_DEFAULT_BATCH.
 */
3185 {"query", jt_lst_query_batch, NULL,
3186 "Usage: lst query [--test ID] [--server] [--timeout TIME] NAME" },
/* NOTE(review): jt_lst_add_test rejects a missing --from or --to, so both are mandatory. */
3187 {"add_test", jt_lst_add_test, NULL,
3188 "Usage: lst add_test [--batch BATCH] [--loop #] [--concurrency #] "
3189 " [--distribute #:#] [--from GROUP] [--to GROUP] TEST..." },
3190 {"help", Parser_help, 0, "help" },
/*
 * Load the session key from the environment.
 *
 * Reads the LST_SESSION environment variable and stores its atoi()
 * conversion in the file-level session_key. The command handlers treat a
 * key of 0 as "not set or not valid".
 */
3195 lst_initialize(void)
3199 key = getenv("LST_SESSION");
/* atoi() yields 0 for non-numeric text, which the handlers reject. */
3206 session_key = atoi(key);
/*
 * Program entry point for the "lst" utility.
 *
 * Initialises libcfs, the session key (lst_initialize) and the portals
 * layer (ptl_initialize), registers lst_cmdlist with the parser under the
 * prompt "lst > ", executes the command given on the command line, and
 * calls libcfs_arch_cleanup().
 *
 * \param argc  number of entries in argv
 * \param argv  program name followed by an lst command and its arguments
 */
3212 main(int argc, char **argv)
3218 rc = libcfs_arch_init();
3222 rc = lst_initialize();
3226 rc = ptl_initialize(argc, argv);
3230 Parser_init("lst > ", lst_cmdlist);
/* Skip argv[0] so the parser sees the lst command as its first word. */
3233 rc = Parser_execarg(argc - 1, argv + 1, lst_cmdlist);
3240 libcfs_arch_cleanup();