4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.gnu.org/licenses/gpl-2.0.html
23 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2012, 2017, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
31 * lnet/selftest/conctl.c
33 * Author: Liang Zhen <liangzhen@clusterfs.com>
44 #include <sys/ioctl.h>
46 #include <linux/types.h>
48 #include <libcfs/util/list.h>
49 #include <libcfs/util/ioctl.h>
50 #include <libcfs/util/parser.h>
51 #include <linux/lnet/lnetctl.h>
52 #include <linux/lnet/lnetst.h>
53 #include <linux/lnet/nidstr.h>
54 #include "lnetconfig/liblnetconfig.h"
/*
 * Prototypes for ioctl helpers.  lst_get_node_count() calls
 * lst_info_batch_ioctl() and lst_info_group_ioctl() ahead of the
 * definition of lst_info_group_ioctl() further down in this file.
 */
56 static int lst_info_batch_ioctl(char *batch, int test, int server,
57 struct lstcon_test_batch_ent *entp, int *idxp,
58 int *ndentp, struct lstcon_node_ent *dentsp);
59 static int lst_info_group_ioctl(char *name, struct lstcon_ndlist_ent *gent,
60 int *idx, int *count, struct lstcon_node_ent *dents);
61 static int lst_query_batch_ioctl(char *batch, int test, int server,
62 int timeout, struct list_head *head);
/* Session id used to (re)initialise ids before the kernel fills them in. */
64 struct lst_sid LST_INVALID_SID = { .ses_nid = LNET_NID_ANY, .ses_stamp = -1 };
/*
 * Key copied into every session-scoped ioctl argument block.  The jt_*
 * commands treat a value of zero as "LST_SESSION not set or not valid".
 */
65 static unsigned int session_key;
67 /* All nodes running 2.6.50 or later understand feature LST_FEAT_BULK_LEN */
68 static unsigned int session_features = LST_FEATS_MASK;
/*
 * Transaction statistics buffer: lst_ioctl() zeroes it and hands it to the
 * kernel as the second ioctl buffer on every call, then inspects
 * trs_rpc_errno / trs_fwk_errno.
 */
69 static struct lstcon_trans_stat trans_stat;
/*
 * Node of a singly linked list of strings, chained through lstr_next.
 * The helpers below also use the members lstr_sz and lstr_str.
 */
71 typedef struct list_string {
72 struct list_string *lstr_next;
/* Byte offset of member 'memb' within type 'typ', taken from a null base. */
78 # define offsetof(typ,memb) ((unsigned long)((char *)&(((typ *)0)->memb)))
/*
 * Allocation bookkeeping for lstr nodes; free_lstr() subtracts a node's
 * lstr_sz from alloc_nob.
 */
81 static int alloc_count = 0;
82 static int alloc_nob = 0;
/*
 * alloc_lstr: allocate one list node able to hold an sz-byte string.
 * The request size is the offset of lstr_str[sz], i.e. everything that
 * precedes the string storage plus sz bytes for the string itself.
 */
87 lstr_t *lstr = malloc(offsetof(lstr_t, lstr_str[sz]));
90 fprintf(stderr, "Can't allocate lstr\n");
/* a fresh node holds the empty string */
97 lstr->lstr_str[0] = 0;
/*
 * free_lstr: counterpart of alloc_lstr(); the node's recorded size
 * (lstr_sz) is subtracted from the alloc_nob byte counter.
 */
103 free_lstr(lstr_t *lstr)
106 alloc_nob -= lstr->lstr_sz;
/*
 * new_lstrs: create list nodes whose string is <prefix><number><postfix>
 * and link them ahead of the current head of *list.
 *
 * list:    head pointer of the list being built
 * prefix:  text placed before the number
 * postfix: text placed after the number
 * lo, hi, stride: numeric range arguments; 'lo' is the value formatted
 *          with %u (NOTE(review): stepping from lo to hi by stride is
 *          assumed from the parameter names -- confirm)
 */
111 new_lstrs(lstr_t **list, char *prefix, char *postfix,
112 int lo, int hi, int stride)
114 int n1 = strlen(prefix);
115 int n2 = strlen(postfix);
/* prefix + 20 characters reserved for the number + postfix + NUL */
116 int sz = n1 + 20 + n2 + 1;
119 lstr_t *n = alloc_lstr(sz);
121 snprintf(n->lstr_str, sz - 1, "%s%u%s",
122 prefix, lo, postfix);
/* the new node points at the previous head */
124 n->lstr_next = *list;
/*
 * expand_lstr: expand the first bracket expression in l->lstr_str.
 *
 * When the string has no '[', the node is linked onto *list unchanged.
 * Otherwise the matching ']' is located (a missing ']' or an empty "[]"
 * is rejected), the bracket contents are walked item by item at each ','
 * and every item is tried against three forms in turn:
 *   "N"       single number
 *   "N-M"     range
 *   "N-M/S"   range with stride
 * A form only counts when sscanf consumed exactly 'nob' characters (%n).
 * Each accepted item is passed to new_lstrs() with l->lstr_str and b2 as
 * the prefix and postfix arguments.
 */
132 expand_lstr(lstr_t **list, lstr_t *l)
134 int nob = strlen(l->lstr_str);
144 b1 = strchr(l->lstr_str, '[');
146 l->lstr_next = *list;
151 b2 = strchr(b1, ']');
152 if (b2 == NULL || b2 == b1 + 1)
160 sep = strchr(expr, ',');
166 if (sscanf(expr, "%u%n", &x, &n) >= 1 && n == nob) {
168 new_lstrs(list, l->lstr_str, b2, x, x, 1);
173 if (sscanf(expr, "%u-%u%n", &x, &y, &n) >= 2 && n == nob &&
176 new_lstrs(list, l->lstr_str, b2, x, y, 1);
181 if (sscanf(expr, "%u-%u/%u%n", &x, &y, &z, &n) >= 3 && n == nob &&
184 new_lstrs(list, l->lstr_str, b2, x, y, z);
190 } while ((expr = sep) != NULL);
/*
 * expand_strs: expand all bracket expressions of 'str' into a list.
 *
 * A work list is seeded with a private copy of str.  Each pass feeds every
 * entry through expand_lstr(), collecting the output on a second list that
 * is then moved back onto the work list.  Passes repeat while the last one
 * expanded something and rc is still positive.  A failure is reported as a
 * syntax error against the original string.
 *
 * str:  expression to expand
 * head: receives the resulting list
 */
198 expand_strs(char *str, lstr_t **head)
/* copy includes the terminating NUL */
206 l = alloc_lstr(strlen(str) + 1);
207 memcpy(l->lstr_str, str, strlen(str) + 1);
215 while ((l = list) != NULL) {
218 rc = expand_lstr(&nlist, l);
220 fprintf(stderr, "Syntax error in \"%s\"\n", str);
228 /* re-order onto 'list' */
229 while ((l = nlist) != NULL) {
230 nlist = l->lstr_next;
235 } while (expanded && rc > 0);
242 while ((l = list) != NULL) {
/*
 * lst_parse_nids: turn a NID expression into an array of process ids.
 *
 * str:    NID expression, expanded with expand_strs()
 * countp: output count (callers pass the address of their node counter)
 * idspp:  receives a malloc'ed array of struct lnet_process_id
 *
 * Every expanded string is converted with libcfs_str2nid(); a result of
 * LNET_NID_ANY is reported as an invalid nid.  The pid of each entry is
 * set to LNET_PID_LUSTRE.
 */
251 lst_parse_nids(char *str, int *countp, struct lnet_process_id **idspp)
259 rc = expand_strs(str, &head);
269 *idspp = malloc(c * sizeof(struct lnet_process_id));
270 if (*idspp == NULL) {
271 fprintf(stderr, "Out of memory\n");
278 while ((l = head) != NULL) {
282 (*idspp)[i].nid = libcfs_str2nid(l->lstr_str);
283 if ((*idspp)[i].nid == LNET_NID_ANY) {
284 fprintf(stderr, "Invalid nid: %s\n",
289 (*idspp)[i].pid = LNET_PID_LUSTRE;
/*
 * lst_node_state2str: map an LST_NODE_* state value to a display string.
 * ACTIVE, BUSY and DOWN are each tested for an exact match.
 * lst_yaml_groups() compares the returned string against "Unknown".
 */
306 lst_node_state2str(int state)
308 if (state == LST_NODE_ACTIVE)
310 if (state == LST_NODE_BUSY)
312 if (state == LST_NODE_DOWN)
/*
 * lst_node_str2state: map a state name to its LST_NODE_* value.
 * Matching ignores case.  "invalid" is shorthand for every state except
 * active, i.e. UNKNOWN | DOWN | BUSY.  jt_lst_update_group() rejects a
 * result that is <= 0.
 */
319 lst_node_str2state(char *str)
321 if (strcasecmp(str, "active") == 0)
322 return LST_NODE_ACTIVE;
323 if (strcasecmp(str, "busy") == 0)
324 return LST_NODE_BUSY;
325 if (strcasecmp(str, "down") == 0)
326 return LST_NODE_DOWN;
327 if (strcasecmp(str, "unknown") == 0)
328 return LST_NODE_UNKNOWN;
329 if (strcasecmp(str, "invalid") == 0)
330 return (LST_NODE_UNKNOWN | LST_NODE_DOWN | LST_NODE_BUSY);
/*
 * lst_test_type2name: map an LST_TEST_* type to its name.  The ping and
 * bulk test types are recognised.
 */
336 lst_test_type2name(int type)
338 if (type == LST_TEST_PING)
340 if (type == LST_TEST_BULK)
/*
 * lst_test_name2type: map a test name to its LST_TEST_* type, ignoring
 * case: "ping" selects LST_TEST_PING and "brw" selects LST_TEST_BULK.
 */
347 lst_test_name2type(char *name)
349 if (strcasecmp(name, "ping") == 0)
350 return LST_TEST_PING;
351 if (strcasecmp(name, "brw") == 0)
352 return LST_TEST_BULK;
/*
 * lst_print_usage: show the help text of one command by running the
 * parser on the synthetic command line "help <cmd>".
 */
358 lst_print_usage(char *cmd)
360 char *argv[] = { "help", cmd };
362 cfs_parser(2, argv, NULL);
/*
 * lst_print_error: report a failed request on stderr.
 *
 * sub:        name of the object kind involved (callers pass "session",
 *             "group", "debug"); used by the "Can't find ..." and
 *             "... already exists" messages
 * def_format: printf-style format used when none of the fixed messages
 *             applies; its arguments follow as varargs
 */
366 lst_print_error(char *sub, const char *def_format, ...)
370 /* local error returned from kernel */
373 fprintf(stderr, "No session exists\n");
376 fprintf(stderr, "Session is shutting down\n");
379 fprintf(stderr, "Unmatched session key or not root\n");
382 fprintf(stderr, "Can't find %s in current session\n", sub);
385 fprintf(stderr, "Invalid parameters list in command line\n");
388 fprintf(stderr, "Bad parameter address\n");
391 fprintf(stderr, "%s already exists\n", sub);
/* fallback: caller supplied message */
394 va_start(ap, def_format);
395 vfprintf(stderr, def_format, ap);
/*
 * lst_free_rpcent: empty a list of struct lstcon_rpc_ent.  Entries are
 * taken from the front and unlinked one at a time until the list is empty.
 */
403 lst_free_rpcent(struct list_head *head)
405 struct lstcon_rpc_ent *ent;
407 while (!list_empty(head)) {
408 ent = list_first_entry(head, struct lstcon_rpc_ent, rpe_link);
410 list_del(&ent->rpe_link);
/*
 * lst_reset_rpcent: return every entry of a result list to its initial
 * state: invalid session id, wildcard peer nid/pid and both error codes
 * cleared.  The entries stay on the list.
 */
416 lst_reset_rpcent(struct list_head *head)
418 struct lstcon_rpc_ent *ent;
420 list_for_each_entry(ent, head, rpe_link) {
421 ent->rpe_sid = LST_INVALID_SID;
422 ent->rpe_peer.nid = LNET_NID_ANY;
423 ent->rpe_peer.pid = LNET_PID_ANY;
424 ent->rpe_rpc_errno = ent->rpe_fwk_errno = 0;
/*
 * lst_alloc_rpcent: add 'count' zeroed result entries to 'head'.
 *
 * head:   list that receives the entries
 * count:  number of entries to allocate
 * offset: number of rpe_payload bytes to reserve in each entry
 *
 * If an allocation fails, everything already on 'head' is released.
 */
429 lst_alloc_rpcent(struct list_head *head, int count, int offset)
431 struct lstcon_rpc_ent *ent;
434 for (i = 0; i < count; i++) {
/* entry size = fixed part + 'offset' bytes of payload */
435 ent = malloc(offsetof(struct lstcon_rpc_ent, rpe_payload[offset]));
437 lst_free_rpcent(head);
441 memset(ent, 0, offsetof(struct lstcon_rpc_ent, rpe_payload[offset]));
443 ent->rpe_sid = LST_INVALID_SID;
444 ent->rpe_peer.nid = LNET_NID_ANY;
445 ent->rpe_peer.pid = LNET_PID_ANY;
446 list_add(&ent->rpe_link, head);
/*
 * lst_print_transerr: print the per-node failures recorded in a result
 * list.  Entries with neither an RPC error nor a framework error are
 * passed over; the others are reported with the peer id and strerror().
 *
 * head:   list of struct lstcon_rpc_ent filled in by the kernel
 * optstr: name of the operation, used in the messages
 */
453 lst_print_transerr(struct list_head *head, char *optstr)
455 struct lstcon_rpc_ent *ent;
457 list_for_each_entry(ent, head, rpe_link) {
458 if (ent->rpe_rpc_errno == 0 && ent->rpe_fwk_errno == 0)
461 if (ent->rpe_rpc_errno != 0) {
462 fprintf(stderr, "%s RPC failed on %s: %s\n",
463 optstr, libcfs_id2str(ent->rpe_peer),
464 strerror(ent->rpe_rpc_errno));
468 fprintf(stderr, "operation %s failed on %s: %s\n",
469 optstr, libcfs_id2str(ent->rpe_peer),
470 strerror(ent->rpe_fwk_errno));
/*
 * lst_ioctl: issue one selftest ioctl (IOC_LIBCFS_LNETST).
 *
 * opc: selftest opcode, carried in ioc_u32[0]
 * buf: opcode-specific argument block (first ioctl buffer)
 * len: size of buf in bytes
 *
 * The global trans_stat is attached as the second buffer and cleared
 * before the call, so after return it describes this request only.  Its
 * RPC and framework error fields are checked after the local result.
 */
475 lst_ioctl(unsigned int opc, void *buf, int len)
477 struct libcfs_ioctl_data data;
480 LIBCFS_IOC_INIT (data);
481 data.ioc_u32[0] = opc;
482 data.ioc_plen1 = len;
483 data.ioc_pbuf1 = (char *)buf;
484 data.ioc_plen2 = sizeof(trans_stat);
485 data.ioc_pbuf2 = (char *)&trans_stat;
487 memset(&trans_stat, 0, sizeof(trans_stat));
489 rc = l_ioctl(LNET_DEV_ID, IOC_LIBCFS_LNETST, &data);
491 /* local error, no valid RPC result */
496 if (trans_stat.trs_rpc_errno != 0)
499 /* Framework error */
500 if (trans_stat.trs_fwk_errno != 0)
/*
 * lst_yaml_session: create, show or end a session over Netlink, with the
 * request emitted and the reply parsed as YAML.
 *
 * label:   session name, emitted as the value of the "name" key
 * timeout: timeout as a string, emitted as the value of the "timeout" key
 * nlflags: Netlink flags.  Zero means the session is being destroyed and
 *          the reply is not parsed; with NLM_F_CREATE session_features is
 *          refreshed from the reply's protocol version; with NLM_F_DUMP a
 *          one-line session summary is printed
 * errmsg:  text handed to yaml_parser_log_error() when the parser failed
 *
 * The request has the shape "sessions: { name: ..., timeout: ... }".
 * From the reply the session name, key, stamp, nid and node count are
 * collected until the stream-end event.  The closing return statement
 * yields -1 when rc is 0 and 0 otherwise.
 */
506 static int lst_yaml_session(const char *label, const char *timeout, int nlflags,
509 struct lstcon_ndlist_ent ndinfo = { };
510 struct lst_sid sid = LST_INVALID_SID;
511 /* nlflags being zero means we are destroying the session.
512 * No parsing of reply needed.
514 bool done = nlflags ? false : true;
515 char nid[LNET_NIDSTR_SIZE];
516 char name[LST_NAME_SIZE];
517 unsigned int key = 0;
518 yaml_emitter_t request;
524 sk = nl_socket_alloc();
528 /* Note: NL_AUTO_PID == zero which we use by default for the
529 * session_key when creating a new session. This is considered
530 * an invalid key so we need to get the real session key from
531 * the yaml parser yet to be created. If the user did request
532 * a specific session key then set the socket's port id to this
536 nl_socket_set_local_port(sk, session_key);
538 /* Setup reply parser to receive Netlink packets */
539 rc = yaml_parser_initialize(&reply);
545 rc = yaml_parser_set_input_netlink(&reply, sk, false);
549 /* Create Netlink emitter to send request to kernel */
550 yaml_emitter_initialize(&request);
551 rc = yaml_emitter_set_output_netlink(&request, sk,
552 LNET_SELFTEST_GENL_NAME,
553 LNET_SELFTEST_GENL_VERSION,
554 LNET_SELFTEST_CMD_SESSIONS,
559 yaml_emitter_open(&request);
560 yaml_document_start_event_initialize(&event, NULL, NULL, NULL, 0);
561 rc = yaml_emitter_emit(&request, &event);
565 yaml_mapping_start_event_initialize(&event, NULL,
566 (yaml_char_t *)YAML_MAP_TAG,
567 1, YAML_BLOCK_MAPPING_STYLE);
568 rc = yaml_emitter_emit(&request, &event);
572 yaml_scalar_event_initialize(&event, NULL,
573 (yaml_char_t *)YAML_STR_TAG,
574 (yaml_char_t *)"sessions",
575 strlen("sessions"), 1, 0,
576 YAML_PLAIN_SCALAR_STYLE);
577 rc = yaml_emitter_emit(&request, &event);
582 yaml_scalar_event_initialize(&event, NULL,
583 (yaml_char_t *)YAML_STR_TAG,
586 YAML_PLAIN_SCALAR_STYLE);
587 rc = yaml_emitter_emit(&request, &event);
593 /* sessions: { name: 'name', timeout: 300 }
599 yaml_mapping_start_event_initialize(&event, NULL,
600 (yaml_char_t *)YAML_MAP_TAG,
601 1, YAML_FLOW_MAPPING_STYLE);
602 rc = yaml_emitter_emit(&request, &event);
606 yaml_scalar_event_initialize(&event, NULL,
607 (yaml_char_t *)YAML_STR_TAG,
608 (yaml_char_t *)"name",
609 strlen("name"), 1, 0,
610 YAML_PLAIN_SCALAR_STYLE);
611 rc = yaml_emitter_emit(&request, &event);
615 yaml_scalar_event_initialize(&event, NULL,
616 (yaml_char_t *)YAML_STR_TAG,
617 (yaml_char_t *)label,
619 YAML_PLAIN_SCALAR_STYLE);
620 rc = yaml_emitter_emit(&request, &event);
625 yaml_scalar_event_initialize(&event, NULL,
626 (yaml_char_t *)YAML_STR_TAG,
627 (yaml_char_t *)"timeout",
628 strlen("timeout"), 1, 0,
629 YAML_PLAIN_SCALAR_STYLE);
630 rc = yaml_emitter_emit(&request, &event);
634 yaml_scalar_event_initialize(&event, NULL,
635 (yaml_char_t *)YAML_STR_TAG,
636 (yaml_char_t *)timeout,
637 strlen(timeout), 1, 0,
638 YAML_PLAIN_SCALAR_STYLE);
639 rc = yaml_emitter_emit(&request, &event);
644 yaml_mapping_end_event_initialize(&event);
645 rc = yaml_emitter_emit(&request, &event);
650 yaml_mapping_end_event_initialize(&event);
651 rc = yaml_emitter_emit(&request, &event);
655 yaml_document_end_event_initialize(&event, 0);
656 rc = yaml_emitter_emit(&request, &event);
660 rc = yaml_emitter_close(&request);
663 yaml_emitter_log_error(&request, stderr);
664 yaml_emitter_delete(&request);
668 yaml_emitter_delete(&request);
671 rc = yaml_parser_parse(&reply, &event);
675 if (event.type == YAML_SCALAR_EVENT) {
676 char *tmp, *endp = NULL;
678 if (strcmp((char *)event.data.scalar.value,
680 yaml_event_delete(&event);
681 rc = yaml_parser_parse(&reply, &event);
685 strncpy(name, (char *)event.data.scalar.value,
689 if (strcmp((char *)event.data.scalar.value,
691 yaml_event_delete(&event);
692 rc = yaml_parser_parse(&reply, &event);
696 tmp = (char *)event.data.scalar.value;
697 key = strtoul(tmp, &endp, 10);
702 if (strcmp((char *)event.data.scalar.value,
704 yaml_event_delete(&event);
705 rc = yaml_parser_parse(&reply, &event);
709 tmp = (char *)event.data.scalar.value;
710 sid.ses_stamp = strtoll(tmp, &endp, 10);
715 if (strcmp((char *)event.data.scalar.value,
717 yaml_event_delete(&event);
718 rc = yaml_parser_parse(&reply, &event);
722 strncpy(nid, (char *)event.data.scalar.value,
726 if (strcmp((char *)event.data.scalar.value,
728 yaml_event_delete(&event);
729 rc = yaml_parser_parse(&reply, &event);
733 tmp = (char *)event.data.scalar.value;
734 ndinfo.nle_nnode = strtoul(tmp, &endp, 10);
740 done = (event.type == YAML_STREAM_END_EVENT);
742 yaml_event_delete(&event);
745 if (nlflags & NLM_F_CREATE) {
746 session_features = yaml_parser_get_reader_proto_version(&reply);
750 if (rc == 0 && errmsg)
751 yaml_parser_log_error(&reply, stderr, errmsg);
752 yaml_parser_delete(&reply);
755 if (((nlflags & NLM_F_DUMP) == NLM_F_DUMP) && rc != 0) {
757 "%s ID: %ju@%s, KEY: %u FEATURES: %x NODES: %d\n",
758 name, (uintmax_t)sid.ses_stamp, nid,
759 key, session_features, ndinfo.nle_nnode);
762 return rc == 0 ? -1 : 0;
/*
 * lst_new_session_ioctl: create a session through LSTIO_SESSION_NEW.
 *
 * name:    session name; its strlen() is sent alongside the pointer
 * timeout: session timeout value
 * force:   force flag, forwarded unchanged
 * sid:     buffer handed to the kernel as the session id pointer
 *
 * The global session_key and session_features are sent as well.
 */
766 lst_new_session_ioctl(char *name, int timeout, int force, struct lst_sid *sid)
768 struct lstio_session_new_args args = { 0 };
770 args.lstio_ses_key = session_key;
771 args.lstio_ses_timeout = timeout;
772 args.lstio_ses_force = force;
773 args.lstio_ses_idp = sid;
774 args.lstio_ses_feats = session_features;
775 args.lstio_ses_nmlen = strlen(name);
776 args.lstio_ses_namep = name;
778 return lst_ioctl (LSTIO_SESSION_NEW, &args, sizeof(args));
/*
 * jt_lst_new_session: "new session" command.
 *
 * Options: --timeout/-t <value>, --force/-f.  An optional trailing
 * argument names the session (shorter than LST_NAME_SIZE); without it the
 * name defaults to "<user>@<host>", where <user> is the passwd name or the
 * numeric uid and <host> falls back to "unknown_host".
 *
 * The Netlink/YAML path (lst_yaml_session) is tried first; the ioctl path
 * (lst_new_session_ioctl) is also present and needs a non-zero
 * session_key.
 */
782 jt_lst_new_session(int argc, char **argv)
/* large enough for user + '@' + host, each below LST_NAME_SIZE */
784 char buf[LST_NAME_SIZE * 2 + 1];
785 char *name, *timeout_s = NULL;
786 int nlflags = NLM_F_CREATE;
787 struct lst_sid session_id;
794 static const struct option session_opts[] = {
795 { .name = "timeout", .has_arg = required_argument, .val = 't' },
796 { .name = "force", .has_arg = no_argument, .val = 'f' },
800 c = getopt_long(argc, argv, "ft:",
801 session_opts, &optidx);
807 nlflags |= NLM_F_REPLACE;
814 lst_print_usage(argv[0]);
820 timeout = atoi(timeout_s);
822 fprintf(stderr, "Invalid timeout value\n");
/* exactly one positional argument: the session name */
827 if (optind == argc - 1) {
828 name = argv[optind ++];
829 if (strlen(name) >= LST_NAME_SIZE) {
830 fprintf(stderr, "Name size is limited to %d\n",
/* no positional argument: derive a default name */
834 } else if (optind == argc) {
835 char user[LST_NAME_SIZE];
836 char host[LST_NAME_SIZE];
837 struct passwd *pw = getpwuid(getuid());
840 snprintf(user, sizeof(user), "%d", (int)getuid());
842 snprintf(user, sizeof(user), "%s", pw->pw_name);
844 rc = gethostname(host, sizeof(host));
846 snprintf(host, sizeof(host), "unknown_host");
848 snprintf(buf, sizeof(buf), "%s@%s", user, host);
851 lst_print_usage(argv[0]);
855 rc = lst_yaml_session(name, timeout_s, nlflags, "new session");
859 if (session_key == 0) {
861 "Can't find env LST_SESSION or value is not valid\n");
865 rc = lst_new_session_ioctl(name, timeout, force, &session_id);
867 lst_print_error("session", "Failed to create session: %s\n",
872 fprintf(stdout, "SESSION: %s FEATURES: %x TIMEOUT: %d FORCE: %s\n",
873 name, session_features, timeout, force ? "Yes" : "No");
/*
 * lst_session_info_ioctl: query the current session (LSTIO_SESSION_INFO).
 *
 * name:   buffer for the session name
 * len:    size of the name buffer
 * key:    receives the session key
 * featp:  receives the session feature bits
 * sid:    receives the session id
 * ndinfo: receives the node list summary
 */
878 lst_session_info_ioctl(char *name, int len, int *key, unsigned *featp,
879 struct lst_sid *sid, struct lstcon_ndlist_ent *ndinfo)
881 struct lstio_session_info_args args = { 0 };
883 args.lstio_ses_idp = sid;
884 args.lstio_ses_keyp = key;
885 args.lstio_ses_featp = featp;
886 args.lstio_ses_ndinfo = ndinfo;
887 args.lstio_ses_nmlen = len;
888 args.lstio_ses_namep = name;
890 return lst_ioctl(LSTIO_SESSION_INFO, &args, sizeof(args));
/*
 * jt_lst_show_session: "show session" command.  Asks for the session over
 * Netlink with NLM_F_DUMP; the ioctl query is also present, and its result
 * is printed as name, id (stamp@nid), key, features and node count.
 */
894 jt_lst_show_session(int argc, char **argv)
896 struct lstcon_ndlist_ent ndinfo;
898 char name[LST_NAME_SIZE];
903 rc = lst_yaml_session(NULL, NULL, NLM_F_DUMP, "show session");
907 rc = lst_session_info_ioctl(name, sizeof(name), &key,
908 &feats, &sid, &ndinfo);
911 lst_print_error("session", "Failed to show session: %s\n",
916 fprintf(stdout, "%s ID: %ju@%s, KEY: %d FEATURES: %x NODES: %d\n",
917 name, (uintmax_t)sid.ses_stamp, libcfs_nid2str(sid.ses_nid),
918 key, feats, ndinfo.nle_nnode);
/*
 * lst_end_session_ioctl: end the session identified by the global
 * session_key (LSTIO_SESSION_END).
 */
924 lst_end_session_ioctl(void)
926 struct lstio_session_end_args args = { 0 };
928 args.lstio_ses_key = session_key;
929 return lst_ioctl(LSTIO_SESSION_END, &args, sizeof(args));
/*
 * jt_lst_end_session: "end session" command.  Requires a non-zero
 * session_key.  The Netlink request is sent with nlflags == 0 (destroy);
 * the ioctl variant is also present.  When trans_stat carries RPC or
 * framework errors, the number of failures and strerror() text are
 * reported.
 */
933 jt_lst_end_session(int argc, char **argv)
937 if (session_key == 0) {
939 "Can't find env LST_SESSION or value is not valid\n");
943 rc = lst_yaml_session(NULL, NULL, 0, "end session");
947 rc = lst_end_session_ioctl();
950 fprintf(stdout, "session is ended\n");
955 lst_print_error("session", "Failed to end session: %s\n",
960 if (trans_stat.trs_rpc_errno != 0) {
962 "[RPC] Failed to send %d session RPCs: %s\n",
963 lstcon_rpc_stat_failure(&trans_stat, 0),
964 strerror(trans_stat.trs_rpc_errno));
967 if (trans_stat.trs_fwk_errno != 0) {
969 "[FWK] Failed to end session on %d nodes: %s\n",
970 lstcon_sesop_stat_failure(&trans_stat, 0),
971 strerror(trans_stat.trs_fwk_errno));
/* Column header for the per-group table of node counts by state. */
977 #define LST_NODES_TITLE "\tACTIVE\tBUSY\tDOWN\tUNKNOWN\tTOTAL\n"
/*
 * lst_yaml_display_groups: walk the YAML reply to a "groups" request and
 * print it.
 *
 * reply:  parser already attached to the Netlink socket
 * group:  group name argument from the caller
 * states: node state mask argument from the caller
 * print:  output control flag from the caller
 *
 * The function contains three parse loops, each running until the
 * stream-end event:
 *   1. node listing: "Group [ name ]", one "\t<nid>: <status>" line per
 *      node, "No nodes found [ ... ]" when no sequence follows the group
 *      name, and "Total %d nodes [ %s ]" at the end of a sequence;
 *   2. state summary: per group, nodes are counted by the state parsed
 *      with lst_node_str2state() and one row of counts is printed when
 *      the group's sequence ends;
 *   3. name listing: every non-empty scalar other than "groups" is printed
 *      as "<n>) <name>", followed by "Total %d groups".
 */
979 static int lst_yaml_display_groups(yaml_parser_t *reply, char *group,
980 int states, bool print)
/* zero-filled, so the bounded strncpy below always leaves a terminator */
986 char name[LST_NAME_SIZE] = {};
991 fprintf(stdout, LST_NODES_TITLE);
994 rc = yaml_parser_parse(reply, &event);
998 if (event.type == YAML_MAPPING_START_EVENT) {
1002 rc = yaml_parser_parse(reply, &next);
1006 if (next.type != YAML_SCALAR_EVENT) {
1007 yaml_event_delete(&next);
1011 value = (char *)next.data.scalar.value;
1012 if (strcmp(value, "groups") == 0) {
1013 yaml_event_delete(&next);
1014 } else if (strcmp(value, "nid") == 0) {
1018 rc = yaml_parser_parse(reply, &next);
1022 fprintf(stdout, "\t%s: ",
1023 (char *)next.data.scalar.value);
1025 rc = yaml_parser_parse(reply, &next);
1029 tmp = (char *)next.data.scalar.value;
1030 if (strcmp(tmp, "status") == 0) {
1033 rc = yaml_parser_parse(reply, &state);
1037 fprintf(stdout, "%s\n",
1038 (char *)state.data.scalar.value);
1044 rc = yaml_parser_parse(reply, &next);
1048 strncpy(name, value, sizeof(name) - 1);
1049 fprintf(stdout, "Group [ %s ]\n", name);
1052 if (next.type != YAML_SEQUENCE_START_EVENT) {
1054 "No nodes found [ %s ]\n",
1058 } else if (event.type == YAML_SEQUENCE_END_EVENT &&
1060 fprintf(stdout, "Total %d nodes [ %s ]\n",
1065 done = (event.type == YAML_STREAM_END_EVENT);
1066 yaml_event_delete(&event);
1069 int active = 0, busy = 0, down = 0, unknown = 0;
/*
 * This local buffer (it shadows the 'group' parameter) must start out
 * zero-filled: strlen(group) below can run on a sequence-end event before
 * any name has been copied in, and strncpy() with sizeof(group) - 1 never
 * writes the final byte, so the terminator has to come from here.
 */
1070 char group[LST_NAME_SIZE] = {};
1074 rc = yaml_parser_parse(reply, &event);
1078 if (event.type == YAML_SCALAR_EVENT) {
1079 char *value = (char *)event.data.scalar.value;
1082 value = (char *)event.data.scalar.value;
1083 if (strcmp(value, "groups") == 0) {
1084 yaml_event_delete(&event);
1088 rc = yaml_parser_parse(reply, &next);
1092 if (next.type == YAML_SCALAR_EVENT) {
1095 status = lst_node_str2state((char *)next.data.scalar.value);
1097 case LST_NODE_ACTIVE:
1106 case LST_NODE_UNKNOWN:
1111 } else if (next.type == YAML_SEQUENCE_START_EVENT) {
/* a scalar followed by a sequence is a group name */
1112 strncpy(group, value, sizeof(group) - 1);
1118 yaml_event_delete(&next);
1119 } else if (event.type == YAML_SEQUENCE_END_EVENT) {
1120 if (strlen(group)) {
1121 fprintf(stdout, "\t%d\t%d\t%d\t%d\t%d\t%s\n",
1122 active, busy, down, unknown,
1123 active + busy + down + unknown, group);
/* forget the name so the next sequence end prints nothing by itself */
1125 memset(group, 0, sizeof(group));
1127 done = (event.type == YAML_STREAM_END_EVENT);
1128 yaml_event_delete(&event);
1135 rc = yaml_parser_parse(reply, &event);
1139 if (event.type == YAML_SCALAR_EVENT) {
1142 value = (char *)event.data.scalar.value;
1143 if (strlen(value) &&
1144 strcmp(value, "groups") != 0) {
1146 fprintf(stdout, "%d) %s\n",
1151 done = (event.type == YAML_STREAM_END_EVENT);
1153 yaml_event_delete(&event);
1156 fprintf(stdout, "Total %d groups\n", i - 1);
/*
 * NOTE(review): same macro, same replacement text as the definition
 * earlier in this file.  An identical redefinition is accepted by the
 * preprocessor, so this line is redundant rather than harmful.
 */
1164 #define LST_NODES_TITLE "\tACTIVE\tBUSY\tDOWN\tUNKNOWN\tTOTAL\n"
/*
 * lst_yaml_groups: send a "groups" request over Netlink as YAML and, for
 * NLM_F_DUMP, display the reply with lst_yaml_display_groups().
 *
 * nlflags: Netlink flags for the request
 * name:    group name, emitted as a scalar inside the "groups" sequence
 * states:  node state mask; one "status: <state>" mapping is emitted for
 *          each state produced by lst_node_state2str() for the tested bits
 * print:   forwarded to lst_yaml_display_groups()
 *
 * The last visible assignment converts rc == 1 to 0 and anything else to
 * -EINVAL.
 */
1166 static int lst_yaml_groups(int nlflags, char *name, int states, bool print)
1168 yaml_emitter_t request;
1169 yaml_parser_t reply;
1174 sk = nl_socket_alloc();
1178 /* Setup reply parser to receive Netlink packets */
1179 rc = yaml_parser_initialize(&reply);
1185 rc = yaml_parser_set_input_netlink(&reply, sk, false);
1189 /* Create Netlink emitter to send request to kernel */
1190 yaml_emitter_initialize(&request);
1191 rc = yaml_emitter_set_output_netlink(&request, sk,
1192 LNET_SELFTEST_GENL_NAME,
1193 LNET_SELFTEST_GENL_VERSION,
1194 LNET_SELFTEST_CMD_GROUPS,
1199 yaml_emitter_open(&request);
1200 yaml_document_start_event_initialize(&event, NULL, NULL, NULL, 0);
1201 rc = yaml_emitter_emit(&request, &event);
1205 yaml_mapping_start_event_initialize(&event, NULL,
1206 (yaml_char_t *)YAML_MAP_TAG,
1207 1, YAML_BLOCK_MAPPING_STYLE);
1208 rc = yaml_emitter_emit(&request, &event);
1212 yaml_scalar_event_initialize(&event, NULL,
1213 (yaml_char_t *)YAML_STR_TAG,
1214 (yaml_char_t *)"groups",
1215 strlen("groups"), 1, 0,
1216 YAML_PLAIN_SCALAR_STYLE);
1217 rc = yaml_emitter_emit(&request, &event);
1222 yaml_sequence_start_event_initialize(&event, NULL,
1223 (yaml_char_t *)YAML_SEQ_TAG,
1224 1, YAML_BLOCK_SEQUENCE_STYLE);
1225 rc = yaml_emitter_emit(&request, &event);
1229 yaml_mapping_start_event_initialize(&event, NULL,
1230 (yaml_char_t *)YAML_MAP_TAG,
1231 1, YAML_BLOCK_MAPPING_STYLE);
1232 rc = yaml_emitter_emit(&request, &event);
1236 yaml_scalar_event_initialize(&event, NULL,
1237 (yaml_char_t *)YAML_STR_TAG,
1238 (yaml_char_t *)name,
1240 YAML_PLAIN_SCALAR_STYLE);
1241 rc = yaml_emitter_emit(&request, &event);
/* number of state bits to test, derived from the LST_NODE_UNKNOWN bit */
1246 int max = ffs(LST_NODE_UNKNOWN) + 1, i;
1249 yaml_sequence_start_event_initialize(&event, NULL,
1250 (yaml_char_t *)YAML_SEQ_TAG,
1251 1, YAML_BLOCK_SEQUENCE_STYLE);
1252 rc = yaml_emitter_emit(&request, &event);
1257 for (i = 0; i < max; i++) {
1258 int mask = states & (1 << i);
1260 state = lst_node_state2str(mask);
/* "Unknown" for a mask other than LST_NODE_UNKNOWN is not a real state */
1261 if (mask != LST_NODE_UNKNOWN && strcmp(state, "Unknown") == 0)
1264 yaml_mapping_start_event_initialize(&event, NULL,
1265 (yaml_char_t *)YAML_MAP_TAG,
1266 1, YAML_BLOCK_MAPPING_STYLE);
1267 rc = yaml_emitter_emit(&request, &event);
1271 yaml_scalar_event_initialize(&event, NULL,
1272 (yaml_char_t *)YAML_STR_TAG,
1273 (yaml_char_t *)"status",
1274 strlen("status"), 1, 0,
1275 YAML_PLAIN_SCALAR_STYLE);
1276 rc = yaml_emitter_emit(&request, &event);
1280 yaml_scalar_event_initialize(&event, NULL,
1281 (yaml_char_t *)YAML_STR_TAG,
1282 (yaml_char_t *)state,
1283 strlen(state), 1, 0,
1284 YAML_PLAIN_SCALAR_STYLE);
1285 rc = yaml_emitter_emit(&request, &event);
1289 yaml_mapping_end_event_initialize(&event);
1290 rc = yaml_emitter_emit(&request, &event);
1295 yaml_sequence_end_event_initialize(&event);
1296 rc = yaml_emitter_emit(&request, &event);
1300 yaml_scalar_event_initialize(&event, NULL,
1301 (yaml_char_t *)YAML_STR_TAG,
1304 YAML_PLAIN_SCALAR_STYLE);
1305 rc = yaml_emitter_emit(&request, &event);
1310 yaml_mapping_end_event_initialize(&event);
1311 rc = yaml_emitter_emit(&request, &event);
1315 yaml_sequence_end_event_initialize(&event);
1316 rc = yaml_emitter_emit(&request, &event);
1320 yaml_scalar_event_initialize(&event, NULL,
1321 (yaml_char_t *)YAML_STR_TAG,
1324 YAML_PLAIN_SCALAR_STYLE);
1325 rc = yaml_emitter_emit(&request, &event);
1329 yaml_mapping_end_event_initialize(&event);
1330 rc = yaml_emitter_emit(&request, &event);
1334 yaml_document_end_event_initialize(&event, 0);
1335 rc = yaml_emitter_emit(&request, &event);
1339 rc = yaml_emitter_close(&request);
1342 yaml_emitter_log_error(&request, stderr);
1343 yaml_emitter_delete(&request);
1347 yaml_emitter_delete(&request);
1349 /* display output */
1350 if (nlflags == NLM_F_DUMP)
1351 rc = lst_yaml_display_groups(&reply, name, states, print);
1354 yaml_parser_log_error(&reply, stderr, NULL);
1355 yaml_parser_delete(&reply);
1359 rc = rc == 1 ? 0 : -EINVAL;
/*
 * lst_ping_ioctl: issue LSTIO_DEBUG for a target.
 *
 * str:     target name, or NULL (sent with a name length of 0)
 * type:    LST_OPC_* target type
 * timeout: timeout value
 * count:   number of entries in ids
 * ids:     process ids to contact
 * head:    result list passed to the kernel
 */
1365 lst_ping_ioctl(char *str, int type, int timeout,
1366 int count, struct lnet_process_id *ids, struct list_head *head)
1368 struct lstio_debug_args args = { 0 };
1370 args.lstio_dbg_key = session_key;
1371 args.lstio_dbg_type = type;
1372 args.lstio_dbg_flags = 0;
1373 args.lstio_dbg_timeout = timeout;
1374 args.lstio_dbg_nmlen = (str == NULL) ? 0: strlen(str);
1375 args.lstio_dbg_namep = str;
1376 args.lstio_dbg_count = count;
1377 args.lstio_dbg_idsp = ids;
1378 args.lstio_dbg_resultp = head;
1380 return lst_ioctl (LSTIO_DEBUG, &args, sizeof(args));
/*
 * lst_get_node_count: find out how many nodes a target contains.
 *
 * type:   LST_OPC_* target type (session, batch server/client side, group
 *         or explicit node list)
 * str:    batch name, group name or NID expression, depending on type
 * countp: receives the node count
 * idspp:  receives the id array produced by lst_parse_nids() for an
 *         explicit node list
 *
 * 'entp' selects which node list summary the count is read from: the
 * client side by default, the server side for LST_OPC_BATCHSRV.
 */
1384 lst_get_node_count(int type, char *str, int *countp,
1385 struct lnet_process_id **idspp)
1387 char buf[LST_NAME_SIZE];
1388 struct lstcon_test_batch_ent ent;
1389 struct lstcon_ndlist_ent *entp = &ent.tbe_cli_nle;
1396 case LST_OPC_SESSION:
1397 rc = lst_session_info_ioctl(buf, LST_NAME_SIZE,
1398 &key, &feats, &sid, entp);
1401 case LST_OPC_BATCHSRV:
/* switch to the server side summary; the batch query follows */
1402 entp = &ent.tbe_srv_nle;
1403 case LST_OPC_BATCHCLI:
1404 rc = lst_info_batch_ioctl(str, 0, 0, &ent, NULL, NULL, NULL);
/* NOTE(review): the group name 'str' is not passed to the YAML request -- confirm intent */
1408 rc = lst_yaml_groups(NLM_F_DUMP, NULL, 0, false);
/* Netlink interface not available: use the ioctl instead */
1409 if (rc == -EOPNOTSUPP) {
1410 rc = lst_info_group_ioctl(str, entp, NULL, NULL, NULL);
1411 } else if (rc > 0) {
1412 entp->nle_nnode = rc;
1418 rc = lst_parse_nids(str, &entp->nle_nnode, idspp) < 0 ? -1 : 0;
1427 *countp = entp->nle_nnode;
/*
 * jt_lst_ping: "ping" command.
 *
 * Target options: --session/-s, --group/-g <name>, --batch/-b <name>
 * (with --server/-v selecting the batch's server side) and
 * --nodes/-n <ids>; --timeout/-t <value> sets the timeout.  A target and
 * a positive timeout are required and no positional arguments are
 * accepted.
 *
 * One result entry with LST_NAME_SIZE payload bytes is allocated per node.
 * After the ioctl, each entry is printed as peer, node state, session name
 * (taken from the payload when the node is active or busy and the RPC
 * succeeded) and session nid.
 */
1433 jt_lst_ping(int argc, char **argv)
1435 struct list_head head;
1436 struct lnet_process_id *ids = NULL;
1437 struct lstcon_rpc_ent *ent = NULL;
1447 static const struct option ping_opts[] = {
1448 { .name = "session", .has_arg = no_argument, .val = 's' },
1449 { .name = "server", .has_arg = no_argument, .val = 'v' },
1450 { .name = "batch", .has_arg = required_argument, .val = 'b' },
1451 { .name = "group", .has_arg = required_argument, .val = 'g' },
1452 { .name = "nodes", .has_arg = required_argument, .val = 'n' },
1453 { .name = "timeout", .has_arg = required_argument, .val = 't' },
1454 { .name = NULL, } };
1456 if (session_key == 0) {
1458 "Can't find env LST_SESSION or value is not valid\n");
1464 c = getopt_long(argc, argv, "g:b:n:t:sv",
1465 ping_opts, &optidx);
1472 type = LST_OPC_SESSION;
1476 type = LST_OPC_GROUP;
1481 type = LST_OPC_BATCHCLI;
1486 type = LST_OPC_NODES;
1491 timeout = atoi(optarg);
1499 lst_print_usage(argv[0]);
1504 if (type == 0 || timeout <= 0 || optind != argc) {
1505 lst_print_usage(argv[0]);
/* --server turns a batch target into its server side */
1509 if (type == LST_OPC_BATCHCLI && server)
1510 type = LST_OPC_BATCHSRV;
1512 rc = lst_get_node_count(type, str, &count, &ids);
1514 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
1515 (str == NULL) ? "session" : str, strerror(errno));
1519 INIT_LIST_HEAD(&head);
1521 rc = lst_alloc_rpcent(&head, count, LST_NAME_SIZE);
1523 fprintf(stderr, "Out of memory\n");
1528 fprintf(stdout, "Target %s is empty\n",
1529 (str == NULL) ? "session" : str);
1533 rc = lst_ping_ioctl(str, type, timeout, count, ids, &head);
1534 if (rc == -1) { /* local failure */
1535 lst_print_error("debug", "Failed to ping %s: %s\n",
1536 (str == NULL) ? "session" : str,
1542 /* ignore RPC errors and framework errors */
1543 list_for_each_entry(ent, &head, rpe_link) {
1544 fprintf(stdout, "\t%s: %s [session: %s id: %s]\n",
1545 libcfs_id2str(ent->rpe_peer),
1546 lst_node_state2str(ent->rpe_state),
1547 (ent->rpe_state == LST_NODE_ACTIVE ||
1548 ent->rpe_state == LST_NODE_BUSY) ?
1549 (ent->rpe_rpc_errno == 0 ?
1550 &ent->rpe_payload[0] : "Unknown") :
1551 "<NULL>", libcfs_nid2str(ent->rpe_sid.ses_nid));
1555 lst_free_rpcent(&head);
/*
 * lst_add_nodes_ioctl: add nodes to a group (LSTIO_NODES_ADD).
 *
 * name:    group name
 * count:   number of entries in ids
 * ids:     process ids of the nodes to add
 * featp:   feature bits pointer handed to the kernel
 * resultp: result list passed to the kernel
 */
1565 lst_add_nodes_ioctl(char *name, int count, struct lnet_process_id *ids,
1566 unsigned *featp, struct list_head *resultp)
1568 struct lstio_group_nodes_args args = { 0 };
1570 args.lstio_grp_key = session_key;
1571 args.lstio_grp_nmlen = strlen(name);
1572 args.lstio_grp_namep = name;
1573 args.lstio_grp_count = count;
1574 args.lstio_grp_featp = featp;
1575 args.lstio_grp_idsp = ids;
1576 args.lstio_grp_resultp = resultp;
1578 return lst_ioctl(LSTIO_NODES_ADD, &args, sizeof(args));
/* lst_del_group_ioctl: delete the named group (LSTIO_GROUP_DEL). */
1582 lst_del_group_ioctl(char *name)
1584 struct lstio_group_del_args args = { 0 };
1586 args.lstio_grp_key = session_key;
1587 args.lstio_grp_nmlen = strlen(name);
1588 args.lstio_grp_namep = name;
1590 return lst_ioctl(LSTIO_GROUP_DEL, &args, sizeof(args));
/*
 * lst_del_group: delete a group and report the outcome.  Prints "Group is
 * deleted" on success, a local error through lst_print_error(), or
 * "deleted with some errors" followed by the RPC / framework failure
 * counts taken from trans_stat.
 */
1594 lst_del_group(char *grp_name)
1598 rc = lst_del_group_ioctl(grp_name);
1600 fprintf(stdout, "Group is deleted\n");
1605 lst_print_error("group", "Failed to delete group: %s\n",
1610 fprintf(stderr, "Group is deleted with some errors\n");
1612 if (trans_stat.trs_rpc_errno != 0) {
1614 "[RPC] Failed to send %d end session RPCs: %s\n",
1615 lstcon_rpc_stat_failure(&trans_stat, 0),
1616 strerror(trans_stat.trs_rpc_errno));
1619 if (trans_stat.trs_fwk_errno != 0) {
1621 "[FWK] Failed to end session on %d nodes: %s\n",
1622 lstcon_sesop_stat_failure(&trans_stat, 0),
1623 strerror(trans_stat.trs_fwk_errno));
/* lst_add_group_ioctl: create an empty group with the given name (LSTIO_GROUP_ADD). */
1630 lst_add_group_ioctl(char *name)
1632 struct lstio_group_add_args args = { 0 };
1634 args.lstio_grp_key = session_key;
1635 args.lstio_grp_nmlen = strlen(name);
1636 args.lstio_grp_namep = name;
1638 return lst_ioctl(LSTIO_GROUP_ADD, &args, sizeof(args));
/*
 * jt_lst_add_group: "add group" command: <name> followed by one or more
 * id lists.
 *
 * The group is created first.  Each remaining argument is parsed with
 * lst_parse_nids(); an invalid list is reported and ignored.  For a valid
 * list, result entries are allocated and the nodes are added.  When the
 * kernel reports fewer features than session_features, a compatibility
 * warning names the missing bits.  If no node could be added, the group
 * is deleted again.
 */
1642 jt_lst_add_group(int argc, char **argv)
1644 struct list_head head;
1645 struct lnet_process_id *ids;
1647 unsigned feats = session_features;
1651 bool nodes_added = false;
1653 if (session_key == 0) {
1655 "Can't find env LST_SESSION or value is not valid\n");
1660 lst_print_usage(argv[0]);
1665 if (strlen(name) >= LST_NAME_SIZE) {
1666 fprintf(stderr, "Name length is limited to %d\n",
1671 rc = lst_add_group_ioctl(name);
1673 lst_print_error("group", "Failed to add group %s: %s\n",
1674 name, strerror(errno));
1678 INIT_LIST_HEAD(&head);
1680 for (i = 2; i < argc; i++) {
1681 /* parse address list */
1682 rc = lst_parse_nids(argv[i], &count, &ids);
1684 fprintf(stderr, "Ignore invalid id list %s\n",
1692 rc = lst_alloc_rpcent(&head, count, 0);
1694 fprintf(stderr, "Out of memory\n");
1700 rc = lst_add_nodes_ioctl(name, count, ids, &feats, &head);
1707 fprintf(stdout, "%s are added to session\n", argv[i]);
1711 if ((feats & session_features) != session_features) {
1713 "Warning, this session will run with "
1714 "compatible mode because some test nodes "
1715 "might not understand these features: %x\n",
1716 (~feats & session_features));
1719 lst_free_rpcent(&head);
1724 * The selftest kernel module expects that a group should
1725 * have at least one node, since it doesn't make sense for
1726 * an empty group to be added to a test.
1729 "No nodes added successfully, deleting group %s\n",
1731 rc = lst_del_group(name);
1734 "Failed to delete group %s."
1735 " Group is empty.\n", name);
1743 lst_print_error("group", "Failed to add nodes %s: %s\n",
1744 argv[i], strerror(errno));
1747 if (trans_stat.trs_fwk_errno == EPROTO) {
1749 "test nodes might have different LST "
1750 "features, please disable some features by "
1751 "setting LST_FEATURES\n");
1754 lst_print_transerr(&head, "create session");
1757 lst_free_rpcent(&head);
1761 "No nodes added successfully, deleting group %s\n",
1763 if (lst_del_group(name) != 0) {
1765 "Failed to delete group %s."
1766 " Group is empty.\n", name);
/*
 * jt_lst_del_group: "del group" command; needs a non-zero session_key and
 * deletes the group named by argv[1].
 */
1774 jt_lst_del_group(int argc, char **argv)
1778 if (session_key == 0) {
1780 "Can't find env LST_SESSION or value is not valid\n");
1785 lst_print_usage(argv[0]);
1789 rc = lst_del_group(argv[1]);
/*
 * lst_update_group_ioctl: update a group (LSTIO_GROUP_UPDATE).
 *
 * opc:     LST_GROUP_* operation (refresh, remove nodes, clean)
 * name:    group name
 * clean:   state mask argument, sent as lstio_grp_args
 * count:   number of entries in ids
 * ids:     process ids the operation applies to
 * resultp: result list passed to the kernel
 */
1795 lst_update_group_ioctl(int opc, char *name, int clean, int count,
1796 struct lnet_process_id *ids, struct list_head *resultp)
1798 struct lstio_group_update_args args = { 0 };
1800 args.lstio_grp_key = session_key;
1801 args.lstio_grp_opc = opc;
1802 args.lstio_grp_args = clean;
1803 args.lstio_grp_nmlen = strlen(name);
1804 args.lstio_grp_namep = name;
1805 args.lstio_grp_count = count;
1806 args.lstio_grp_idsp = ids;
1807 args.lstio_grp_resultp = resultp;
1809 return lst_ioctl(LSTIO_GROUP_UPDATE, &args, sizeof(args));
/*
 * jt_lst_update_group: "update group" command.
 *
 * Exactly one operation is chosen with --refresh/-f, --remove/-r <ids> or
 * --clean/-c <state>, followed by the group name as the only positional
 * argument.  The state given to --clean is converted with
 * lst_node_str2state() and must be positive.
 *
 * For remove and refresh the node count is looked up first and one result
 * entry is allocated per node.  Per-node failures of the update are
 * printed with lst_print_transerr().
 */
1813 jt_lst_update_group(int argc, char **argv)
1815 struct list_head head;
1816 struct lnet_process_id *ids = NULL;
1826 static const struct option update_group_opts[] = {
1827 { .name = "refresh", .has_arg = no_argument, .val = 'f' },
1828 { .name = "clean", .has_arg = required_argument, .val = 'c' },
1829 { .name = "remove", .has_arg = required_argument, .val = 'r' },
1832 if (session_key == 0) {
1834 "Can't find env LST_SESSION or value is not valid\n");
1839 c = getopt_long(argc, argv, "fc:r:",
1840 update_group_opts, &optidx);
1842 /* Detect the end of the options. */
1849 lst_print_usage(argv[0]);
1852 opc = LST_GROUP_REFRESH;
1857 lst_print_usage(argv[0]);
1860 opc = LST_GROUP_RMND;
1865 clean = lst_node_str2state(optarg);
/* a second operation or an unrecognised state name is a usage error */
1866 if (opc != 0 || clean <= 0) {
1867 lst_print_usage(argv[0]);
1870 opc = LST_GROUP_CLEAN;
1874 lst_print_usage(argv[0]);
1879 /* no OPC or group is specified */
1880 if (opc == 0 || optind != argc - 1) {
1881 lst_print_usage(argv[0]);
1887 INIT_LIST_HEAD(&head);
1889 if (opc == LST_GROUP_RMND || opc == LST_GROUP_REFRESH) {
/* remove counts the given id list; refresh counts the group itself */
1890 rc = lst_get_node_count(opc == LST_GROUP_RMND ? LST_OPC_NODES :
1892 opc == LST_GROUP_RMND ? str : grp,
1896 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
1897 opc == LST_GROUP_RMND ? str : grp,
1902 rc = lst_alloc_rpcent(&head, count, 0);
1904 fprintf(stderr, "Out of memory\n");
1911 rc = lst_update_group_ioctl(opc, grp, clean, count, ids, &head);
1917 lst_free_rpcent(&head);
1922 lst_free_rpcent(&head);
1923 lst_print_error("group", "Failed to update group: %s\n",
1928 lst_print_transerr(&head, "Updating group");
1930 lst_free_rpcent(&head);
/*
 * Ask for the name of the group at position idx through
 * lst_ioctl(LSTIO_GROUP_LIST).
 *
 * len  - sent as lstio_grp_nmlen; lst_list_group_all() passes the size of
 *        its name buffer (LST_NAME_SIZE)
 * name - buffer sent as lstio_grp_namep
 * idx  - zero-based group index (the caller iterates from 0)
 *
 * Returns the value returned by lst_ioctl().
 */
1936 lst_list_group_ioctl(int len, char *name, int idx)
1938 struct lstio_group_list_args args = { 0 };
1940 args.lstio_grp_key = session_key;
1941 args.lstio_grp_idx = idx;
1942 args.lstio_grp_nmlen = len;
1943 args.lstio_grp_namep = name;
1945 return lst_ioctl(LSTIO_GROUP_LIST, &args, sizeof(args));
/*
 * Query information about the group called name through
 * lst_ioctl(LSTIO_GROUP_INFO).
 *
 * name  - group name; strlen(name) is sent as lstio_grp_nmlen
 * gent  - summary entry, sent as lstio_grp_entp
 * idx   - sent as lstio_grp_idxp; may be NULL (jt_lst_list_group() passes
 *         NULL when it only wants the summary)
 * count - sent as lstio_grp_ndentp; may be NULL in the same case
 * dents - node entry array, sent as lstio_grp_dentsp; may be NULL in the
 *         same case
 *
 * Returns the value returned by lst_ioctl().
 */
1949 lst_info_group_ioctl(char *name, struct lstcon_ndlist_ent *gent,
1950 int *idx, int *count, struct lstcon_node_ent *dents)
1952 struct lstio_group_info_args args = { 0 };
1954 args.lstio_grp_key = session_key;
1955 args.lstio_grp_nmlen = strlen(name);
1956 args.lstio_grp_namep = name;
1957 args.lstio_grp_entp = gent;
1958 args.lstio_grp_idxp = idx;
1959 args.lstio_grp_ndentp = count;
1960 args.lstio_grp_dentsp = dents;
1962 return lst_ioctl(LSTIO_GROUP_INFO, &args, sizeof(args));
/*
 * Print the names of all groups, one numbered line per group, followed by
 * a total line.  Groups are fetched one index at a time with
 * lst_list_group_ioctl(); errno == ENOENT is tested after a failed call
 * (presumably the normal end-of-list condition -- TODO confirm), any other
 * failure is reported through lst_print_error().
 */
1966 lst_list_group_all(void)
1968 char name[LST_NAME_SIZE];
1972 /* no group is specified, list name of all groups */
1973 for (i = 0; ; i++) {
1974 rc = lst_list_group_ioctl(LST_NAME_SIZE, name, i);
/* displayed numbering is 1-based, the ioctl index is 0-based */
1976 fprintf(stdout, "%d) %s\n", i + 1, name);
1980 if (errno == ENOENT)
1983 lst_print_error("group", "Failed to list group: %s\n",
1988 fprintf(stdout, "Total %d groups\n", i);
/*
 * Command handler for listing groups and their nodes.
 *
 * Options (list_group_opts, short string "abdul"): -a/--active, -b/--busy,
 * -d/--down, -u/--unknown and -l/--all.  They accumulate the node-state
 * bits LST_NODE_ACTIVE, LST_NODE_BUSY, LST_NODE_DOWN and LST_NODE_UNKNOWN
 * in states and switch on verbose (per-node) output.
 *
 * lst_yaml_groups() is called first, once for all groups when no group
 * name is given or once per named group; a return of -EOPNOTSUPP is tested
 * after each call (presumably to fall back to the ioctl path below --
 * TODO confirm).
 *
 * ioctl path: without group arguments lst_list_group_all() prints every
 * group name.  Otherwise each named group is queried with
 * lst_info_group_ioctl(); either a summary row of node counts is printed,
 * or the nodes whose state matches the selected filters are listed.
 */
1994 jt_lst_list_group(int argc, char **argv)
1996 struct lstcon_ndlist_ent gent;
1997 struct lstcon_node_ent *dents;
2012 static const struct option list_group_opts[] = {
2013 { .name = "active", .has_arg = no_argument, .val = 'a' },
2014 { .name = "busy", .has_arg = no_argument, .val = 'b' },
2015 { .name = "down", .has_arg = no_argument, .val = 'd' },
2016 { .name = "unknown", .has_arg = no_argument, .val = 'u' },
2017 { .name = "all", .has_arg = no_argument, .val = 'l' },
2018 { .name = NULL, } };
2020 if (session_key == 0) {
2022 "Can't find env LST_SESSION or value is not valid\n");
2027 c = getopt_long(argc, argv, "abdul",
2028 list_group_opts, &optidx);
2035 verbose = active = 1;
2036 states |= LST_NODE_ACTIVE;
2041 states |= LST_NODE_BUSY;
2046 states |= LST_NODE_DOWN;
2050 verbose = unknown = 1;
2051 states |= LST_NODE_UNKNOWN;
2055 states |= LST_NODE_ACTIVE | LST_NODE_BUSY |
2056 LST_NODE_DOWN | LST_NODE_UNKNOWN;
2060 lst_print_usage(argv[0]);
/* no group name given: one YAML dump with a NULL name and no state mask */
2065 if (optind == argc) {
2066 rc = lst_yaml_groups(NLM_F_DUMP, NULL, 0, true);
2068 if (rc == -EOPNOTSUPP)
/* one YAML dump per named group; the last argument is true only for the first */
2073 for (i = optind; i < argc; i++) {
2074 rc = lst_yaml_groups(NLM_F_DUMP, argv[i], states,
2075 i == optind ? true : false);
2077 if (rc == -EOPNOTSUPP)
2085 if (optind == argc) {
2086 /* no group is specified, list name of all groups */
2087 rc = lst_list_group_all();
2093 fprintf(stdout, LST_NODES_TITLE);
2095 /* list nodes in specified groups */
2096 for (i = optind; i < argc; i++) {
/* first query: NULL idx/count/dents, only the summary in gent is requested */
2097 rc = lst_info_group_ioctl(argv[i], &gent, NULL, NULL, NULL);
2099 if (errno == ENOENT) {
2104 lst_print_error("group", "Failed to list group: %s\n",
/* summary row: active, busy, down, unknown, total node count, group name */
2110 fprintf(stdout, "\t%d\t%d\t%d\t%d\t%d\t%s\n",
2111 gent.nle_nactive, gent.nle_nbusy,
2112 gent.nle_ndown, gent.nle_nunknown,
2113 gent.nle_nnode, argv[i]);
2117 fprintf(stdout, "Group [ %s ]\n", argv[i]);
2119 if (gent.nle_nnode == 0) {
2120 fprintf(stdout, "No nodes found [ %s ]\n", argv[i]);
/* size the node array from the total reported by the first query */
2124 count = gent.nle_nnode;
2126 dents = malloc(count * sizeof(struct lstcon_node_ent));
2127 if (dents == NULL) {
2128 fprintf(stderr, "Failed to malloc: %s\n",
/* second query: fetch the node entries themselves into dents */
2134 rc = lst_info_group_ioctl(argv[i], &gent, &index, &count, dents);
2136 lst_print_error("group", "Failed to list group: %s\n",
/* c is reused here as the counter reported in the total line below */
2142 for (j = 0, c = 0; j < count; j++) {
2144 ((active && dents[j].nde_state == LST_NODE_ACTIVE) ||
2145 (busy && dents[j].nde_state == LST_NODE_BUSY) ||
2146 (down && dents[j].nde_state == LST_NODE_DOWN) ||
2147 (unknown && dents[j].nde_state == LST_NODE_UNKNOWN))) {
2149 fprintf(stdout, "\t%s: %s\n",
2150 libcfs_id2str(dents[j].nde_id),
2151 lst_node_state2str(dents[j].nde_state));
2156 fprintf(stdout, "Total %d nodes [ %s ]\n", c, argv[i]);
/*
 * Request statistics through lst_ioctl(LSTIO_STAT_QUERY).
 *
 * name    - target name; strlen(name) is sent as lstio_sta_nmlen
 * count   - stored in lstio_sta_count
 * idsp    - stored in lstio_sta_idsp (callers pass srp_ids, which stays
 *           NULL unless the name was resolved as a node list)
 * timeout - stored in lstio_sta_timeout (callers use seconds)
 * resultp - result list head, stored in lstio_sta_resultp
 *
 * Returns the value returned by lst_ioctl().
 */
2165 lst_stat_ioctl(char *name, int count, struct lnet_process_id *idsp,
2166 int timeout, struct list_head *resultp)
2168 struct lstio_stat_args args = { 0 };
2170 args.lstio_sta_key = session_key;
2171 args.lstio_sta_timeout = timeout;
2172 args.lstio_sta_nmlen = strlen(name);
2173 args.lstio_sta_namep = name;
2174 args.lstio_sta_count = count;
2175 args.lstio_sta_idsp = idsp;
2176 args.lstio_sta_resultp = resultp;
2178 return lst_ioctl(LSTIO_STAT_QUERY, &args, sizeof(args));
/* links this request into the list built by jt_lst_stat() and jt_lst_show_error() */
2182 struct list_head srp_link;
/* node ids filled by lst_get_node_count(LST_OPC_NODES, ...); NULL otherwise */
2185 struct lnet_process_id *srp_ids;
/*
 * Two result lists: jt_lst_stat() fills srp_result[idx] on each round and
 * lst_print_stat() compares it with srp_result[1 - idx] from the round
 * before.  jt_lst_show_error() only uses srp_result[0].
 */
2186 struct list_head srp_result[2];
2187 } lst_stat_req_param_t;
/*
 * Release a stat request: both result lists are handed to
 * lst_free_rpcent(), and srp_ids is handled only when it is non-NULL
 * (presumably freed together with srp itself -- TODO confirm).
 */
2190 lst_stat_req_param_free(lst_stat_req_param_t *srp)
2194 for (i = 0; i < 2; i++)
2195 lst_free_rpcent(&srp->srp_result[i]);
2197 if (srp->srp_ids != NULL)
/*
 * Allocate and initialise a lst_stat_req_param_t for name.
 *
 * name     - group name or node list string; stored by pointer in srp_name
 *            (not copied), so it must outlive the request
 * srpp     - receives the new request (presumably only on success --
 *            TODO confirm)
 * save_old - non-zero: allocate both result lists so two samples can be
 *            compared; zero: allocate srp_result[0] only
 *
 * The node count is first looked up with name treated as a group
 * (LST_OPC_GROUP).  If that fails with errno == ENOENT the lookup is
 * retried with name treated as a node list (LST_OPC_NODES), which also
 * fills srp_ids.  On the failure paths shown here the request is released
 * with lst_stat_req_param_free().
 */
2204 lst_stat_req_param_alloc(char *name, lst_stat_req_param_t **srpp, int save_old)
2206 lst_stat_req_param_t *srp = NULL;
2207 int count = save_old ? 2 : 1;
2211 srp = malloc(sizeof(*srp));
/* zero everything first so that the free routine is safe on partial setup */
2215 memset(srp, 0, sizeof(*srp));
2216 INIT_LIST_HEAD(&srp->srp_result[0]);
2217 INIT_LIST_HEAD(&srp->srp_result[1]);
2219 rc = lst_get_node_count(LST_OPC_GROUP, name,
2220 &srp->srp_count, NULL);
2221 if (rc != 0 && errno == ENOENT) {
2222 rc = lst_get_node_count(LST_OPC_NODES, name,
2223 &srp->srp_count, &srp->srp_ids);
2228 "Failed to get count of nodes from %s: %s\n",
2229 name, strerror(errno));
2230 lst_stat_req_param_free(srp);
2235 srp->srp_name = name;
/*
 * One entry per node in each list.  The third argument is the combined
 * size of the three counter structures that lst_print_stat() later reads
 * back to back from rpe_payload.
 */
2237 for (i = 0; i < count; i++) {
2238 rc = lst_alloc_rpcent(&srp->srp_result[i], srp->srp_count,
2239 sizeof(struct sfw_counters) +
2240 sizeof(struct srpc_counters) +
2241 sizeof(struct lnet_counters_common));
2243 fprintf(stderr, "Out of memory\n");
2253 lst_stat_req_param_free(srp);
2261 } lst_srpc_stat_result;
/*
 * Selectors for average, minimum and maximum values.  The values match the
 * 0, 1 and 2 that lst_print_lnet_stat() passes as the off argument of
 * lst_lnet_stat_value().
 */
2263 #define LST_LNET_AVG 0
2264 #define LST_LNET_MIN 1
2265 #define LST_LNET_MAX 2
/*
 * Aggregated LNet statistics over all nodes of one report, maintained by
 * lst_cal_lnet_stat().  The rate fields are message counts per second
 * (printed as RPC/s); the perf fields are bytes per second divided by the
 * unit divisor (printed as MB/s or MiB/s).  Each group holds the average,
 * minimum, maximum and running total, in that order.
 * NOTE(review): lst_lnet_stat_value() takes the address of a single member
 * as its starting point, so it presumably depends on this member order --
 * confirm before reordering fields.
 */
2268 float lnet_avg_sndrate;
2269 float lnet_min_sndrate;
2270 float lnet_max_sndrate;
2271 float lnet_total_sndrate;
2273 float lnet_avg_rcvrate;
2274 float lnet_min_rcvrate;
2275 float lnet_max_rcvrate;
2276 float lnet_total_rcvrate;
2278 float lnet_avg_sndperf;
2279 float lnet_min_sndperf;
2280 float lnet_max_sndperf;
2281 float lnet_total_sndperf;
2283 float lnet_avg_rcvperf;
2284 float lnet_min_rcvperf;
2285 float lnet_max_rcvperf;
2286 float lnet_total_rcvperf;
/* number of node samples accumulated; divisor for the averages */
2288 int lnet_stat_count;
2289 } lst_lnet_stat_result_t;
/* file-wide accumulator; lst_print_stat() zeroes it before each report */
2291 lst_lnet_stat_result_t lnet_stat_result;
/*
 * Look up one value in lnet_stat_result.
 *
 * bw   - non-zero selects the bandwidth (perf) fields, zero the rate
 *        fields; the starting point is the average send member of that
 *        family
 * send - lst_print_lnet_stat() passes 0 for the row labelled R and 1 for
 *        the row labelled W
 * off  - 0, 1 or 2 for average, minimum or maximum (see LST_LNET_AVG,
 *        LST_LNET_MIN, LST_LNET_MAX)
 *
 * NOTE(review): how send and off are applied to p is presumably pointer
 * arithmetic over the member layout of lst_lnet_stat_result_t -- confirm.
 */
2294 lst_lnet_stat_value(int bw, int send, int off)
2298 p = bw ? &lnet_stat_result.lnet_avg_sndperf :
2299 &lnet_stat_result.lnet_avg_sndrate;
/*
 * Fold the counters of one node into lnet_stat_result.
 *
 * delta    - elapsed time between the two samples; the caller derives it
 *            from running_ms / 1000, i.e. seconds
 * lnet_new - counters of the current sample
 * lnet_old - counters of the previous sample
 * mbs      - non-zero: bandwidth divisor is 1000 * 1000; zero: 1024 * 1024
 *
 * For send/receive bandwidth and send/receive rate the per-node value is
 * added to the running total and the minimum and maximum are updated.  A
 * minimum of exactly 0 is treated as not yet set.  The four averages are
 * recomputed from the totals and the sample count at the end.
 * NOTE(review): delta is used as a divisor without a zero check in this
 * function.
 */
2310 lst_cal_lnet_stat(float delta, struct lnet_counters_common *lnet_new,
2311 struct lnet_counters_common *lnet_old, int mbs)
2315 unsigned int unit_divisor;
2317 unit_divisor = (mbs) ? (1000 * 1000) : (1024 * 1024);
/* send bandwidth: bytes sent since the previous sample, per unit, per second */
2318 perf = (float)(lnet_new->lcc_send_length -
2319 lnet_old->lcc_send_length) / unit_divisor / delta;
2320 lnet_stat_result.lnet_total_sndperf += perf;
2322 if (lnet_stat_result.lnet_min_sndperf > perf ||
2323 lnet_stat_result.lnet_min_sndperf == 0)
2324 lnet_stat_result.lnet_min_sndperf = perf;
2326 if (lnet_stat_result.lnet_max_sndperf < perf)
2327 lnet_stat_result.lnet_max_sndperf = perf;
/* receive bandwidth, same scheme */
2329 perf = (float)(lnet_new->lcc_recv_length -
2330 lnet_old->lcc_recv_length) / unit_divisor / delta;
2331 lnet_stat_result.lnet_total_rcvperf += perf;
2333 if (lnet_stat_result.lnet_min_rcvperf > perf ||
2334 lnet_stat_result.lnet_min_rcvperf == 0)
2335 lnet_stat_result.lnet_min_rcvperf = perf;
2337 if (lnet_stat_result.lnet_max_rcvperf < perf)
2338 lnet_stat_result.lnet_max_rcvperf = perf;
/* send rate: messages sent since the previous sample, per second */
2340 rate = (lnet_new->lcc_send_count - lnet_old->lcc_send_count) / delta;
2341 lnet_stat_result.lnet_total_sndrate += rate;
2343 if (lnet_stat_result.lnet_min_sndrate > rate ||
2344 lnet_stat_result.lnet_min_sndrate == 0)
2345 lnet_stat_result.lnet_min_sndrate = rate;
2347 if (lnet_stat_result.lnet_max_sndrate < rate)
2348 lnet_stat_result.lnet_max_sndrate = rate;
/* receive rate, same scheme */
2350 rate = (lnet_new->lcc_recv_count - lnet_old->lcc_recv_count) / delta;
2351 lnet_stat_result.lnet_total_rcvrate += rate;
2353 if (lnet_stat_result.lnet_min_rcvrate > rate ||
2354 lnet_stat_result.lnet_min_rcvrate == 0)
2355 lnet_stat_result.lnet_min_rcvrate = rate;
2357 if (lnet_stat_result.lnet_max_rcvrate < rate)
2358 lnet_stat_result.lnet_max_rcvrate = rate;
/* one more node sample; refresh all averages from the running totals */
2360 lnet_stat_result.lnet_stat_count++;
2362 lnet_stat_result.lnet_avg_sndrate = lnet_stat_result.lnet_total_sndrate /
2363 lnet_stat_result.lnet_stat_count;
2364 lnet_stat_result.lnet_avg_rcvrate = lnet_stat_result.lnet_total_rcvrate /
2365 lnet_stat_result.lnet_stat_count;
2367 lnet_stat_result.lnet_avg_sndperf = lnet_stat_result.lnet_total_sndperf /
2368 lnet_stat_result.lnet_stat_count;
2369 lnet_stat_result.lnet_avg_rcvperf = lnet_stat_result.lnet_total_rcvperf /
2370 lnet_stat_result.lnet_stat_count;
/*
 * Print the aggregated LNet statistics held in lnet_stat_result.
 *
 * name - label printed in the section header
 * bwrt - 1: bandwidth only, 2: rates only; other values leave the default
 *        section range unchanged
 * rdwr - 1: receive only, 2: send only; other values leave the default
 *        row range unchanged
 * type - bit mask of columns: 1 = Avg, 2 = Min, 4 = Max
 * mbs  - non-zero labels bandwidth as MB/s, zero as MiB/s
 *
 * The zero-sample case (lnet_stat_count == 0) is tested up front.
 */
2374 lst_print_lnet_stat(char *name, int bwrt, int rdwr, int type, int mbs)
2384 if (lnet_stat_result.lnet_stat_count == 0)
2387 units = (mbs) ? "MB/s " : "MiB/s ";
2389 if (bwrt == 1) /* bw only */
2392 if (bwrt == 2) /* rates only */
2395 if (rdwr == 1) /* recv only */
2398 if (rdwr == 2) /* send only */
/* outer loop: i == 0 is the Rates section, otherwise the Bandwidth section */
2401 for (i = start1; i <= end1; i++) {
2402 fprintf(stdout, "[LNet %s of %s]\n",
2403 i == 0 ? "Rates" : "Bandwidth", name);
/* inner loop: j == 0 is the row labelled R, otherwise the row labelled W */
2405 for (j = start2; j <= end2; j++) {
2406 fprintf(stdout, "[%c] ", j == 0 ? 'R' : 'W');
2408 if ((type & 1) != 0) {
2409 fprintf(stdout, i == 0 ? "Avg: %-8.0f RPC/s " :
2411 lst_lnet_stat_value(i, j, 0), units);
2414 if ((type & 2) != 0) {
2415 fprintf(stdout, i == 0 ? "Min: %-8.0f RPC/s " :
2417 lst_lnet_stat_value(i, j, 1), units);
2420 if ((type & 4) != 0) {
2421 fprintf(stdout, i == 0 ? "Max: %-8.0f RPC/s" :
2423 lst_lnet_stat_value(i, j, 2), units);
2426 fprintf(stdout, "\n");
/*
 * Compare the newest statistics sample with the previous one, node by
 * node, and print the aggregated LNet result.
 *
 * name    - label passed on to lst_print_lnet_stat()
 * resultp - array of two result lists; resultp[idx] holds the new sample
 *           and resultp[1 - idx] the previous one
 * idx     - index (0 or 1) of the new sample
 * lnet    - only the LNet statistics path is implemented; the !lnet
 *           branches are marked TODO
 * bwrt, rdwr, type, mbs - passed through to lst_print_lnet_stat() and
 *           lst_cal_lnet_stat()
 *
 * Entries are taken pairwise from the front of both lists and parked on
 * temporary lists, which are spliced back at the end so the caller keeps
 * ownership of every entry.  A mismatch in list length or peer identity is
 * treated as the group having changed between samples.
 */
2432 lst_print_stat(char *name, struct list_head *resultp,
2433 int idx, int lnet, int bwrt, int rdwr, int type,
2436 struct list_head tmp[2];
2437 struct lstcon_rpc_ent *new;
2438 struct lstcon_rpc_ent *old;
2439 struct sfw_counters *sfwk_new;
2440 struct sfw_counters *sfwk_old;
2441 struct srpc_counters *srpc_new;
2442 struct srpc_counters *srpc_old;
2443 struct lnet_counters_common *lnet_new;
2444 struct lnet_counters_common *lnet_old;
2448 INIT_LIST_HEAD(&tmp[0]);
2449 INIT_LIST_HEAD(&tmp[1]);
/* start every report from a clean accumulator */
2451 memset(&lnet_stat_result, 0, sizeof(lnet_stat_result));
2453 while (!list_empty(&resultp[idx])) {
2454 if (list_empty(&resultp[1 - idx])) {
2455 fprintf(stderr, "Group is changed, re-run stat\n");
2459 new = list_first_entry(&resultp[idx], struct lstcon_rpc_ent,
2461 old = list_first_entry(&resultp[1 - idx], struct lstcon_rpc_ent,
2464 /* first time get stats result, can't calculate diff */
2465 if (new->rpe_peer.nid == LNET_NID_ANY)
2468 if (new->rpe_peer.nid != old->rpe_peer.nid ||
2469 new->rpe_peer.pid != old->rpe_peer.pid) {
2470 /* Something wrong. i.e, somebody change the group */
/* park the matched pair on the temporary lists */
2474 list_move_tail(&new->rpe_link, &tmp[idx]);
2476 list_move_tail(&old->rpe_link, &tmp[1 - idx]);
/* any RPC or framework error on either sample excludes this node */
2478 if (new->rpe_rpc_errno != 0 || new->rpe_fwk_errno != 0 ||
2479 old->rpe_rpc_errno != 0 || old->rpe_fwk_errno != 0) {
/*
 * The payload starts with struct sfw_counters; the srpc and lnet counter
 * structures are located at offsets computed from that start.
 */
2484 sfwk_new = (struct sfw_counters *)&new->rpe_payload[0];
2485 sfwk_old = (struct sfw_counters *)&old->rpe_payload[0];
2487 srpc_new = (struct srpc_counters *)((char *)sfwk_new +
2489 srpc_old = (struct srpc_counters *)((char *)sfwk_old +
2492 lnet_new = (struct lnet_counters_common *)((char *)srpc_new +
2494 lnet_old = (struct lnet_counters_common *)((char *)srpc_old +
2497 /* Prior to version 2.3, the running_ms was a counter for
2498 * the number of running tests. Since 2.3, running_ms is
2499 * changed to hold the millisecond since the start of
2500 * the work item. The rpe_stamp field was formerly used,
2501 * but is no longer. In 2.12 rpe_stamp was changed to
2502 * struct timespec64 and has nanosecond resolution, in
2503 * case it is needed in the future.
2505 delta = (float)(sfwk_new->running_ms -
2506 sfwk_old->running_ms) / 1000;
2508 if (!lnet) /* TODO */
2511 lst_cal_lnet_stat(delta, lnet_new, lnet_old, mbs);
/* hand all parked entries back to the caller-owned lists */
2514 list_splice(&tmp[idx], &resultp[idx]);
2515 list_splice(&tmp[1 - idx], &resultp[1 - idx]);
2518 fprintf(stdout, "Failed to stat on %d nodes\n", errcount);
2520 if (!lnet) /* TODO */
2523 lst_print_lnet_stat(name, bwrt, rdwr, type, mbs);
/*
 * Command handler that periodically samples and prints statistics for one
 * or more groups or node lists.
 *
 * Options (stat_opts): --timeout/-t <sec>, --delay/-d <sec>,
 * --count <n>, --lnet/-l, --rpc/-c, --bw/-b, --rate/-a, --read/-r,
 * --write/-w, --avg/-g, --min/-n, --max/-x and --mbs/-m.
 * NOTE(review): --count maps to the value 'o', but the short option string
 * "t:d:lcbarwgnxm" contains no 'o', so only the long form is accepted.
 *
 * At least one target name is required.  timeout and delay must be
 * positive.  One lst_stat_req_param_t is allocated per target with both
 * result lists.  Each round queries every target into srp_result[idx],
 * prints the difference against the other list and resets that other list
 * for reuse.  All requests are freed before returning.
 */
2527 jt_lst_stat(int argc, char **argv)
2529 struct list_head head;
2530 lst_stat_req_param_t *srp;
2533 int timeout = 5; /* default timeout, 5 sec */
2534 int delay = 5; /* default delay, 5 sec */
2535 int count = -1; /* run forever */
2536 int lnet = 1; /* lnet stat by default */
2543 int mbs = 0; /* report as MB/s */
2545 static const struct option stat_opts[] = {
2546 { .name = "timeout", .has_arg = required_argument, .val = 't' },
2547 { .name = "delay", .has_arg = required_argument, .val = 'd' },
2548 { .name = "count", .has_arg = required_argument, .val = 'o' },
2549 { .name = "lnet", .has_arg = no_argument, .val = 'l' },
2550 { .name = "rpc", .has_arg = no_argument, .val = 'c' },
2551 { .name = "bw", .has_arg = no_argument, .val = 'b' },
2552 { .name = "rate", .has_arg = no_argument, .val = 'a' },
2553 { .name = "read", .has_arg = no_argument, .val = 'r' },
2554 { .name = "write", .has_arg = no_argument, .val = 'w' },
2555 { .name = "avg", .has_arg = no_argument, .val = 'g' },
2556 { .name = "min", .has_arg = no_argument, .val = 'n' },
2557 { .name = "max", .has_arg = no_argument, .val = 'x' },
2558 { .name = "mbs", .has_arg = no_argument, .val = 'm' },
2561 if (session_key == 0) {
2563 "Can't find env LST_SESSION or value is not valid\n");
2568 c = getopt_long(argc, argv, "t:d:lcbarwgnxm", stat_opts,
/* atoi() yields 0 for non-numeric text; the range checks below reject that for timeout and delay */
2576 timeout = atoi(optarg);
2579 delay = atoi(optarg);
2582 count = atoi(optarg);
2628 lst_print_usage(argv[0]);
/* no target name left after the options */
2633 if (optind == argc) {
2634 lst_print_usage(argv[0]);
2638 if (timeout <= 0 || delay <= 0) {
2639 fprintf(stderr, "Invalid timeout or delay value\n");
2644 fprintf(stderr, "Invalid count value\n");
2648 /* extra count to get first data point */
2652 INIT_LIST_HEAD(&head);
/* one request per remaining argument; save_old = 1 allocates both result lists */
2654 while (optind < argc) {
2655 rc = lst_stat_req_param_alloc(argv[optind++], &srp, 1);
2659 list_add_tail(&srp->srp_link, &head);
2663 time_t now = time(NULL);
/* keep at least delay seconds between two sampling rounds */
2665 if (now - last < delay) {
2666 sleep(delay - now + last);
2671 list_for_each_entry(srp, &head, srp_link) {
2672 rc = lst_stat_ioctl(srp->srp_name,
2673 srp->srp_count, srp->srp_ids,
2674 timeout, &srp->srp_result[idx]);
2676 lst_print_error("stat", "Failed to stat %s: %s\n",
2677 srp->srp_name, strerror(errno));
2681 lst_print_stat(srp->srp_name, srp->srp_result,
2682 idx, lnet, bwrt, rdwr, type, mbs);
/* the older sample has been consumed; reset it so it can take the next round */
2684 lst_reset_rpcent(&srp->srp_result[1 - idx]);
/* count == -1 means run until interrupted */
2691 } while (count == -1 || count > 0);
2694 while (!list_empty(&head)) {
2695 srp = list_first_entry(&head, lst_stat_req_param_t, srp_link);
2697 list_del(&srp->srp_link);
2698 lst_stat_req_param_free(srp);
/*
 * Command handler that reports error counters for one or more groups or
 * node lists.
 *
 * Option (show_error_opts): -s/--session.  At least one target name is
 * required.  One request per target is allocated with a single result
 * list, and each target is queried once with a fixed timeout of 10.
 *
 * For every result entry, an RPC failure or a framework failure is
 * reported on stderr.  Otherwise the session counters (brw and ping
 * errors) are printed, followed by the RPC counters (errors, dropped,
 * expired) depending on show_rpc.  A per-target total of error nodes goes
 * to stdout.  All requests are freed before returning.
 */
2705 jt_lst_show_error(int argc, char **argv)
2707 struct list_head head;
2708 lst_stat_req_param_t *srp;
2709 struct lstcon_rpc_ent *ent;
2710 struct sfw_counters *sfwk;
2711 struct srpc_counters *srpc;
2718 static const struct option show_error_opts[] = {
2719 { .name = "session", .has_arg = no_argument, .val = 's' },
2720 { .name = NULL, } };
2722 if (session_key == 0) {
2724 "Can't find env LST_SESSION or value is not valid\n");
2729 c = getopt_long(argc, argv, "s", show_error_opts, &optidx);
2740 lst_print_usage(argv[0]);
2745 if (optind == argc) {
2746 lst_print_usage(argv[0]);
2750 INIT_LIST_HEAD(&head);
/* save_old = 0: a single sample is enough, only srp_result[0] is allocated */
2752 while (optind < argc) {
2753 rc = lst_stat_req_param_alloc(argv[optind++], &srp, 0);
2757 list_add_tail(&srp->srp_link, &head);
2760 list_for_each_entry(srp, &head, srp_link) {
2761 rc = lst_stat_ioctl(srp->srp_name, srp->srp_count,
2762 srp->srp_ids, 10, &srp->srp_result[0]);
2765 lst_print_error(srp->srp_name, "Failed to show errors of %s: %s\n",
2766 srp->srp_name, strerror(errno));
2770 fprintf(stdout, "%s:\n", srp->srp_name);
2774 list_for_each_entry(ent, &srp->srp_result[0], rpe_link) {
2775 if (ent->rpe_rpc_errno != 0) {
2777 fprintf(stderr, "RPC failure, can't show error on %s\n",
2778 libcfs_id2str(ent->rpe_peer));
2782 if (ent->rpe_fwk_errno != 0) {
2784 fprintf(stderr, "Framework failure, can't show error on %s\n",
2785 libcfs_id2str(ent->rpe_peer));
/* the payload starts with sfw_counters, directly followed by srpc_counters */
2789 sfwk = (struct sfw_counters *)&ent->rpe_payload[0];
2790 srpc = (struct srpc_counters *)((char *)sfwk + sizeof(*sfwk));
/* nothing to report for a node whose error counters are all zero */
2792 if (srpc->errors == 0 &&
2793 sfwk->brw_errors == 0 && sfwk->ping_errors == 0)
2797 sfwk->brw_errors == 0 && sfwk->ping_errors == 0)
/* the trailing character keeps the line open when RPC counters follow */
2802 fprintf(stderr, "%s: [Session %d brw errors, %d ping errors]%c",
2803 libcfs_id2str(ent->rpe_peer),
2804 sfwk->brw_errors, sfwk->ping_errors,
2805 show_rpc ? ' ' : '\n');
2810 fprintf(stderr, "[RPC: %d errors, %d dropped, %d expired]\n",
2811 srpc->errors, srpc->rpcs_dropped, srpc->rpcs_expired);
2814 fprintf(stdout, "Total %d error nodes in %s\n", ecount, srp->srp_name);
2817 while (!list_empty(&head)) {
2818 srp = list_first_entry(&head, lst_stat_req_param_t, srp_link);
2820 list_del(&srp->srp_link);
2821 lst_stat_req_param_free(srp);
/*
 * Create a batch through lst_ioctl(LSTIO_BATCH_ADD).
 *
 * name - batch name; strlen(name) is sent as lstio_bat_nmlen
 *
 * Returns the value returned by lst_ioctl().
 */
2828 lst_add_batch_ioctl(char *name)
2830 struct lstio_batch_add_args args = { 0 };
2832 args.lstio_bat_key = session_key;
2833 args.lstio_bat_nmlen = strlen(name);
2834 args.lstio_bat_namep = name;
2836 return lst_ioctl (LSTIO_BATCH_ADD, &args, sizeof(args));
/*
 * Command handler that creates a batch.  The batch name must be shorter
 * than LST_NAME_SIZE characters; the request is sent with
 * lst_add_batch_ioctl() and a failure is reported through
 * lst_print_error().
 */
2840 jt_lst_add_batch(int argc, char **argv)
2845 if (session_key == 0) {
2847 "Can't find env LST_SESSION or value is not valid\n");
2852 lst_print_usage(argv[0]);
/* >= because the name needs room for its terminating NUL in LST_NAME_SIZE bytes (presumably -- TODO confirm) */
2857 if (strlen(name) >= LST_NAME_SIZE) {
2858 fprintf(stderr, "Name length is limited to %d\n",
2863 rc = lst_add_batch_ioctl(name);
2867 lst_print_error("batch", "Failed to create batch: %s\n",
/*
 * Start a batch through lst_ioctl(LSTIO_BATCH_START).
 *
 * name    - batch name; strlen(name) is sent as lstio_bat_nmlen
 * timeout - stored in lstio_bat_timeout
 * resultp - result list head, stored in lstio_bat_resultp
 *
 * Returns the value returned by lst_ioctl().
 */
2874 lst_start_batch_ioctl(char *name, int timeout, struct list_head *resultp)
2876 struct lstio_batch_run_args args = { 0 };
2878 args.lstio_bat_key = session_key;
2879 args.lstio_bat_timeout = timeout;
2880 args.lstio_bat_nmlen = strlen(name);
2881 args.lstio_bat_namep = name;
2882 args.lstio_bat_resultp = resultp;
2884 return lst_ioctl(LSTIO_BATCH_START, &args, sizeof(args));
/*
 * Command handler that starts a batch.
 *
 * Option (start_batch_opts): -t/--timeout <value>, parsed with atoi().
 * With no positional argument the batch LST_DEFAULT_BATCH is used; with
 * exactly one, that argument names the batch; anything else prints the
 * usage text.
 *
 * One result entry per client node of the batch (LST_OPC_BATCHCLI) is
 * allocated, the batch is started with lst_start_batch_ioctl(), and the
 * result list is released on every exit path after the ioctl.
 */
2888 jt_lst_start_batch(int argc, char **argv)
2890 struct list_head head;
2898 static const struct option start_batch_opts[] = {
2899 { .name = "timeout", .has_arg = required_argument, .val = 't' },
2902 if (session_key == 0) {
2904 "Can't find env LST_SESSION or value is not valid\n");
2909 c = getopt_long(argc, argv, "t:",
2910 start_batch_opts, &optidx);
2912 /* Detect the end of the options. */
2918 timeout = atoi(optarg);
2921 lst_print_usage(argv[0]);
2926 if (optind == argc) {
2927 batch = LST_DEFAULT_BATCH;
2929 } else if (optind == argc - 1) {
2930 batch = argv[optind];
2933 lst_print_usage(argv[0]);
2937 rc = lst_get_node_count(LST_OPC_BATCHCLI, batch, &count, NULL);
2939 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
2940 batch, strerror(errno));
2944 INIT_LIST_HEAD(&head);
2946 rc = lst_alloc_rpcent(&head, count, 0);
2948 fprintf(stderr, "Out of memory\n");
2952 rc = lst_start_batch_ioctl(batch, timeout, &head);
2955 fprintf(stdout, "%s is running now\n", batch);
2956 lst_free_rpcent(&head);
2961 lst_print_error("batch", "Failed to start batch: %s\n",
2963 lst_free_rpcent(&head);
2967 lst_print_transerr(&head, "Run batch");
2969 lst_free_rpcent(&head);
/*
 * Stop a batch through lst_ioctl(LSTIO_BATCH_STOP).
 *
 * name    - batch name; strlen(name) is sent as lstio_bat_nmlen
 * force   - stored in lstio_bat_force
 * resultp - result list head, stored in lstio_bat_resultp
 *
 * Returns the value returned by lst_ioctl().
 */
2975 lst_stop_batch_ioctl(char *name, int force, struct list_head *resultp)
2977 struct lstio_batch_stop_args args = { 0 };
2979 args.lstio_bat_key = session_key;
2980 args.lstio_bat_force = force;
2981 args.lstio_bat_nmlen = strlen(name);
2982 args.lstio_bat_namep = name;
2983 args.lstio_bat_resultp = resultp;
2985 return lst_ioctl(LSTIO_BATCH_STOP, &args, sizeof(args));
/*
 * Command handler that stops a batch.
 *
 * Option (stop_batch_opts): -f/--force.  With no positional argument the
 * batch LST_DEFAULT_BATCH is used; with exactly one, that argument names
 * the batch; anything else prints the usage text.
 *
 * After lst_stop_batch_ioctl() the batch is queried again with
 * lst_query_batch_ioctl() (test 0, server 0, timeout 30).  The batch is
 * considered stopped once the query reports neither running nor failed
 * entries; otherwise the number still running is printed (presumably the
 * query is repeated until then -- TODO confirm).  The result list is
 * released on every exit path after the ioctl.
 */
2989 jt_lst_stop_batch(int argc, char **argv)
2991 struct list_head head;
2999 static const struct option stop_batch_opts[] = {
3000 { .name = "force", .has_arg = no_argument, .val = 'f' },
3003 if (session_key == 0) {
3005 "Can't find env LST_SESSION or value is not valid\n");
3010 c = getopt_long(argc, argv, "f",
3011 stop_batch_opts, &optidx);
3013 /* Detect the end of the options. */
3022 lst_print_usage(argv[0]);
3027 if (optind == argc) {
3028 batch = LST_DEFAULT_BATCH;
3030 } else if (optind == argc - 1) {
3031 batch = argv[optind];
3034 lst_print_usage(argv[0]);
3038 rc = lst_get_node_count(LST_OPC_BATCHCLI, batch, &count, NULL);
3040 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
3041 batch, strerror(errno));
3045 INIT_LIST_HEAD(&head);
3047 rc = lst_alloc_rpcent(&head, count, 0);
3049 fprintf(stderr, "Out of memory\n");
3053 rc = lst_stop_batch_ioctl(batch, force, &head);
/* reuse the same result entries for the follow-up query */
3058 lst_reset_rpcent(&head);
3060 rc = lst_query_batch_ioctl(batch, 0, 0, 30, &head);
3064 if (lstcon_tsbqry_stat_run(&trans_stat, 0) == 0 &&
3065 lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0)
3068 fprintf(stdout, "%d batch in stopping\n",
3069 lstcon_tsbqry_stat_run(&trans_stat, 0));
3073 fprintf(stdout, "Batch is stopped\n");
3074 lst_free_rpcent(&head);
3079 lst_print_error("batch", "Failed to stop batch: %s\n",
3081 lst_free_rpcent(&head);
3085 lst_print_transerr(&head, "stop batch");
3087 lst_free_rpcent(&head);
/*
 * Ask for the name of the batch at position index through
 * lst_ioctl(LSTIO_BATCH_LIST).
 *
 * len   - sent as lstio_bat_nmlen; lst_list_batch_all() passes the size of
 *         its name buffer (LST_NAME_SIZE)
 * name  - buffer sent as lstio_bat_namep
 * index - zero-based batch index (the caller iterates from 0)
 *
 * Returns the value returned by lst_ioctl().
 */
3093 lst_list_batch_ioctl(int len, char *name, int index)
3095 struct lstio_batch_list_args args = { 0 };
3097 args.lstio_bat_key = session_key;
3098 args.lstio_bat_idx = index;
3099 args.lstio_bat_nmlen = len;
3100 args.lstio_bat_namep = name;
3102 return lst_ioctl(LSTIO_BATCH_LIST, &args, sizeof(args));
/*
 * Query information about a batch, or one test inside it, through
 * lst_ioctl(LSTIO_BATCH_INFO).
 *
 * batch  - batch name; strlen(batch) is sent as lstio_bat_nmlen
 * test   - stored in lstio_bat_testidx; callers treat values above 0 as a
 *          test id and 0 as the batch itself
 * server - stored in lstio_bat_server
 * entp   - summary entry, stored in lstio_bat_entp; may be NULL
 * idxp   - stored in lstio_bat_idxp; may be NULL
 * ndentp - stored in lstio_bat_ndentp; may be NULL
 * dentsp - node entry array, stored in lstio_bat_dentsp; may be NULL
 *
 * Returns the value returned by lst_ioctl().
 */
3106 lst_info_batch_ioctl(char *batch, int test, int server,
3107 struct lstcon_test_batch_ent *entp, int *idxp,
3108 int *ndentp, struct lstcon_node_ent *dentsp)
3110 struct lstio_batch_info_args args = { 0 };
3112 args.lstio_bat_key = session_key;
3113 args.lstio_bat_nmlen = strlen(batch);
3114 args.lstio_bat_namep = batch;
3115 args.lstio_bat_server = server;
3116 args.lstio_bat_testidx = test;
3117 args.lstio_bat_entp = entp;
3118 args.lstio_bat_idxp = idxp;
3119 args.lstio_bat_ndentp = ndentp;
3120 args.lstio_bat_dentsp = dentsp;
3122 return lst_ioctl(LSTIO_BATCH_INFO, &args, sizeof(args));
/*
 * Print the names of all batches, one numbered line per batch, followed by
 * a total line.  Batches are fetched one index at a time with
 * lst_list_batch_ioctl(); errno == ENOENT is tested after a failed call
 * (presumably the normal end-of-list condition -- TODO confirm), any other
 * failure is reported through lst_print_error().
 */
3126 lst_list_batch_all(void)
3128 char name[LST_NAME_SIZE];
3132 for (i = 0; ; i++) {
3133 rc = lst_list_batch_ioctl(LST_NAME_SIZE, name, i);
/* displayed numbering is 1-based, the ioctl index is 0-based */
3135 fprintf(stdout, "%d) %s\n", i + 1, name);
3139 if (errno == ENOENT)
3142 lst_print_error("batch", "Failed to list batch: %s\n",
3147 fprintf(stdout, "Total %d batches\n", i);
/*
 * List the nodes of a batch or of one test in a batch.
 *
 * batch   - batch name
 * test    - test id; values above 0 select the test wording in error
 *           messages, otherwise the batch wording is used
 * server  - passed to lst_info_batch_ioctl()
 * count   - number of node entries to allocate and request
 * active  - zero filters out nodes in state LST_NODE_ACTIVE
 * invalid - zero filters out nodes in state LST_NODE_BUSY, LST_NODE_DOWN
 *           or LST_NODE_UNKNOWN
 *
 * Each listed node is printed as id and state name, followed by a total
 * line.
 */
3153 lst_list_tsb_nodes(char *batch, int test, int server,
3154 int count, int active, int invalid)
3156 struct lstcon_node_ent *dents;
3165 /* verbose list, show nodes in batch or test */
3166 dents = malloc(count * sizeof(struct lstcon_node_ent));
3167 if (dents == NULL) {
3168 fprintf(stdout, "Can't allocate memory\n");
/* no summary entry is requested here (entp is NULL), only the node entries */
3172 rc = lst_info_batch_ioctl(batch, test, server,
3173 NULL, &index, &count, dents);
3176 lst_print_error((test > 0) ? "test" : "batch",
3177 (test > 0) ? "Failed to query test: %s\n" :
3178 "Failed to query batch: %s\n",
/* c is the counter reported in the total line below */
3183 for (i = 0, c = 0; i < count; i++) {
3184 if ((!active && dents[i].nde_state == LST_NODE_ACTIVE) ||
3185 (!invalid && (dents[i].nde_state == LST_NODE_BUSY ||
3186 dents[i].nde_state == LST_NODE_DOWN ||
3187 dents[i].nde_state == LST_NODE_UNKNOWN)))
3190 fprintf(stdout, "\t%s: %s\n",
3191 libcfs_id2str(dents[i].nde_id),
3192 lst_node_state2str(dents[i].nde_state));
3196 fprintf(stdout, "Total %d nodes\n", c);
/*
 * Command handler for listing batches, the tests of a batch, or the nodes
 * of a batch or test.
 *
 * Options (list_batch_opts, short string "ailst:"): -t/--test <id>,
 * -i/--invalid, -a/--active, -l/--all and -s/--server.  The active,
 * invalid and all options switch on verbose (per-node) output.
 *
 * Without a positional argument all batch names are printed with
 * lst_list_batch_all().  Otherwise exactly one batch name is expected.
 * The batch or test is queried with lst_info_batch_ioctl(); in verbose
 * mode the nodes are listed with lst_list_tsb_nodes(), otherwise the batch
 * or test header and the client/server node counters are printed.
 */
3203 jt_lst_list_batch(int argc, char **argv)
3205 struct lstcon_test_batch_ent ent;
3208 int verbose = 0; /* list nodes in batch or test */
3217 static const struct option list_batch_opts[] = {
3218 { .name = "test", .has_arg = required_argument, .val = 't' },
3219 { .name = "invalid", .has_arg = no_argument, .val = 'i' },
3220 { .name = "active", .has_arg = no_argument, .val = 'a' },
3221 { .name = "all", .has_arg = no_argument, .val = 'l' },
3222 { .name = "server", .has_arg = no_argument, .val = 's' },
3223 { .name = NULL, } };
3225 if (session_key == 0) {
3227 "Can't find env LST_SESSION or value is not valid\n");
3232 c = getopt_long(argc, argv, "ailst:",
3233 list_batch_opts, &optidx);
3240 verbose = active = 1;
3243 verbose = invalid = 1;
3246 verbose = active = invalid = 1;
3252 test = atoi(optarg);
3256 lst_print_usage(argv[0]);
3261 if (optind == argc) {
3262 /* list all batches */
3263 rc = lst_list_batch_all();
/* a test id was requested but did not parse to a positive number */
3267 if (ntest == 1 && test <= 0) {
3268 fprintf(stderr, "Invalid test id, test id starts from 1\n");
3272 if (optind != argc - 1) {
3273 lst_print_usage(argv[0]);
3277 batch = argv[optind];
3280 /* show detail of specified batch or test */
3281 rc = lst_info_batch_ioctl(batch, test, server,
3282 &ent, NULL, NULL, NULL);
3284 lst_print_error((test > 0) ? "test" : "batch",
3285 (test > 0) ? "Failed to query test: %s\n" :
3286 "Failed to query batch: %s\n",
3292 /* list nodes in test or batch */
3293 rc = lst_list_tsb_nodes(batch, test, server,
3294 server ? ent.tbe_srv_nle.nle_nnode :
3295 ent.tbe_cli_nle.nle_nnode,
3300 /* only show number of hosts in batch or test */
3302 fprintf(stdout, "Batch: %s Tests: %d State: %d\n",
3303 batch, ent.u.tbe_batch.bae_ntest,
3304 ent.u.tbe_batch.bae_state);
/* continue with the individual tests of the batch */
3305 ntest = ent.u.tbe_batch.bae_ntest;
3306 test = 1; /* starting from test 1 */
3310 "\tTest %d(%s) (loop: %d, concurrency: %d)\n",
3311 test, lst_test_type2name(ent.u.tbe_test.tse_type),
3312 ent.u.tbe_test.tse_loop,
3313 ent.u.tbe_test.tse_concur);
/* counter rows: active, busy, down, unknown, total -- client side first */
3318 fprintf(stdout, LST_NODES_TITLE);
3319 fprintf(stdout, "client\t%d\t%d\t%d\t%d\t%d\n"
3320 "server\t%d\t%d\t%d\t%d\t%d\n",
3321 ent.tbe_cli_nle.nle_nactive,
3322 ent.tbe_cli_nle.nle_nbusy,
3323 ent.tbe_cli_nle.nle_ndown,
3324 ent.tbe_cli_nle.nle_nunknown,
3325 ent.tbe_cli_nle.nle_nnode,
3326 ent.tbe_srv_nle.nle_nactive,
3327 ent.tbe_srv_nle.nle_nbusy,
3328 ent.tbe_srv_nle.nle_ndown,
3329 ent.tbe_srv_nle.nle_nunknown,
3330 ent.tbe_srv_nle.nle_nnode);
/*
 * Query the run state of a batch or test through
 * lst_ioctl(LSTIO_BATCH_QUERY).
 *
 * batch   - batch name; strlen(batch) is sent as lstio_bat_nmlen
 * test    - stored in lstio_bat_testidx
 * server  - inverted into lstio_bat_client: 0 queries the client side,
 *           any non-zero value the server side
 * timeout - stored in lstio_bat_timeout
 * head    - result list head, stored in lstio_bat_resultp
 *
 * Returns the value returned by lst_ioctl().
 */
3339 lst_query_batch_ioctl(char *batch, int test, int server,
3340 int timeout, struct list_head *head)
3342 struct lstio_batch_query_args args = { 0 };
3344 args.lstio_bat_key = session_key;
3345 args.lstio_bat_testidx = test;
3346 args.lstio_bat_client = !(server);
3347 args.lstio_bat_timeout = timeout;
3348 args.lstio_bat_nmlen = strlen(batch);
3349 args.lstio_bat_namep = batch;
3350 args.lstio_bat_resultp = head;
3352 return lst_ioctl(LSTIO_BATCH_QUERY, &args, sizeof(args));
/*
 * Print one line per query result entry: peer id, node state and either
 * the RPC error text or Running / Idle, where rpe_priv[0] > 0 means
 * running.
 *
 * head   - list of struct lstcon_rpc_ent
 * active - tested together with rpe_priv[0] == 0 (an idle entry)
 * idle   - tested together with rpe_priv[0] != 0 (a running entry)
 * error  - tested together with rpe_fwk_errno == 0 (no framework error)
 *
 * NOTE(review): the three tests presumably skip the entry when they match,
 * so each flag would suppress the entries of the opposite kind -- confirm.
 */
3356 lst_print_tsb_verbose(struct list_head *head,
3357 int active, int idle, int error)
3359 struct lstcon_rpc_ent *ent;
3361 list_for_each_entry(ent, head, rpe_link) {
3362 if (ent->rpe_priv[0] == 0 && active)
3365 if (ent->rpe_priv[0] != 0 && idle)
3368 if (ent->rpe_fwk_errno == 0 && error)
3371 fprintf(stdout, "%s [%s]: %s\n",
3372 libcfs_id2str(ent->rpe_peer),
3373 lst_node_state2str(ent->rpe_state),
3374 ent->rpe_rpc_errno != 0 ?
3375 strerror(ent->rpe_rpc_errno) :
3376 (ent->rpe_priv[0] > 0 ? "Running" : "Idle"));
/*
 * Command handler that repeatedly queries the run state of a batch or of
 * one test in it.
 *
 * Options (query_batch_opts, short string "o:d:c:t:saiel"):
 * -o/--timeout <sec>, -d/--delay <sec>, -c/--loop <n>, -t/--test <id>,
 * -s/--server, -a/--active, -i/--idle, -e/--error and -l/--all.
 * test must not be negative; timeout, delay and loop must be positive.
 * With no positional argument LST_DEFAULT_BATCH is queried; with exactly
 * one, that argument names the batch.
 *
 * The node count of the client or server side is read with
 * lst_info_batch_ioctl(), result entries are allocated once, and the query
 * is repeated loop times with at least delay seconds between rounds.  Each
 * round prints either the per-node lines (verbose) or a one-line summary.
 */
3381 jt_lst_query_batch(int argc, char **argv)
3383 struct lstcon_test_batch_ent ent;
3384 struct list_head head;
3390 int timeout = 5; /* default 5 seconds */
3391 int delay = 5; /* default 5 seconds */
3392 int loop = 1; /* default 1 loop */
3402 static const struct option query_batch_opts[] = {
3403 { .name = "timeout", .has_arg = required_argument, .val = 'o' },
3404 { .name = "delay", .has_arg = required_argument, .val = 'd' },
3405 { .name = "loop", .has_arg = required_argument, .val = 'c' },
3406 { .name = "test", .has_arg = required_argument, .val = 't' },
3407 { .name = "server", .has_arg = no_argument, .val = 's' },
3408 { .name = "active", .has_arg = no_argument, .val = 'a' },
3409 { .name = "idle", .has_arg = no_argument, .val = 'i' },
3410 { .name = "error", .has_arg = no_argument, .val = 'e' },
3411 { .name = "all", .has_arg = no_argument, .val = 'l' },
3412 { .name = NULL, } };
3414 if (session_key == 0) {
3416 "Can't find env LST_SESSION or value is not valid\n");
3421 c = getopt_long(argc, argv, "o:d:c:t:saiel",
3422 query_batch_opts, &optidx);
3424 /* Detect the end of the options. */
3430 timeout = atoi(optarg);
3433 delay = atoi(optarg);
3436 loop = atoi(optarg);
3439 test = atoi(optarg);
3445 active = verbose = 1;
3451 error = verbose = 1;
3457 lst_print_usage(argv[0]);
/* atoi() yields 0 for non-numeric text, which this check rejects for timeout, delay and loop */
3462 if (test < 0 || timeout <= 0 || delay <= 0 || loop <= 0) {
3463 lst_print_usage(argv[0]);
3467 if (optind == argc) {
3468 batch = LST_DEFAULT_BATCH;
3470 } else if (optind == argc - 1) {
3471 batch = argv[optind];
3474 lst_print_usage(argv[0]);
3479 INIT_LIST_HEAD(&head);
/* summary only: used to learn how many result entries are needed */
3482 rc = lst_info_batch_ioctl(batch, test, server,
3483 &ent, NULL, NULL, NULL);
3485 fprintf(stderr, "Failed to query %s [%d]: %s\n",
3486 batch, test, strerror(errno));
3490 count = server ? ent.tbe_srv_nle.nle_nnode :
3491 ent.tbe_cli_nle.nle_nnode;
3493 fprintf(stdout, "Batch or test is empty\n");
3498 rc = lst_alloc_rpcent(&head, count, 0);
3500 fprintf(stderr, "Out of memory\n");
3504 for (i = 0; i < loop; i++) {
3505 time_t now = time(NULL);
/* keep at least delay seconds between two query rounds */
3507 if (now - last < delay) {
3508 sleep(delay - now + last);
3514 rc = lst_query_batch_ioctl(batch, test,
3515 server, timeout, &head);
3517 fprintf(stderr, "Failed to query batch: %s\n",
3524 lst_print_tsb_verbose(&head, active, idle, error);
3528 fprintf(stdout, "%s [%d] ", batch, test);
3530 if (lstcon_rpc_stat_failure(&trans_stat, 0) != 0) {
3531 fprintf(stdout, "%d of %d nodes are unknown, ",
3532 lstcon_rpc_stat_failure(&trans_stat, 0),
3533 lstcon_rpc_stat_total(&trans_stat, 0));
/* no RPC failure, nothing running and nothing failed: stopped */
3536 if (lstcon_rpc_stat_failure(&trans_stat, 0) == 0 &&
3537 lstcon_tsbqry_stat_run(&trans_stat, 0) == 0 &&
3538 lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0) {
3539 fprintf(stdout, "is stopped\n");
/* no RPC failure, nothing idle and nothing failed: running */
3543 if (lstcon_rpc_stat_failure(&trans_stat, 0) == 0 &&
3544 lstcon_tsbqry_stat_idle(&trans_stat, 0) == 0 &&
3545 lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0) {
3546 fprintf(stdout, "is running\n");
/* mixed state: print the individual counters */
3550 fprintf(stdout, "stopped: %d , running: %d, failed: %d\n",
3551 lstcon_tsbqry_stat_idle(&trans_stat, 0),
3552 lstcon_tsbqry_stat_run(&trans_stat, 0),
3553 lstcon_tsbqry_stat_failure(&trans_stat, 0));
3556 lst_free_rpcent(&head);
/*
 * Parse a distribution string that contains a colon.
 *
 * dstr - input string; the part after the first colon is converted with
 *        atoi() and stored in *span
 * dist - output (presumably the number before the colon -- TODO confirm)
 * span - output, see above
 *
 * NOTE(review): atoi() does not report conversion errors, so any
 * validation has to be a range check on the resulting values.
 */
3562 lst_parse_distribute(char *dstr, int *dist, int *span)
3568 dstr = strchr(dstr, ':');
3572 *span = atoi(dstr + 1);
/*
 * Fill a bulk test parameter block from command line words.
 *
 * Defaults: size 4096, operation LST_BRW_READ, flags LST_BRW_CHECK_NONE,
 * client and server offsets 0.
 *
 * Recognised words (keywords are matched case-insensitively):
 *   check=<full|simple> or c=...  sets blk_flags
 *   size=<n>[k|K|m|M]  or s=...   sets blk_size; must be positive and must
 *                                 not exceed LNET_MTU after scaling
 *   off=<n>                       sets both offsets; must be non-negative
 *                                 and a multiple of sizeof(__u64)
 *   read or r                     sets blk_opc to LST_BRW_READ
 *   write or w                    sets blk_opc to LST_BRW_WRITE
 * Anything else is reported as an unknown parameter.
 *
 * NOTE(review): the k/m scaling multiplies blk_size before the LNET_MTU
 * comparison, so a very large number with a suffix could overflow first --
 * confirm the type of blk_size.
 */
3580 lst_get_bulk_param(int argc, char **argv, struct lst_test_bulk_param *bulk)
3587 bulk->blk_size = 4096;
3588 bulk->blk_opc = LST_BRW_READ;
3589 bulk->blk_flags = LST_BRW_CHECK_NONE;
3590 bulk->blk_srv_off = bulk->blk_cli_off = 0;
/* strcasestr(...) == argv[i] means the keyword is a prefix of the word */
3593 if (strcasestr(argv[i], "check=") == argv[i] ||
3594 strcasestr(argv[i], "c=") == argv[i]) {
3595 tok = strchr(argv[i], '=') + 1;
3597 if (strcasecmp(tok, "full") == 0) {
3598 bulk->blk_flags = LST_BRW_CHECK_FULL;
3599 } else if (strcasecmp(tok, "simple") == 0) {
3600 bulk->blk_flags = LST_BRW_CHECK_SIMPLE;
3602 fprintf(stderr, "Unknow flag %s\n", tok);
3606 } else if (strcasestr(argv[i], "size=") == argv[i] ||
3607 strcasestr(argv[i], "s=") == argv[i]) {
3608 tok = strchr(argv[i], '=') + 1;
/* base 0 lets strtol accept decimal, octal (leading 0) and hex (leading 0x) */
3610 bulk->blk_size = strtol(tok, &end, 0);
3611 if (bulk->blk_size <= 0) {
3612 fprintf(stderr, "Invalid size %s\n", tok);
/* optional unit suffix directly after the number */
3619 if (*end == 'k' || *end == 'K')
3620 bulk->blk_size *= 1024;
3621 else if (*end == 'm' || *end == 'M')
3622 bulk->blk_size *= 1024 * 1024;
3624 if (bulk->blk_size > LNET_MTU) {
3625 fprintf(stderr, "Size exceed limitation: %d bytes\n",
3630 } else if (strcasestr(argv[i], "off=") == argv[i]) {
3633 tok = strchr(argv[i], '=') + 1;
3635 off = strtol(tok, &end, 0);
3636 /* NB: align with sizeof(__u64) to simplify page
3637 * checking implementation */
3638 if (off < 0 || off % sizeof(__u64) != 0) {
3640 "Invalid offset %s/%d, it should be "
3641 "postive value and multiple of %d\n",
3642 tok, off, (int)sizeof(__u64));
3646 /* NB: blk_srv_off is reserved so far */
3647 bulk->blk_cli_off = bulk->blk_srv_off = off;
3651 } else if (strcasecmp(argv[i], "read") == 0 ||
3652 strcasecmp(argv[i], "r") == 0) {
3653 bulk->blk_opc = LST_BRW_READ;
3655 } else if (strcasecmp(argv[i], "write") == 0 ||
3656 strcasecmp(argv[i], "w") == 0) {
3657 bulk->blk_opc = LST_BRW_WRITE;
3660 fprintf(stderr, "Unknow parameter: %s\n", argv[i]);
/*
 * Build the parameter blob for the test named @test.
 *
 * The name is mapped to a test type with lst_test_name2type().  Depending on
 * the type, a zero-filled struct lst_test_ping_param or
 * struct lst_test_bulk_param is allocated with malloc(); the bulk variant is
 * then filled in by lst_get_bulk_param() from argv.  The size of the
 * allocated structure is stored in *plen.
 *
 * NOTE(review): the branch structure, the assignment to *param, the cleanup
 * on failure and the return values are not visible in this excerpt.  The
 * visible caller stores the result in a variable named "type" -- confirm the
 * failure convention against the full function.
 */
3671 lst_get_test_param(char *test, int argc, char **argv, void **param, int *plen)
3673 struct lst_test_bulk_param *bulk = NULL;
3674 struct lst_test_ping_param *ping = NULL;
/* translate the textual test name into its numeric type */
3677 type = lst_test_name2type(test);
3679 fprintf(stderr, "Unknow test name %s\n", test);
3685 /* unused, but needed by the kernel part */
3686 ping = malloc(sizeof(*ping));
3688 fprintf(stderr, "Out of memory\n");
3691 memset(ping, 0, sizeof(*ping));
3694 *plen = sizeof(*ping);
3699 bulk = malloc(sizeof(*bulk));
3701 fprintf(stderr, "Out of memory\n");
3705 memset(bulk, 0, sizeof(*bulk));
/* parse the bulk options from the command line into the zeroed struct */
3707 if (lst_get_bulk_param(argc, argv, bulk) != 0) {
3713 *plen = sizeof(*bulk);
3721 /* TODO: parse more parameters */
/*
 * Issue the LSTIO_TEST_ADD ioctl.
 *
 * Copies the arguments into a zero-initialised struct lstio_test_args --
 * batch name, test type, loop count, concurrency, distribution/span, source
 * and destination group names (each with its strlen()), the test parameter
 * blob with its length, and the result pointers @retp / @resultp -- and
 * passes it to lst_ioctl().  The session is identified by the file-scope
 * session_key.  Returns whatever lst_ioctl() returns.
 *
 * @batch, @sgrp and @dgrp must be valid NUL-terminated strings, since
 * strlen() is applied to each of them.
 */
3726 lst_add_test_ioctl(char *batch, int type, int loop, int concur,
3727 int dist, int span, char *sgrp, char *dgrp,
3728 void *param, int plen, int *retp, struct list_head *resultp)
3730 struct lstio_test_args args = { 0 };
3732 args.lstio_tes_key = session_key;
3733 args.lstio_tes_bat_nmlen = strlen(batch);
3734 args.lstio_tes_bat_name = batch;
3735 args.lstio_tes_type = type;
/* always passed as 0 from this tool */
3736 args.lstio_tes_oneside = 0;
3737 args.lstio_tes_loop = loop;
3738 args.lstio_tes_concur = concur;
3739 args.lstio_tes_dist = dist;
3740 args.lstio_tes_span = span;
3741 args.lstio_tes_sgrp_nmlen = strlen(sgrp);
3742 args.lstio_tes_sgrp_name = sgrp;
3743 args.lstio_tes_dgrp_nmlen = strlen(dgrp);
3744 args.lstio_tes_dgrp_name = dgrp;
3745 args.lstio_tes_param_len = plen;
3746 args.lstio_tes_param = param;
3747 args.lstio_tes_retp = retp;
3748 args.lstio_tes_resultp = resultp;
3750 return lst_ioctl(LSTIO_TEST_ADD, &args, sizeof(args));
/*
 * Handler for the "add_test" command (see the lst_cmdlist entry).
 *
 * Visible flow:
 *  - refuse to run when session_key is 0 (LST_SESSION missing or invalid);
 *  - parse --batch/--concurrency/--distribute/--from/--to/--loop with
 *    getopt_long(), all of which take an argument;
 *  - require a test name plus both --from and --to, and a concurrency in
 *    the range 1..LST_MAX_CONCUR;
 *  - parse the distribution string and build the test parameter blob;
 *  - look up the node counts of both groups and allocate result entries for
 *    the larger of the two;
 *  - issue the add-test ioctl, report the outcome and free the result list.
 *
 * NOTE(review): local declarations, the option switch, the error paths and
 * the return value are not visible in this excerpt.
 */
3754 jt_lst_add_test(int argc, char **argv)
3756 struct list_head head;
3776 static const struct option add_test_opts[] = {
3777 { .name = "batch", .has_arg = required_argument, .val = 'b' },
3778 { .name = "concurrency", .has_arg = required_argument, .val = 'c' },
3779 { .name = "distribute", .has_arg = required_argument, .val = 'd' },
3780 { .name = "from", .has_arg = required_argument, .val = 'f' },
3781 { .name = "to", .has_arg = required_argument, .val = 't' },
3782 { .name = "loop", .has_arg = required_argument, .val = 'l' },
/* session_key is set from LST_SESSION in lst_initialize(); 0 means unset */
3785 if (session_key == 0) {
3787 "Can't find env LST_SESSION or value is not valid\n");
3792 c = getopt_long(argc, argv, "b:c:d:f:l:t:",
3793 add_test_opts, &optidx);
3795 /* Detect the end of the options. */
3804 concur = atoi(optarg);
3813 loop = atoi(optarg);
3819 lst_print_usage(argv[0]);
/* a test name must follow the options, and both groups are mandatory */
3824 if (optind == argc || from == NULL || to == NULL) {
3825 lst_print_usage(argv[0]);
3829 if (concur <= 0 || concur > LST_MAX_CONCUR) {
3830 fprintf(stderr, "Invalid concurrency of test: %d\n", concur);
/* presumably the fallback when no --batch was given -- condition not visible */
3835 batch = LST_DEFAULT_BATCH;
3838 rc = lst_parse_distribute(dstr, &dist, &span);
3840 fprintf(stderr, "Invalid distribution: %s\n", dstr);
/* first non-option argument is the test name */
3845 test = argv[optind++];
/* resolve the test type and build its parameter blob in param/plen */
3850 type = lst_get_test_param(test, argc, argv, &param, &plen);
3852 fprintf(stderr, "Failed to add test (%s)\n", test);
3856 INIT_LIST_HEAD(&head);
3858 rc = lst_get_node_count(LST_OPC_GROUP, from, &fcount, NULL);
3860 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
3861 from, strerror(errno));
3865 rc = lst_get_node_count(LST_OPC_GROUP, to, &tcount, NULL);
3867 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
3868 to, strerror(errno));
/* one result entry per node of the larger group */
3872 rc = lst_alloc_rpcent(&head, fcount > tcount ? fcount : tcount, 0);
3874 fprintf(stderr, "Out of memory\n");
3878 rc = lst_add_test_ioctl(batch, type, loop, concur,
3879 dist, span, from, to, param, plen, &ret, &head);
3882 fprintf(stdout, "Test was added successfully\n");
3884 fprintf(stdout, "Server group contains userland test "
3885 "nodes, old version of tcplnd can't accept "
3886 "connection request\n");
3893 lst_print_error("test", "Failed to add test: %s\n",
3898 lst_print_transerr(&head, "add test");
3900 lst_free_rpcent(&head);
/*
 * Command table passed to cfs_parser() from main().
 *
 * Each entry holds the sub-command name, the function that implements it,
 * a third field that is NULL for every command here, and the usage text for
 * that command.
 */
3908 static command_t lst_cmdlist[] = {
3909 {"new_session", jt_lst_new_session, NULL,
3910 "Usage: lst new_session [--timeout TIME] [--force] [NAME]" },
3911 {"end_session", jt_lst_end_session, NULL,
3912 "Usage: lst end_session" },
3913 {"show_session", jt_lst_show_session, NULL,
3914 "Usage: lst show_session" },
3915 {"ping", jt_lst_ping , NULL,
3916 "Usage: lst ping [--group NAME] [--batch NAME] [--session] [--nodes IDS]" },
3917 {"add_group", jt_lst_add_group, NULL,
3918 "Usage: lst add_group NAME IDs [IDs]..." },
3919 {"del_group", jt_lst_del_group, NULL,
3920 "Usage: lst del_group NAME" },
3921 {"update_group", jt_lst_update_group, NULL,
3922 "Usage: lst update_group NAME [--clean] [--refresh] [--remove IDs]" },
3923 {"list_group", jt_lst_list_group, NULL,
3924 "Usage: lst list_group [--active] [--busy] [--down] [--unknown] GROUP ..." },
3925 {"stat", jt_lst_stat, NULL,
3926 "Usage: lst stat [--bw] [--rate] [--read] [--write] [--max] [--min] [--avg] "
3927 " [--mbs] [--timeout #] [--delay #] [--count #] GROUP [GROUP]" },
3928 {"show_error", jt_lst_show_error, NULL,
3929 "Usage: lst show_error NAME | IDS ..." },
3930 {"add_batch", jt_lst_add_batch, NULL,
3931 "Usage: lst add_batch NAME" },
3932 {"run", jt_lst_start_batch, NULL,
3933 "Usage: lst run [--timeout TIME] [NAME]" },
3934 {"stop", jt_lst_stop_batch, NULL,
3935 "Usage: lst stop [--force] BATCH_NAME" },
3936 {"list_batch", jt_lst_list_batch, NULL,
3937 "Usage: lst list_batch NAME [--test ID] [--server]" },
3938 {"query", jt_lst_query_batch, NULL,
3939 "Usage: lst query [--test ID] [--server] [--timeout TIME] NAME" },
3940 {"add_test", jt_lst_add_test, NULL,
3941 "Usage: lst add_test [--batch BATCH] [--loop #] [--concurrency #] "
3942 " [--distribute #:#] [--from GROUP] [--to GROUP] TEST..." },
/*
 * Read the tool's configuration from the environment.
 *
 *  LST_FEATURES  parsed as a hexadecimal number into session_features; any
 *                bit outside LST_FEATS_MASK is reported as unsupported.
 *  LST_SESSION   converted with atoi() into session_key.
 *
 * NOTE(review): the handling of unset variables and the return values are
 * not visible in this excerpt.
 */
3947 lst_initialize(void)
3952 feats = getenv("LST_FEATURES");
/* base 16: the feature mask is given in hex */
3954 session_features = strtol(feats, NULL, 16);
/* reject feature bits this tool does not know about */
3956 if ((session_features & ~LST_FEATS_MASK) != 0) {
3958 "Unsupported session features %x, "
3959 "only support these features so far: %x\n",
3960 (session_features & ~LST_FEATS_MASK), LST_FEATS_MASK);
3964 key = getenv("LST_SESSION");
3971 session_key = atoi(key);
/*
 * Program entry point: initialise the tool from the environment, initialise
 * the lnetconfig library, then hand the command line to cfs_parser() with
 * the lst_cmdlist command table.
 * NOTE(review): the checks on each rc and the final return are not visible
 * in this excerpt.
 */
3976 int main(int argc, char **argv)
3982 rc = lst_initialize();
3986 rc = lustre_lnet_config_lib_init();
3990 rc = cfs_parser(argc, argv, lst_cmdlist);