Whamcloud - gitweb
LU-9399 llite: register mountpoint before process llog
[fs/lustre-release.git] / lnet / utils / lst.c
1 /*
2  * GPL HEADER START
3  *
4  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License version 2 only,
8  * as published by the Free Software Foundation.
9  *
10  * This program is distributed in the hope that it will be useful, but
11  * WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  * General Public License version 2 for more details (a copy is included
14  * in the LICENSE file that accompanied this code).
15  *
16  * You should have received a copy of the GNU General Public License
17  * version 2 along with this program; If not, see
18  * http://www.gnu.org/licenses/gpl-2.0.html
19  *
20  * GPL HEADER END
21  */
22 /*
23  * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
24  * Use is subject to license terms.
25  *
26  * Copyright (c) 2012, 2016, Intel Corporation.
27  */
28 /*
29  * This file is part of Lustre, http://www.lustre.org/
30  * Lustre is a trademark of Sun Microsystems, Inc.
31  *
32  * lnet/utils/lst.c
33  *
34  * Author: Liang Zhen <liangzhen@clusterfs.com>
35  */
36 #include <errno.h>
37 #include <getopt.h>
38 #include <inttypes.h>
39 #include <pwd.h>
40 #include <unistd.h>
41 #include <stdarg.h>
42 #include <stdio.h>
43 #include <stdlib.h>
44 #include <string.h>
45 #include <sys/ioctl.h>
46 #include <time.h>
47
48 #include <libcfs/util/list.h>
49 #include <libcfs/util/ioctl.h>
50 #include <libcfs/util/parser.h>
51 #include <lnet/lnetctl.h>
52 #include <lnet/lnetst.h>
53 #include <lnet/lnet.h>
54 #include <utils/obdctl.h>
55
56 struct lst_sid LST_INVALID_SID = { .ses_nid = LNET_NID_ANY, .ses_stamp = -1 };
57 static struct lst_sid session_id;
58 static int                 session_key;
59 static int lst_list_commands(int argc, char **argv);
60
61 /* All nodes running 2.6.50 or later understand feature LST_FEAT_BULK_LEN */
62 static unsigned         session_features = LST_FEATS_MASK;
63 static struct lstcon_trans_stat trans_stat;
64
/*
 * Singly linked list node that carries a string.
 *
 * Nodes are created by alloc_lstr(), which reserves lstr_sz bytes of
 * string storage directly behind the header.
 */
typedef struct list_string {
        struct list_string *lstr_next;  /* next node; NULL ends the list */
        int                 lstr_sz;    /* bytes reserved for lstr_str */
        char                lstr_str[]; /* C99 flexible array member */
} lstr_t;
70
/* Fallback for builds whose headers have not already defined offsetof(). */
#ifndef offsetof
# define offsetof(type, member) \
        ((unsigned long)((char *)&(((type *)0)->member)))
#endif

/* lstr_t accounting: number of live nodes and their total string bytes. */
static int alloc_count;
static int alloc_nob;
77
78 lstr_t *
79 alloc_lstr(int sz)
80 {
81         lstr_t  *lstr = malloc(offsetof(lstr_t, lstr_str[sz]));
82
83         if (lstr == NULL) {
84                 fprintf(stderr, "Can't allocate lstr\n");
85                 abort();
86         }
87
88         alloc_nob += sz;
89         alloc_count++;
90
91         lstr->lstr_str[0] = 0;
92         lstr->lstr_sz = sz;
93         return lstr;
94 }
95
96 void
97 free_lstr(lstr_t *lstr)
98 {
99         alloc_count--;
100         alloc_nob -= lstr->lstr_sz;
101         free(lstr);
102 }
103
104 void
105 free_lstrs(lstr_t **list)
106 {
107         lstr_t   *lstr;
108
109         while ((lstr = *list) != NULL) {
110                 *list = lstr->lstr_next;
111                 free_lstr(lstr);
112         }
113 }
114
115 void
116 new_lstrs(lstr_t **list, char *prefix, char *postfix,
117           int lo, int hi, int stride)
118 {
119         int    n1 = strlen(prefix);
120         int    n2 = strlen(postfix);
121         int    sz = n1 + 20 + n2 + 1;
122
123         do {
124                 lstr_t *n = alloc_lstr(sz);
125
126                 snprintf(n->lstr_str, sz - 1, "%s%u%s",
127                          prefix, lo, postfix);
128
129                 n->lstr_next = *list;
130                 *list = n;
131
132                 lo += stride;
133         } while (lo <= hi);
134 }
135
136 int
137 expand_lstr(lstr_t **list, lstr_t *l)
138 {
139         int          nob = strlen(l->lstr_str);
140         char        *b1;
141         char        *b2;
142         char        *expr;
143         char        *sep;
144         int          x;
145         int          y;
146         int          z;
147         int          n;
148
149         b1 = strchr(l->lstr_str, '[');
150         if (b1 == NULL) {
151                 l->lstr_next = *list;
152                 *list = l;
153                 return 0;
154         }
155
156         b2 = strchr(b1, ']');
157         if (b2 == NULL || b2 == b1 + 1)
158                 return -1;
159
160         *b1++ = 0;
161         *b2++ = 0;
162         expr = b1;
163         do {
164
165                 sep = strchr(expr, ',');
166                 if (sep != NULL)
167                         *sep++ = 0;
168
169                 nob = strlen(expr);
170                 n = nob;
171                 if (sscanf(expr, "%u%n", &x, &n) >= 1 && n == nob) {
172                         /* simple number */
173                         new_lstrs(list, l->lstr_str, b2, x, x, 1);
174                         continue;
175                 }
176
177                 n = nob;
178                 if (sscanf(expr, "%u-%u%n", &x, &y, &n) >= 2 && n == nob &&
179                     x < y) {
180                         /* simple range */
181                         new_lstrs(list, l->lstr_str, b2, x, y, 1);
182                         continue;
183                 }
184
185                 n = nob;
186                 if (sscanf(expr, "%u-%u/%u%n", &x, &y, &z, &n) >= 3 && n == nob &&
187                     x < y) {
188                         /* strided range */
189                         new_lstrs(list, l->lstr_str, b2, x, y, z);
190                         continue;
191                 }
192
193                 /* syntax error */
194                 return -1;
195         } while ((expr = sep) != NULL);
196
197         free_lstr(l);
198
199         return 1;
200 }
201
202 int
203 expand_strs(char *str, lstr_t **head)
204 {
205         lstr_t  *list = NULL;
206         lstr_t  *nlist;
207         lstr_t  *l;
208         int      rc = 0;
209         int      expanded;
210
211         l = alloc_lstr(strlen(str) + 1);
212         memcpy(l->lstr_str, str, strlen(str) + 1);
213         l->lstr_next = NULL;
214         list = l;
215
216         do {
217                 expanded = 0;
218                 nlist = NULL;
219
220                 while ((l = list) != NULL) {
221                         list = l->lstr_next;
222
223                         rc = expand_lstr(&nlist, l);
224                         if (rc < 0) {
225                                 fprintf(stderr, "Syntax error in \"%s\"\n", str);
226                                 free_lstr(l);
227                                 break;
228                         }
229
230                         expanded |= rc > 0;
231                 }
232
233                 /* re-order onto 'list' */
234                 while ((l = nlist) != NULL) {
235                         nlist = l->lstr_next;
236                         l->lstr_next = list;
237                         list = l;
238                 }
239
240         } while (expanded && rc > 0);
241
242         if (rc >= 0) {
243                 *head = list;
244                 return 0;
245         }
246
247         while ((l = list) != NULL) {
248                 list = l->lstr_next;
249
250                 free_lstr(l);
251         }
252         return rc;
253 }
254
255 int
256 lst_parse_nids(char *str, int *countp, struct lnet_process_id **idspp)
257 {
258         lstr_t  *head = NULL;
259         lstr_t  *l;
260         int      c = 0;
261         int      i;
262         int      rc;
263
264         rc = expand_strs(str, &head);
265         if (rc != 0)
266                 goto out;
267
268         l = head;
269         while (l != NULL) {
270                 l = l->lstr_next;
271                 c++;
272         }
273
274         *idspp = malloc(c * sizeof(struct lnet_process_id));
275         if (*idspp == NULL) {
276                 fprintf(stderr, "Out of memory\n");
277                 rc = -1;
278         }
279
280         *countp = c;
281 out:
282         i = 0;
283         while ((l = head) != NULL) {
284                 head = l->lstr_next;
285
286                 if (rc == 0) {
287                         (*idspp)[i].nid = libcfs_str2nid(l->lstr_str);
288                         if ((*idspp)[i].nid == LNET_NID_ANY) {
289                                 fprintf(stderr, "Invalid nid: %s\n",
290                                         l->lstr_str);
291                                 rc = -1;
292                         }
293
294                         (*idspp)[i].pid = LNET_PID_LUSTRE;
295                         i++;
296                 }
297
298                 free_lstr(l);
299         }
300
301         if (rc == 0)
302                 return 0;
303
304         free(*idspp);
305         *idspp = NULL;
306
307         return rc;
308 }
309
310 char *
311 lst_node_state2str(int state)
312 {
313         if (state == LST_NODE_ACTIVE)
314                 return "Active";
315         if (state == LST_NODE_BUSY)
316                 return "Busy";
317         if (state == LST_NODE_DOWN)
318                 return "Down";
319
320         return "Unknown";
321 }
322
323 int
324 lst_node_str2state(char *str)
325 {
326         if (strcasecmp(str, "active") == 0)
327                 return LST_NODE_ACTIVE;
328         if (strcasecmp(str, "busy") == 0)
329                 return LST_NODE_BUSY;
330         if (strcasecmp(str, "down") == 0)
331                 return LST_NODE_DOWN;
332         if (strcasecmp(str, "unknown") == 0)
333                 return LST_NODE_UNKNOWN;
334         if (strcasecmp(str, "invalid") == 0)
335                 return (LST_NODE_UNKNOWN | LST_NODE_DOWN | LST_NODE_BUSY);
336
337         return -1;
338 }
339
340 char *
341 lst_test_type2name(int type)
342 {
343         if (type == LST_TEST_PING)
344                 return "ping";
345         if (type == LST_TEST_BULK)
346                 return "brw";
347
348         return "unknown";
349 }
350
351 int
352 lst_test_name2type(char *name)
353 {
354         if (strcasecmp(name, "ping") == 0)
355                 return LST_TEST_PING;
356         if (strcasecmp(name, "brw") == 0)
357                 return LST_TEST_BULK;
358
359         return -1;
360 }
361
/* Show the help text for command 'cmd' via Parser_printhelp(). */
void lst_print_usage(char *cmd)
{
        Parser_printhelp(cmd);
}
367
/*
 * Report a failure on stderr based on the current value of errno.
 *
 * A handful of errno values have fixed messages ('sub' names the object
 * for ENOENT and EEXIST).  For every other value the caller's printf
 * style 'def_format' and its arguments are printed instead.
 */
void
lst_print_error(char *sub, const char *def_format, ...)
{
        int     err = errno;    /* local error returned from kernel */
        va_list args;

        if (err == ESRCH) {
                fprintf(stderr, "No session exists\n");
        } else if (err == ESHUTDOWN) {
                fprintf(stderr, "Session is shutting down\n");
        } else if (err == EACCES) {
                fprintf(stderr, "Unmatched session key or not root\n");
        } else if (err == ENOENT) {
                fprintf(stderr, "Can't find %s in current session\n", sub);
        } else if (err == EINVAL) {
                fprintf(stderr, "Invalid parameters list in command line\n");
        } else if (err == EFAULT) {
                fprintf(stderr, "Bad parameter address\n");
        } else if (err == EEXIST) {
                fprintf(stderr, "%s already exists\n", sub);
        } else {
                va_start(args, def_format);
                vfprintf(stderr, def_format, args);
                va_end(args);
        }
}
404
405 void
406 lst_free_rpcent(struct list_head *head)
407 {
408         struct lstcon_rpc_ent *ent;
409
410         while (!list_empty(head)) {
411                 ent = list_entry(head->next, struct lstcon_rpc_ent, rpe_link);
412
413                 list_del(&ent->rpe_link);
414                 free(ent);
415         }
416 }
417
418 void
419 lst_reset_rpcent(struct list_head *head)
420 {
421         struct lstcon_rpc_ent *ent;
422
423         list_for_each_entry(ent, head, rpe_link) {
424                 ent->rpe_sid       = LST_INVALID_SID;
425                 ent->rpe_peer.nid  = LNET_NID_ANY;
426                 ent->rpe_peer.pid  = LNET_PID_ANY;
427                 ent->rpe_rpc_errno = ent->rpe_fwk_errno = 0;
428         }
429 }
430
431 int
432 lst_alloc_rpcent(struct list_head *head, int count, int offset)
433 {
434         struct lstcon_rpc_ent *ent;
435         int               i;
436
437         for (i = 0; i < count; i++) {
438                 ent = malloc(offsetof(struct lstcon_rpc_ent, rpe_payload[offset]));
439                 if (ent == NULL) {
440                         lst_free_rpcent(head);
441                         return -1;
442                 }
443
444                 memset(ent, 0, offsetof(struct lstcon_rpc_ent, rpe_payload[offset]));
445
446                 ent->rpe_sid      = LST_INVALID_SID;
447                 ent->rpe_peer.nid = LNET_NID_ANY;
448                 ent->rpe_peer.pid = LNET_PID_ANY;
449                 list_add(&ent->rpe_link, head);
450         }
451
452         return 0;
453 }
454
455 void
456 lst_print_transerr(struct list_head *head, char *optstr)
457 {
458         struct lstcon_rpc_ent *ent;
459
460         list_for_each_entry(ent, head, rpe_link) {
461                 if (ent->rpe_rpc_errno == 0 && ent->rpe_fwk_errno == 0)
462                         continue;
463
464                 if (ent->rpe_rpc_errno != 0) {
465                         fprintf(stderr, "%s RPC failed on %s: %s\n",
466                                 optstr, libcfs_id2str(ent->rpe_peer),
467                                 strerror(ent->rpe_rpc_errno));
468                         continue;
469                 }
470
471                 fprintf(stderr, "operation %s failed on %s: %s\n",
472                         optstr, libcfs_id2str(ent->rpe_peer),
473                         strerror(ent->rpe_fwk_errno));
474         }
475 }
476
/* Prototypes for ioctl helpers whose definitions are not above this point. */
int lst_info_batch_ioctl(char *batch, int test, int server,
                         struct lstcon_test_batch_ent *entp,
                         int *idxp, int *ndentp,
                         struct lstcon_node_ent *dentsp);

int lst_info_group_ioctl(char *name,
                         struct lstcon_ndlist_ent *gent,
                         int *idx, int *count,
                         struct lstcon_node_ent *dents);

int lst_query_batch_ioctl(char *batch, int test, int server, int timeout,
                          struct list_head *head);
486
487 int
488 lst_ioctl(unsigned int opc, void *buf, int len)
489 {
490         struct libcfs_ioctl_data data;
491         int    rc;
492
493         LIBCFS_IOC_INIT (data);
494         data.ioc_u32[0]  = opc;
495         data.ioc_plen1   = len;
496         data.ioc_pbuf1   = (char *)buf;
497         data.ioc_plen2   = sizeof(trans_stat);
498         data.ioc_pbuf2   = (char *)&trans_stat;
499
500         memset(&trans_stat, 0, sizeof(trans_stat));
501
502         rc = l_ioctl(LNET_DEV_ID, IOC_LIBCFS_LNETST, &data);
503
504         /* local error, no valid RPC result */
505         if (rc != 0)
506                 return -1;
507
508         /* RPC error */
509         if (trans_stat.trs_rpc_errno != 0)
510                 return -2;
511
512         /* Framework error */
513         if (trans_stat.trs_fwk_errno != 0)
514                 return -3;
515
516         return 0;
517 }
518
519 int
520 lst_new_session_ioctl(char *name, int timeout, int force, struct lst_sid *sid)
521 {
522         struct lstio_session_new_args args = { 0 };
523
524         args.lstio_ses_key     = session_key;
525         args.lstio_ses_timeout = timeout;
526         args.lstio_ses_force   = force;
527         args.lstio_ses_idp     = sid;
528         args.lstio_ses_feats   = session_features;
529         args.lstio_ses_nmlen   = strlen(name);
530         args.lstio_ses_namep   = name;
531
532         return lst_ioctl (LSTIO_SESSION_NEW, &args, sizeof(args));
533 }
534
535 int
536 jt_lst_new_session(int argc, char **argv)
537 {
538         char  buf[LST_NAME_SIZE];
539         char *name;
540         int   optidx = 0;
541         int   timeout = 300;
542         int   force = 0;
543         int   c;
544         int   rc;
545
546         static const struct option session_opts[] = {
547                 { .name = "timeout", .has_arg = required_argument, .val = 't' },
548                 { .name = "force",   .has_arg = no_argument,       .val = 'f' },
549                 { .name = NULL } };
550
551         if (session_key == 0) {
552                 fprintf(stderr,
553                         "Can't find env LST_SESSION or value is not valid\n");
554                 return -1;
555         }
556
557         while (1) {
558
559                 c = getopt_long(argc, argv, "ft:",
560                                 session_opts, &optidx);
561
562                 if (c == -1)
563                         break;
564
565                 switch (c) {
566                 case 'f':
567                         force = 1;
568                         break;
569                 case 't':
570                         timeout = atoi(optarg);
571                         break;
572                 default:
573                         lst_print_usage(argv[0]);
574                         return -1;
575                 }
576         }
577
578         if (timeout <= 0) {
579                 fprintf(stderr, "Invalid timeout value\n");
580                 return -1;
581         }
582
583         if (optind == argc - 1) {
584                 name = argv[optind ++];
585                 if (strlen(name) >= LST_NAME_SIZE) {
586                         fprintf(stderr, "Name size is limited to %d\n",
587                                 LST_NAME_SIZE - 1);
588                         return -1;
589                 }
590
591         } else if (optind == argc) {
592                 char           user[LST_NAME_SIZE];
593                 char           host[LST_NAME_SIZE];
594                 struct passwd *pw = getpwuid(getuid());
595
596                 if (pw == NULL)
597                         snprintf(user, sizeof(user), "%d", (int)getuid());
598                 else
599                         snprintf(user, sizeof(user), "%s", pw->pw_name);
600
601                 rc = gethostname(host, sizeof(host));
602                 if (rc != 0)
603                         snprintf(host, sizeof(host), "unknown_host");
604
605                 snprintf(buf, sizeof(buf), "%s@%s", user, host);
606                 name = buf;
607
608         } else {
609                 lst_print_usage(argv[0]);
610                 return -1;
611         }
612
613         rc = lst_new_session_ioctl(name, timeout, force, &session_id);
614         if (rc != 0) {
615                 lst_print_error("session", "Failed to create session: %s\n",
616                                 strerror(errno));
617                 return rc;
618         }
619
620         fprintf(stdout, "SESSION: %s FEATURES: %x TIMEOUT: %d FORCE: %s\n",
621                 name, session_features, timeout, force ? "Yes" : "No");
622         return 0;
623 }
624
625 int
626 lst_session_info_ioctl(char *name, int len, int *key, unsigned *featp,
627                        struct lst_sid *sid, struct lstcon_ndlist_ent *ndinfo)
628 {
629         struct lstio_session_info_args args = { 0 };
630
631         args.lstio_ses_idp     = sid;
632         args.lstio_ses_keyp    = key;
633         args.lstio_ses_featp   = featp;
634         args.lstio_ses_ndinfo  = ndinfo;
635         args.lstio_ses_nmlen   = len;
636         args.lstio_ses_namep   = name;
637
638         return lst_ioctl(LSTIO_SESSION_INFO, &args, sizeof(args));
639 }
640
641 int
642 jt_lst_show_session(int argc, char **argv)
643 {
644         struct lstcon_ndlist_ent ndinfo;
645         struct lst_sid sid;
646         char                name[LST_NAME_SIZE];
647         unsigned            feats;
648         int                 key;
649         int                 rc;
650
651         rc = lst_session_info_ioctl(name, sizeof(name), &key,
652                                     &feats, &sid, &ndinfo);
653
654         if (rc != 0) {
655                 lst_print_error("session", "Failed to show session: %s\n",
656                                 strerror(errno));
657                 return -1;
658         }
659
660         fprintf(stdout, "%s ID: %ju@%s, KEY: %d FEATURES: %x NODES: %d\n",
661                 name, (uintmax_t)sid.ses_stamp, libcfs_nid2str(sid.ses_nid),
662                 key, feats, ndinfo.nle_nnode);
663
664         return 0;
665 }
666
667 int
668 lst_end_session_ioctl(void)
669 {
670         struct lstio_session_end_args args = { 0 };
671
672         args.lstio_ses_key = session_key;
673         return lst_ioctl(LSTIO_SESSION_END, &args, sizeof(args));
674 }
675
676 int
677 jt_lst_end_session(int argc, char **argv)
678 {
679         int             rc;
680
681         if (session_key == 0) {
682                 fprintf(stderr,
683                         "Can't find env LST_SESSION or value is not valid\n");
684                 return -1;
685         }
686
687         rc = lst_end_session_ioctl();
688
689         if (rc == 0) {
690                 fprintf(stdout, "session is ended\n");
691                 return 0;
692         }
693
694         if (rc == -1) {
695                 lst_print_error("session", "Failed to end session: %s\n",
696                                 strerror(errno));
697                 return rc;
698         }
699
700         if (trans_stat.trs_rpc_errno != 0) {
701                 fprintf(stderr,
702                         "[RPC] Failed to send %d session RPCs: %s\n",
703                         lstcon_rpc_stat_failure(&trans_stat, 0),
704                         strerror(trans_stat.trs_rpc_errno));
705         }
706
707         if (trans_stat.trs_fwk_errno != 0) {
708                 fprintf(stderr,
709                         "[FWK] Failed to end session on %d nodes: %s\n",
710                         lstcon_sesop_stat_failure(&trans_stat, 0),
711                         strerror(trans_stat.trs_fwk_errno));
712         }
713
714         return rc;
715 }
716
717 int
718 lst_ping_ioctl(char *str, int type, int timeout,
719                int count, struct lnet_process_id *ids, struct list_head *head)
720 {
721         struct lstio_debug_args args = { 0 };
722
723         args.lstio_dbg_key     = session_key;
724         args.lstio_dbg_type    = type;
725         args.lstio_dbg_flags   = 0;
726         args.lstio_dbg_timeout = timeout;
727         args.lstio_dbg_nmlen   = (str == NULL) ? 0: strlen(str);
728         args.lstio_dbg_namep   = str;
729         args.lstio_dbg_count   = count;
730         args.lstio_dbg_idsp    = ids;
731         args.lstio_dbg_resultp = head;
732
733         return lst_ioctl (LSTIO_DEBUG, &args, sizeof(args));
734 }
735
736 int
737 lst_get_node_count(int type, char *str, int *countp,
738                    struct lnet_process_id **idspp)
739 {
740         char                    buf[LST_NAME_SIZE];
741         struct lstcon_test_batch_ent ent;
742         struct lstcon_ndlist_ent    *entp = &ent.tbe_cli_nle;
743         struct lst_sid sid;
744         unsigned                feats;
745         int                     key;
746         int                     rc;
747
748         switch (type) {
749         case LST_OPC_SESSION:
750                 rc = lst_session_info_ioctl(buf, LST_NAME_SIZE,
751                                             &key, &feats, &sid, entp);
752                 break;
753
754         case LST_OPC_BATCHSRV:
755                 entp = &ent.tbe_srv_nle;
756         case LST_OPC_BATCHCLI:
757                 rc = lst_info_batch_ioctl(str, 0, 0, &ent, NULL, NULL, NULL);
758                 break;
759
760         case LST_OPC_GROUP:
761                 rc = lst_info_group_ioctl(str, entp, NULL, NULL, NULL);
762                 break;
763
764         case LST_OPC_NODES:
765                 rc = lst_parse_nids(str, &entp->nle_nnode, idspp) < 0 ? -1 : 0;
766                 break;
767
768         default:
769                 rc = -1;
770                 break;
771         }
772
773         if (rc == 0)
774                 *countp = entp->nle_nnode;
775
776         return rc;
777 }
778
779 int
780 jt_lst_ping(int argc,  char **argv)
781 {
782         struct list_head   head;
783         struct lnet_process_id *ids = NULL;
784         struct lstcon_rpc_ent  *ent = NULL;
785         char              *str = NULL;
786         int                optidx  = 0;
787         int                server  = 0;
788         int                timeout = 5;
789         int                count   = 0;
790         int                type    = 0;
791         int                rc      = 0;
792         int                c;
793
794         static const struct option ping_opts[] = {
795                 { .name = "session", .has_arg = no_argument,       .val = 's' },
796                 { .name = "server",  .has_arg = no_argument,       .val = 'v' },
797                 { .name = "batch",   .has_arg = required_argument, .val = 'b' },
798                 { .name = "group",   .has_arg = required_argument, .val = 'g' },
799                 { .name = "nodes",   .has_arg = required_argument, .val = 'n' },
800                 { .name = "timeout", .has_arg = required_argument, .val = 't' },
801                 { .name = NULL, } };
802
803         if (session_key == 0) {
804                 fprintf(stderr,
805                         "Can't find env LST_SESSION or value is not valid\n");
806                 return -1;
807         }
808
809         while (1) {
810
811                 c = getopt_long(argc, argv, "g:b:n:t:sv",
812                                 ping_opts, &optidx);
813
814                 if (c == -1)
815                         break;
816
817                 switch (c) {
818                 case 's':
819                         type = LST_OPC_SESSION;
820                         break;
821
822                 case 'g':
823                         type = LST_OPC_GROUP;
824                         str = optarg;
825                         break;
826
827                 case 'b':
828                         type = LST_OPC_BATCHCLI;
829                         str = optarg;
830                         break;
831
832                 case 'n':
833                         type = LST_OPC_NODES;
834                         str = optarg;
835                         break;
836
837                 case 't':
838                         timeout = atoi(optarg);
839                         break;
840
841                 case 'v':
842                         server = 1;
843                         break;
844
845                 default:
846                         lst_print_usage(argv[0]);
847                         return -1;
848                 }
849         }
850
851         if (type == 0 || timeout <= 0 || optind != argc) {
852                 lst_print_usage(argv[0]);
853                 return -1;
854         }
855
856         if (type == LST_OPC_BATCHCLI && server)
857                 type = LST_OPC_BATCHSRV;
858
859         rc = lst_get_node_count(type, str, &count, &ids);
860         if (rc < 0) {
861                 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
862                         (str == NULL) ? "session" : str, strerror(errno));
863                 return -1;
864         }
865
866         INIT_LIST_HEAD(&head);
867
868         rc = lst_alloc_rpcent(&head, count, LST_NAME_SIZE);
869         if (rc != 0) {
870                 fprintf(stderr, "Out of memory\n");
871                 goto out;
872         }
873
874         if (count == 0) {
875                 fprintf(stdout, "Target %s is empty\n",
876                         (str == NULL) ? "session" : str);
877                 goto out;
878         }
879
880         rc = lst_ping_ioctl(str, type, timeout, count, ids, &head);
881         if (rc == -1) { /* local failure */
882                 lst_print_error("debug", "Failed to ping %s: %s\n",
883                                 (str == NULL) ? "session" : str,
884                                 strerror(errno));
885                 rc = -1;
886                 goto out;
887         }
888
889         /* ignore RPC errors and framwork errors */
890         list_for_each_entry(ent, &head, rpe_link) {
891                 fprintf(stdout, "\t%s: %s [session: %s id: %s]\n",
892                         libcfs_id2str(ent->rpe_peer),
893                         lst_node_state2str(ent->rpe_state),
894                         (ent->rpe_state == LST_NODE_ACTIVE ||
895                          ent->rpe_state == LST_NODE_BUSY) ?
896                                 (ent->rpe_rpc_errno == 0 ?
897                                         &ent->rpe_payload[0] : "Unknown") :
898                                 "<NULL>", libcfs_nid2str(ent->rpe_sid.ses_nid));
899         }
900
901 out:
902         lst_free_rpcent(&head);
903
904         if (ids != NULL)
905                 free(ids);
906
907         return rc;
908
909 }
910
911 int
912 lst_add_nodes_ioctl(char *name, int count, struct lnet_process_id *ids,
913                     unsigned *featp, struct list_head *resultp)
914 {
915         struct lstio_group_nodes_args args = { 0 };
916
917         args.lstio_grp_key     = session_key;
918         args.lstio_grp_nmlen   = strlen(name);
919         args.lstio_grp_namep   = name;
920         args.lstio_grp_count   = count;
921         args.lstio_grp_featp   = featp;
922         args.lstio_grp_idsp    = ids;
923         args.lstio_grp_resultp = resultp;
924
925         return lst_ioctl(LSTIO_NODES_ADD, &args, sizeof(args));
926 }
927
928 int
929 lst_del_group_ioctl(char *name)
930 {
931         struct lstio_group_del_args args = { 0 };
932
933         args.lstio_grp_key   = session_key;
934         args.lstio_grp_nmlen = strlen(name);
935         args.lstio_grp_namep = name;
936
937         return lst_ioctl(LSTIO_GROUP_DEL, &args, sizeof(args));
938 }
939
940 int
941 lst_del_group(char *grp_name)
942 {
943         int     rc;
944
945         rc = lst_del_group_ioctl(grp_name);
946         if (rc == 0) {
947                 fprintf(stdout, "Group is deleted\n");
948                 return 0;
949         }
950
951         if (rc == -1) {
952                 lst_print_error("group", "Failed to delete group: %s\n",
953                                 strerror(errno));
954                 return rc;
955         }
956
957         fprintf(stderr, "Group is deleted with some errors\n");
958
959         if (trans_stat.trs_rpc_errno != 0) {
960                 fprintf(stderr,
961                         "[RPC] Failed to send %d end session RPCs: %s\n",
962                         lstcon_rpc_stat_failure(&trans_stat, 0),
963                         strerror(trans_stat.trs_rpc_errno));
964         }
965
966         if (trans_stat.trs_fwk_errno != 0) {
967                 fprintf(stderr,
968                         "[FWK] Failed to end session on %d nodes: %s\n",
969                 lstcon_sesop_stat_failure(&trans_stat, 0),
970                 strerror(trans_stat.trs_fwk_errno));
971         }
972
973         return -1;
974 }
975
976 int
977 lst_add_group_ioctl(char *name)
978 {
979         struct lstio_group_add_args args = { 0 };
980
981         args.lstio_grp_key     =  session_key;
982         args.lstio_grp_nmlen   =  strlen(name);
983         args.lstio_grp_namep   =  name;
984
985         return lst_ioctl(LSTIO_GROUP_ADD, &args, sizeof(args));
986 }
987
988 int
989 jt_lst_add_group(int argc, char **argv)
990 {
991         struct list_head   head;
992         struct lnet_process_id *ids;
993         char              *name;
994         unsigned           feats = session_features;
995         int                count;
996         int                rc;
997         int                i;
998         bool               nodes_added = false;
999
1000         if (session_key == 0) {
1001                 fprintf(stderr,
1002                         "Can't find env LST_SESSION or value is not valid\n");
1003                 return -1;
1004         }
1005
1006         if (argc < 3) {
1007                 lst_print_usage(argv[0]);
1008                 return -1;
1009         }
1010
1011         name = argv[1];
1012         if (strlen(name) >= LST_NAME_SIZE) {
1013                 fprintf(stderr, "Name length is limited to %d\n",
1014                         LST_NAME_SIZE - 1);
1015                 return -1;
1016         }
1017
1018         rc = lst_add_group_ioctl(name);
1019         if (rc != 0) {
1020                 lst_print_error("group", "Failed to add group %s: %s\n",
1021                                 name, strerror(errno));
1022                 return -1;
1023         }
1024
1025         INIT_LIST_HEAD(&head);
1026
1027         for (i = 2; i < argc; i++) {
1028                 /* parse address list */
1029                 rc = lst_parse_nids(argv[i], &count, &ids);
1030                 if (rc < 0) {
1031                         fprintf(stderr, "Ignore invalid id list %s\n",
1032                                 argv[i]);
1033                         continue;
1034                 }
1035
1036                 if (count == 0)
1037                         continue;
1038
1039                 rc = lst_alloc_rpcent(&head, count, 0);
1040                 if (rc != 0) {
1041                         fprintf(stderr, "Out of memory\n");
1042                         free(ids);
1043                         rc = -1;
1044                         goto failed;
1045                 }
1046
1047                 rc = lst_add_nodes_ioctl(name, count, ids, &feats, &head);
1048
1049                 free(ids);
1050
1051                 if (rc != 0)
1052                         goto failed;
1053
1054                 fprintf(stdout, "%s are added to session\n", argv[i]);
1055
1056                 nodes_added = true;
1057
1058                 if ((feats & session_features) != session_features) {
1059                         fprintf(stdout,
1060                                 "Warning, this session will run with "
1061                                 "compatible mode because some test nodes "
1062                                 "might not understand these features: %x\n",
1063                                 (~feats & session_features));
1064                 }
1065
1066                 lst_free_rpcent(&head);
1067         }
1068
1069         if (!nodes_added) {
1070                 /*
1071                  * The selftest kernel module expects that a group should
1072                  * have at least one node, since it doesn't make sense for
1073                  * an empty group to be added to a test.
1074                  */
1075                 fprintf(stderr,
1076                         "No nodes added successfully, deleting group %s\n",
1077                         name);
1078                 rc = lst_del_group(name);
1079                 if (rc != 0) {
1080                         fprintf(stderr,
1081                                 "Failed to delete group %s."
1082                                 "  Group is empty.\n", name);
1083                 }
1084         }
1085
1086         return rc;
1087
1088 failed:
1089         if (rc == -1) {
1090                 lst_print_error("group", "Failed to add nodes %s: %s\n",
1091                                 argv[i], strerror(errno));
1092
1093         } else {
1094                 if (trans_stat.trs_fwk_errno == EPROTO) {
1095                         fprintf(stderr,
1096                                 "test nodes might have different LST "
1097                                 "features, please disable some features by "
1098                                 "setting LST_FEATURES\n");
1099                 }
1100
1101                 lst_print_transerr(&head, "create session");
1102         }
1103
1104         lst_free_rpcent(&head);
1105
1106         if (!nodes_added) {
1107                 fprintf(stderr,
1108                         "No nodes added successfully, deleting group %s\n",
1109                         name);
1110                 if (lst_del_group(name) != 0) {
1111                         fprintf(stderr,
1112                                 "Failed to delete group %s."
1113                                 "  Group is empty.\n", name);
1114                 }
1115         }
1116
1117         return rc;
1118 }
1119
1120 int
1121 jt_lst_del_group(int argc, char **argv)
1122 {
1123         int     rc;
1124
1125         if (session_key == 0) {
1126                 fprintf(stderr,
1127                         "Can't find env LST_SESSION or value is not valid\n");
1128                 return -1;
1129         }
1130
1131         if (argc != 2) {
1132                 lst_print_usage(argv[0]);
1133                 return -1;
1134         }
1135
1136         rc = lst_del_group(argv[1]);
1137
1138         return rc;
1139 }
1140
1141 int
1142 lst_update_group_ioctl(int opc, char *name, int clean, int count,
1143                        struct lnet_process_id *ids, struct list_head *resultp)
1144 {
1145         struct lstio_group_update_args args = { 0 };
1146
1147         args.lstio_grp_key      = session_key;
1148         args.lstio_grp_opc      = opc;
1149         args.lstio_grp_args     = clean;
1150         args.lstio_grp_nmlen    = strlen(name);
1151         args.lstio_grp_namep    = name;
1152         args.lstio_grp_count    = count;
1153         args.lstio_grp_idsp     = ids;
1154         args.lstio_grp_resultp  = resultp;
1155
1156         return lst_ioctl(LSTIO_GROUP_UPDATE, &args, sizeof(args));
1157 }
1158
1159 int
1160 jt_lst_update_group(int argc, char **argv)
1161 {
1162         struct list_head   head;
1163         struct lnet_process_id *ids = NULL;
1164         char              *str = NULL;
1165         char              *grp = NULL;
1166         int                optidx = 0;
1167         int                count = 0;
1168         int                clean = 0;
1169         int                opc = 0;
1170         int                rc;
1171         int                c;
1172
1173         static const struct option update_group_opts[] = {
1174                 { .name = "refresh", .has_arg = no_argument,       .val = 'f' },
1175                 { .name = "clean",   .has_arg = required_argument, .val = 'c' },
1176                 { .name = "remove",  .has_arg = required_argument, .val = 'r' },
1177                 { .name = NULL } };
1178
1179         if (session_key == 0) {
1180                 fprintf(stderr,
1181                         "Can't find env LST_SESSION or value is not valid\n");
1182                 return -1;
1183         }
1184
1185         while (1) {
1186                 c = getopt_long(argc, argv, "fc:r:",
1187                                 update_group_opts, &optidx);
1188
1189                 /* Detect the end of the options. */
1190                 if (c == -1)
1191                         break;
1192
1193                 switch (c) {
1194                 case 'f':
1195                         if (opc != 0) {
1196                                 lst_print_usage(argv[0]);
1197                                 return -1;
1198                         }
1199                         opc = LST_GROUP_REFRESH;
1200                         break;
1201
1202                 case 'r':
1203                         if (opc != 0) {
1204                                 lst_print_usage(argv[0]);
1205                                 return -1;
1206                         }
1207                         opc = LST_GROUP_RMND;
1208                         str = optarg;
1209                         break;
1210
1211                 case 'c':
1212                         clean = lst_node_str2state(optarg);
1213                         if (opc != 0 || clean <= 0) {
1214                                 lst_print_usage(argv[0]);
1215                                 return -1;
1216                         }
1217                         opc = LST_GROUP_CLEAN;
1218                         break;
1219
1220                 default:
1221                         lst_print_usage(argv[0]);
1222                         return -1;
1223                 }
1224         }
1225
1226         /* no OPC or group is specified */
1227         if (opc == 0 || optind != argc - 1) {
1228                 lst_print_usage(argv[0]);
1229                 return -1;
1230         }
1231
1232         grp = argv[optind];
1233
1234         INIT_LIST_HEAD(&head);
1235
1236         if (opc == LST_GROUP_RMND || opc == LST_GROUP_REFRESH) {
1237                 rc = lst_get_node_count(opc == LST_GROUP_RMND ? LST_OPC_NODES :
1238                                                                 LST_OPC_GROUP,
1239                                         opc == LST_GROUP_RMND ? str : grp,
1240                                         &count, &ids);
1241
1242                 if (rc != 0) {
1243                         fprintf(stderr, "Can't get count of nodes from %s: %s\n",
1244                                 opc == LST_GROUP_RMND ? str : grp,
1245                                 strerror(errno));
1246                         return -1;
1247                 }
1248
1249                 rc = lst_alloc_rpcent(&head, count, 0);
1250                 if (rc != 0) {
1251                         fprintf(stderr, "Out of memory\n");
1252                         free(ids);
1253                         return -1;
1254                 }
1255
1256         }
1257
1258         rc = lst_update_group_ioctl(opc, grp, clean, count, ids, &head);
1259
1260         if (ids != NULL)
1261                 free(ids);
1262
1263         if (rc == 0) {
1264                 lst_free_rpcent(&head);
1265                 return 0;
1266         }
1267
1268         if (rc == -1) {
1269                 lst_free_rpcent(&head);
1270                 lst_print_error("group", "Failed to update group: %s\n",
1271                                 strerror(errno));
1272                 return rc;
1273         }
1274
1275         lst_print_transerr(&head, "Updating group");
1276
1277         lst_free_rpcent(&head);
1278
1279         return rc;
1280 }
1281
1282 int
1283 lst_list_group_ioctl(int len, char *name, int idx)
1284 {
1285         struct lstio_group_list_args args = { 0 };
1286
1287         args.lstio_grp_key   = session_key;
1288         args.lstio_grp_idx   = idx;
1289         args.lstio_grp_nmlen = len;
1290         args.lstio_grp_namep = name;
1291
1292         return lst_ioctl(LSTIO_GROUP_LIST, &args, sizeof(args));
1293 }
1294
1295 int
1296 lst_info_group_ioctl(char *name, struct lstcon_ndlist_ent *gent,
1297                      int *idx, int *count, struct lstcon_node_ent *dents)
1298 {
1299         struct lstio_group_info_args args = { 0 };
1300
1301         args.lstio_grp_key    = session_key;
1302         args.lstio_grp_nmlen  = strlen(name);
1303         args.lstio_grp_namep  = name;
1304         args.lstio_grp_entp   = gent;
1305         args.lstio_grp_idxp   = idx;
1306         args.lstio_grp_ndentp = count;
1307         args.lstio_grp_dentsp = dents;
1308
1309         return lst_ioctl(LSTIO_GROUP_INFO, &args, sizeof(args));
1310 }
1311
1312 int
1313 lst_list_group_all(void)
1314 {
1315         char  name[LST_NAME_SIZE];
1316         int   rc;
1317         int   i;
1318
1319         /* no group is specified, list name of all groups */
1320         for (i = 0; ; i++) {
1321                 rc = lst_list_group_ioctl(LST_NAME_SIZE, name, i);
1322                 if (rc == 0) {
1323                         fprintf(stdout, "%d) %s\n", i + 1, name);
1324                         continue;
1325                 }
1326
1327                 if (errno == ENOENT)
1328                         break;
1329
1330                 lst_print_error("group", "Failed to list group: %s\n",
1331                                 strerror(errno));
1332                 return -1;
1333         }
1334
1335         fprintf(stdout, "Total %d groups\n", i);
1336
1337         return 0;
1338 }
1339
1340 #define LST_NODES_TITLE "\tACTIVE\tBUSY\tDOWN\tUNKNOWN\tTOTAL\n"
1341
1342 int
1343 jt_lst_list_group(int argc, char **argv)
1344 {
1345         struct lstcon_ndlist_ent gent;
1346         struct lstcon_node_ent   *dents;
1347         int optidx  = 0;
1348         int verbose = 0;
1349         int active  = 0;
1350         int busy    = 0;
1351         int down    = 0;
1352         int unknown = 0;
1353         int all     = 0;
1354         int count;
1355         int index;
1356         int i;
1357         int j;
1358         int c;
1359         int rc      = 0;
1360
1361         static const struct option list_group_opts[] = {
1362                 { .name = "active",  .has_arg = no_argument, .val = 'a' },
1363                 { .name = "busy",    .has_arg = no_argument, .val = 'b' },
1364                 { .name = "down",    .has_arg = no_argument, .val = 'd' },
1365                 { .name = "unknown", .has_arg = no_argument, .val = 'u' },
1366                 { .name = "all",     .has_arg = no_argument, .val = 'l' },
1367                 { .name = NULL, } };
1368
1369         if (session_key == 0) {
1370                 fprintf(stderr,
1371                         "Can't find env LST_SESSION or value is not valid\n");
1372                 return -1;
1373         }
1374
1375         while (1) {
1376                 c = getopt_long(argc, argv, "abdul",
1377                                 list_group_opts, &optidx);
1378
1379                 if (c == -1)
1380                         break;
1381
1382                 switch (c) {
1383                 case 'a':
1384                         verbose = active = 1;
1385                         all = 0;
1386                         break;
1387                 case 'b':
1388                         verbose = busy = 1;
1389                         all = 0;
1390                         break;
1391                 case 'd':
1392                         verbose = down = 1;
1393                         all = 0;
1394                         break;
1395                 case 'u':
1396                         verbose = unknown = 1;
1397                         all = 0;
1398                         break;
1399                 case 'l':
1400                         verbose = all = 1;
1401                         break;
1402                 default:
1403                         lst_print_usage(argv[0]);
1404                         return -1;
1405                 }
1406         }
1407
1408         if (optind == argc) {
1409                 /* no group is specified, list name of all groups */
1410                 rc = lst_list_group_all();
1411
1412                 return rc;
1413         }
1414
1415         if (!verbose)
1416                 fprintf(stdout, LST_NODES_TITLE);
1417
1418         /* list nodes in specified groups */
1419         for (i = optind; i < argc; i++) {
1420                 rc = lst_info_group_ioctl(argv[i], &gent, NULL, NULL, NULL);
1421                 if (rc != 0) {
1422                         if (errno == ENOENT) {
1423                                 rc = 0;
1424                                 break;
1425                         }
1426
1427                         lst_print_error("group", "Failed to list group\n",
1428                                         strerror(errno));
1429                         break;
1430                 }
1431
1432                 if (!verbose) {
1433                         fprintf(stdout, "\t%d\t%d\t%d\t%d\t%d\t%s\n",
1434                                 gent.nle_nactive, gent.nle_nbusy,
1435                                 gent.nle_ndown, gent.nle_nunknown,
1436                                 gent.nle_nnode, argv[i]);
1437                         continue;
1438                 }
1439
1440                 fprintf(stdout, "Group [ %s ]\n", argv[i]);
1441
1442                 if (gent.nle_nnode == 0) {
1443                         fprintf(stdout, "No nodes found [ %s ]\n", argv[i]);
1444                         continue;
1445                 }
1446
1447                 count = gent.nle_nnode;
1448
1449                 dents = malloc(count * sizeof(struct lstcon_node_ent));
1450                 if (dents == NULL) {
1451                         fprintf(stderr, "Failed to malloc: %s\n",
1452                                 strerror(errno));
1453                         return -1;
1454                 }
1455
1456                 index = 0;
1457                 rc = lst_info_group_ioctl(argv[i], &gent, &index, &count, dents);
1458                 if (rc != 0) {
1459                         lst_print_error("group", "Failed to list group: %s\n",
1460                                         strerror(errno));
1461                         free(dents);
1462                         return -1;
1463                 }
1464
1465                 for (j = 0, c = 0; j < count; j++) {
1466                         if (all ||
1467                             ((active  &&  dents[j].nde_state == LST_NODE_ACTIVE) ||
1468                              (busy    &&  dents[j].nde_state == LST_NODE_BUSY)   ||
1469                              (down    &&  dents[j].nde_state == LST_NODE_DOWN)   ||
1470                              (unknown &&  dents[j].nde_state == LST_NODE_UNKNOWN))) {
1471
1472                                 fprintf(stdout, "\t%s: %s\n",
1473                                         libcfs_id2str(dents[j].nde_id),
1474                                         lst_node_state2str(dents[j].nde_state));
1475                                 c++;
1476                         }
1477                 }
1478
1479                 fprintf(stdout, "Total %d nodes [ %s ]\n", c, argv[i]);
1480
1481                 free(dents);
1482         }
1483
1484         return rc;
1485 }
1486
1487 int
1488 lst_stat_ioctl(char *name, int count, struct lnet_process_id *idsp,
1489                int timeout, struct list_head *resultp)
1490 {
1491         struct lstio_stat_args args = { 0 };
1492
1493         args.lstio_sta_key     = session_key;
1494         args.lstio_sta_timeout = timeout;
1495         args.lstio_sta_nmlen   = strlen(name);
1496         args.lstio_sta_namep   = name;
1497         args.lstio_sta_count   = count;
1498         args.lstio_sta_idsp    = idsp;
1499         args.lstio_sta_resultp = resultp;
1500
1501         return lst_ioctl(LSTIO_STAT_QUERY, &args, sizeof(args));
1502 }
1503
1504 typedef struct {
1505         struct list_head              srp_link;
1506         int                     srp_count;
1507         char                   *srp_name;
1508         struct lnet_process_id      *srp_ids;
1509         struct list_head              srp_result[2];
1510 } lst_stat_req_param_t;
1511
1512 static void
1513 lst_stat_req_param_free(lst_stat_req_param_t *srp)
1514 {
1515         int     i;
1516
1517         for (i = 0; i < 2; i++)
1518                 lst_free_rpcent(&srp->srp_result[i]);
1519
1520         if (srp->srp_ids != NULL)
1521                 free(srp->srp_ids);
1522
1523         free(srp);
1524 }
1525
1526 static int
1527 lst_stat_req_param_alloc(char *name, lst_stat_req_param_t **srpp, int save_old)
1528 {
1529         lst_stat_req_param_t *srp = NULL;
1530         int                   count = save_old ? 2 : 1;
1531         int                   rc;
1532         int                   i;
1533
1534         srp = malloc(sizeof(*srp));
1535         if (srp == NULL)
1536                 return -ENOMEM;
1537
1538         memset(srp, 0, sizeof(*srp));
1539         INIT_LIST_HEAD(&srp->srp_result[0]);
1540         INIT_LIST_HEAD(&srp->srp_result[1]);
1541
1542         rc = lst_get_node_count(LST_OPC_GROUP, name,
1543                                 &srp->srp_count, NULL);
1544         if (rc != 0 && errno == ENOENT) {
1545                 rc = lst_get_node_count(LST_OPC_NODES, name,
1546                                         &srp->srp_count, &srp->srp_ids);
1547         }
1548
1549         if (rc != 0) {
1550                 fprintf(stderr,
1551                         "Failed to get count of nodes from %s: %s\n",
1552                         name, strerror(errno));
1553                 lst_stat_req_param_free(srp);
1554
1555                 return rc;
1556         }
1557
1558         srp->srp_name = name;
1559
1560         for (i = 0; i < count; i++) {
1561                 rc = lst_alloc_rpcent(&srp->srp_result[i], srp->srp_count,
1562                                       sizeof(struct sfw_counters)  +
1563                                       sizeof(struct srpc_counters) +
1564                                       sizeof(struct lnet_counters));
1565                 if (rc != 0) {
1566                         fprintf(stderr, "Out of memory\n");
1567                         break;
1568                 }
1569         }
1570
1571         if (rc == 0) {
1572                 *srpp = srp;
1573                 return 0;
1574         }
1575
1576         lst_stat_req_param_free(srp);
1577
1578         return rc;
1579 }
1580
/* Placeholder for selftest RPC statistics, not filled in yet. */
typedef struct {
        int     foo;    /* TODO */
} lst_srpc_stat_result;
1585
/* values of the "off" argument of lst_lnet_stat_value() */
#define LST_LNET_AVG    0
#define LST_LNET_MIN    1
#define LST_LNET_MAX    2

/*
 * Aggregated LNet statistics over all nodes of one stat target.
 *
 * "rate" members are message rates and "perf" members are bandwidths;
 * "snd" is the send direction and "rcv" the receive direction.  Each
 * group of four holds average, minimum, maximum and running total.
 */
typedef struct {
        float           lnet_avg_sndrate;
        float           lnet_min_sndrate;
        float           lnet_max_sndrate;
        float           lnet_total_sndrate;

        float           lnet_avg_rcvrate;
        float           lnet_min_rcvrate;
        float           lnet_max_rcvrate;
        float           lnet_total_rcvrate;

        float           lnet_avg_sndperf;
        float           lnet_min_sndperf;
        float           lnet_max_sndperf;
        float           lnet_total_sndperf;

        float           lnet_avg_rcvperf;
        float           lnet_min_rcvperf;
        float           lnet_max_rcvperf;
        float           lnet_total_rcvperf;

        /* number of samples accumulated into the totals */
        int             lnet_stat_count;
} lst_lnet_stat_result_t;

lst_lnet_stat_result_t lnet_stat_result;

/*
 * Return one value from lnet_stat_result.
 *
 * \param bw    non-zero selects bandwidth ("perf"), zero selects rates
 * \param send  non-zero selects the send side, zero the receive side
 * \param off   LST_LNET_AVG, LST_LNET_MIN or LST_LNET_MAX; 3 selects the
 *              running total
 *
 * Any other \a off yields 0.  The members are looked up through an
 * explicit table rather than by stepping a pointer from one member to
 * the next, so the result does not depend on the structure layout.
 */
static float
lst_lnet_stat_value(int bw, int send, int off)
{
        enum { LST_LNET_NVALUES = 4 };

        /* indexed as [bw][send][off] */
        static const float *const value[2][2][LST_LNET_NVALUES] = {
                [0][0] = { &lnet_stat_result.lnet_avg_rcvrate,
                           &lnet_stat_result.lnet_min_rcvrate,
                           &lnet_stat_result.lnet_max_rcvrate,
                           &lnet_stat_result.lnet_total_rcvrate },
                [0][1] = { &lnet_stat_result.lnet_avg_sndrate,
                           &lnet_stat_result.lnet_min_sndrate,
                           &lnet_stat_result.lnet_max_sndrate,
                           &lnet_stat_result.lnet_total_sndrate },
                [1][0] = { &lnet_stat_result.lnet_avg_rcvperf,
                           &lnet_stat_result.lnet_min_rcvperf,
                           &lnet_stat_result.lnet_max_rcvperf,
                           &lnet_stat_result.lnet_total_rcvperf },
                [1][1] = { &lnet_stat_result.lnet_avg_sndperf,
                           &lnet_stat_result.lnet_min_sndperf,
                           &lnet_stat_result.lnet_max_sndperf,
                           &lnet_stat_result.lnet_total_sndperf },
        };

        if (off < 0 || off >= LST_LNET_NVALUES)
                return 0.0f;

        return *value[bw != 0][send != 0][off];
}
1631
/*
 * Store tv1 - tv2 in \a df, borrowing one second when the microsecond
 * part of \a tv1 is smaller than that of \a tv2.
 */
static void
lst_timeval_diff(struct timeval *tv1,
                 struct timeval *tv2, struct timeval *df)
{
        int     borrow = tv1->tv_usec < tv2->tv_usec;

        df->tv_sec  = tv1->tv_sec - borrow - tv2->tv_sec;
        df->tv_usec = tv1->tv_usec + (borrow ? 1000000 : 0) - tv2->tv_usec;
}
1647
1648 static void
1649 lst_cal_lnet_stat(float delta, struct lnet_counters *lnet_new,
1650                   struct lnet_counters *lnet_old, int mbs)
1651 {
1652         float perf;
1653         float rate;
1654         unsigned int unit_divisor;
1655
1656         unit_divisor = (mbs) ? (1000 * 1000) : (1024 * 1024);
1657         perf = (float)(lnet_new->send_length -
1658                        lnet_old->send_length) / unit_divisor / delta;
1659         lnet_stat_result.lnet_total_sndperf += perf;
1660
1661         if (lnet_stat_result.lnet_min_sndperf > perf ||
1662             lnet_stat_result.lnet_min_sndperf == 0)
1663                 lnet_stat_result.lnet_min_sndperf = perf;
1664
1665         if (lnet_stat_result.lnet_max_sndperf < perf)
1666                 lnet_stat_result.lnet_max_sndperf = perf;
1667
1668         perf = (float)(lnet_new->recv_length -
1669                        lnet_old->recv_length) / unit_divisor / delta;
1670         lnet_stat_result.lnet_total_rcvperf += perf;
1671
1672         if (lnet_stat_result.lnet_min_rcvperf > perf ||
1673             lnet_stat_result.lnet_min_rcvperf == 0)
1674                 lnet_stat_result.lnet_min_rcvperf = perf;
1675
1676         if (lnet_stat_result.lnet_max_rcvperf < perf)
1677                 lnet_stat_result.lnet_max_rcvperf = perf;
1678
1679         rate = (lnet_new->send_count - lnet_old->send_count) / delta;
1680         lnet_stat_result.lnet_total_sndrate += rate;
1681
1682         if (lnet_stat_result.lnet_min_sndrate > rate ||
1683             lnet_stat_result.lnet_min_sndrate == 0)
1684                 lnet_stat_result.lnet_min_sndrate = rate;
1685
1686         if (lnet_stat_result.lnet_max_sndrate < rate)
1687                 lnet_stat_result.lnet_max_sndrate = rate;
1688
1689         rate = (lnet_new->recv_count - lnet_old->recv_count) / delta;
1690         lnet_stat_result.lnet_total_rcvrate += rate;
1691
1692         if (lnet_stat_result.lnet_min_rcvrate > rate ||
1693             lnet_stat_result.lnet_min_rcvrate == 0)
1694                 lnet_stat_result.lnet_min_rcvrate = rate;
1695
1696         if (lnet_stat_result.lnet_max_rcvrate < rate)
1697                 lnet_stat_result.lnet_max_rcvrate = rate;
1698
1699         lnet_stat_result.lnet_stat_count++;
1700
1701         lnet_stat_result.lnet_avg_sndrate = lnet_stat_result.lnet_total_sndrate /
1702                                             lnet_stat_result.lnet_stat_count;
1703         lnet_stat_result.lnet_avg_rcvrate = lnet_stat_result.lnet_total_rcvrate /
1704                                             lnet_stat_result.lnet_stat_count;
1705
1706         lnet_stat_result.lnet_avg_sndperf = lnet_stat_result.lnet_total_sndperf /
1707                                             lnet_stat_result.lnet_stat_count;
1708         lnet_stat_result.lnet_avg_rcvperf = lnet_stat_result.lnet_total_rcvperf /
1709                                             lnet_stat_result.lnet_stat_count;
1710 }
1711
1712 static void
1713 lst_print_lnet_stat(char *name, int bwrt, int rdwr, int type, int mbs)
1714 {
1715         int     start1 = 0;
1716         int     end1   = 1;
1717         int     start2 = 0;
1718         int     end2   = 1;
1719         int     i;
1720         int     j;
1721         char   *units;
1722
1723         if (lnet_stat_result.lnet_stat_count == 0)
1724                 return;
1725
1726         units = (mbs) ? "MB/s  " : "MiB/s ";
1727
1728         if (bwrt == 1) /* bw only */
1729                 start1 = 1;
1730
1731         if (bwrt == 2) /* rates only */
1732                 end1 = 0;
1733
1734         if (rdwr == 1) /* recv only */
1735                 start2 = 1;
1736
1737         if (rdwr == 2) /* send only */
1738                 end2 = 0;
1739
1740         for (i = start1; i <= end1; i++) {
1741                 fprintf(stdout, "[LNet %s of %s]\n",
1742                         i == 0 ? "Rates" : "Bandwidth", name);
1743
1744                 for (j = start2; j <= end2; j++) {
1745                         fprintf(stdout, "[%c] ", j == 0 ? 'R' : 'W');
1746
1747                         if ((type & 1) != 0) {
1748                                 fprintf(stdout, i == 0 ? "Avg: %-8.0f RPC/s " :
1749                                                          "Avg: %-8.2f %s",
1750                                         lst_lnet_stat_value(i, j, 0), units);
1751                         }
1752
1753                         if ((type & 2) != 0) {
1754                                 fprintf(stdout, i == 0 ? "Min: %-8.0f RPC/s " :
1755                                                          "Min: %-8.2f %s",
1756                                         lst_lnet_stat_value(i, j, 1), units);
1757                         }
1758
1759                         if ((type & 4) != 0) {
1760                                 fprintf(stdout, i == 0 ? "Max: %-8.0f RPC/s" :
1761                                                          "Max: %-8.2f %s",
1762                                         lst_lnet_stat_value(i, j, 2), units);
1763                         }
1764
1765                         fprintf(stdout, "\n");
1766                 }
1767         }
1768 }
1769
1770 static void
1771 lst_print_stat(char *name, struct list_head *resultp,
1772                int idx, int lnet, int bwrt, int rdwr, int type,
1773                int mbs)
1774 {
1775         struct list_head        tmp[2];
1776         struct lstcon_rpc_ent *new;
1777         struct lstcon_rpc_ent *old;
1778         struct sfw_counters   *sfwk_new;
1779         struct sfw_counters   *sfwk_old;
1780         struct srpc_counters  *srpc_new;
1781         struct srpc_counters  *srpc_old;
1782         struct lnet_counters  *lnet_new;
1783         struct lnet_counters  *lnet_old;
1784         float             delta;
1785         int               errcount = 0;
1786
1787         INIT_LIST_HEAD(&tmp[0]);
1788         INIT_LIST_HEAD(&tmp[1]);
1789
1790         memset(&lnet_stat_result, 0, sizeof(lnet_stat_result));
1791
1792         while (!list_empty(&resultp[idx])) {
1793                 if (list_empty(&resultp[1 - idx])) {
1794                         fprintf(stderr, "Group is changed, re-run stat\n");
1795                         break;
1796                 }
1797
1798                 new = list_entry(resultp[idx].next, struct lstcon_rpc_ent,
1799                                      rpe_link);
1800                 old = list_entry(resultp[1 - idx].next, struct lstcon_rpc_ent,
1801                                      rpe_link);
1802
1803                 /* first time get stats result, can't calculate diff */
1804                 if (new->rpe_peer.nid == LNET_NID_ANY)
1805                         break;
1806
1807                 if (new->rpe_peer.nid != old->rpe_peer.nid ||
1808                     new->rpe_peer.pid != old->rpe_peer.pid) {
1809                         /* Something wrong. i.e, somebody change the group */
1810                         break;
1811                 }
1812
1813                 list_del(&new->rpe_link);
1814                 list_add_tail(&new->rpe_link, &tmp[idx]);
1815
1816                 list_del(&old->rpe_link);
1817                 list_add_tail(&old->rpe_link, &tmp[1 - idx]);
1818
1819                 if (new->rpe_rpc_errno != 0 || new->rpe_fwk_errno != 0 ||
1820                     old->rpe_rpc_errno != 0 || old->rpe_fwk_errno != 0) {
1821                         errcount ++;
1822                         continue;
1823                 }
1824
1825                 sfwk_new = (struct sfw_counters *)&new->rpe_payload[0];
1826                 sfwk_old = (struct sfw_counters *)&old->rpe_payload[0];
1827
1828                 srpc_new = (struct srpc_counters *)((char *)sfwk_new + sizeof(*sfwk_new));
1829                 srpc_old = (struct srpc_counters *)((char *)sfwk_old + sizeof(*sfwk_old));
1830
1831                 lnet_new = (struct lnet_counters *)((char *)srpc_new + sizeof(*srpc_new));
1832                 lnet_old = (struct lnet_counters *)((char *)srpc_old + sizeof(*srpc_old));
1833
1834                 /* Prior to version 2.3, the running_ms field was a counter for
1835                  * the number of running tests.  We are looking at this value
1836                  * to determine if it is a millisecond timestamep (>= 2.3) or a
1837                  * test counter (< 2.3).  The number 500 is being used for this
1838                  * barrier as the test counter should never get this high, and
1839                  * the timestamp should never get this low. */
1840
1841                 if (sfwk_new->running_ms > 500) {
1842                         /* use the timestamp from the remote node, not our
1843                          * rpe_stamp from when we copied up the data out of
1844                          * the kernel */
1845
1846                         delta = (float) (sfwk_new->running_ms -
1847                                         sfwk_old->running_ms) / 1000;
1848                 } else {
1849                         struct timeval    tv;
1850
1851                         lst_timeval_diff(&new->rpe_stamp, &old->rpe_stamp, &tv);
1852                         delta = tv.tv_sec + (float)tv.tv_usec / 1000000;
1853                 }
1854
1855                 if (!lnet) /* TODO */
1856                         continue;
1857
1858                 lst_cal_lnet_stat(delta, lnet_new, lnet_old, mbs);
1859         }
1860
1861         list_splice(&tmp[idx], &resultp[idx]);
1862         list_splice(&tmp[1 - idx], &resultp[1 - idx]);
1863
1864         if (errcount > 0)
1865                 fprintf(stdout, "Failed to stat on %d nodes\n", errcount);
1866
1867         if (!lnet)  /* TODO */
1868                 return;
1869
1870         lst_print_lnet_stat(name, bwrt, rdwr, type, mbs);
1871 }
1872
1873 int
1874 jt_lst_stat(int argc, char **argv)
1875 {
1876         struct list_head        head;
1877         lst_stat_req_param_t *srp;
1878         time_t                last    = 0;
1879         int                   optidx  = 0;
1880         int                   timeout = 5; /* default timeout, 5 sec */
1881         int                   delay   = 5; /* default delay, 5 sec */
1882         int                   count   = -1; /* run forever */
1883         int                   lnet    = 1; /* lnet stat by default */
1884         int                   bwrt    = 0;
1885         int                   rdwr    = 0;
1886         int                   type    = -1;
1887         int                   idx     = 0;
1888         int                   rc;
1889         int                   c;
1890         int                   mbs     = 0; /* report as MB/s */
1891
1892         static const struct option stat_opts[] = {
1893                 { .name = "timeout", .has_arg = required_argument, .val = 't' },
1894                 { .name = "delay",   .has_arg = required_argument, .val = 'd' },
1895                 { .name = "count",   .has_arg = required_argument, .val = 'o' },
1896                 { .name = "lnet",    .has_arg = no_argument,       .val = 'l' },
1897                 { .name = "rpc",     .has_arg = no_argument,       .val = 'c' },
1898                 { .name = "bw",      .has_arg = no_argument,       .val = 'b' },
1899                 { .name = "rate",    .has_arg = no_argument,       .val = 'a' },
1900                 { .name = "read",    .has_arg = no_argument,       .val = 'r' },
1901                 { .name = "write",   .has_arg = no_argument,       .val = 'w' },
1902                 { .name = "avg",     .has_arg = no_argument,       .val = 'g' },
1903                 { .name = "min",     .has_arg = no_argument,       .val = 'n' },
1904                 { .name = "max",     .has_arg = no_argument,       .val = 'x' },
1905                 { .name = "mbs",     .has_arg = no_argument,       .val = 'm' },
1906                 { .name = NULL } };
1907
1908         if (session_key == 0) {
1909                 fprintf(stderr,
1910                         "Can't find env LST_SESSION or value is not valid\n");
1911                 return -1;
1912         }
1913
1914         while (1) {
1915                 c = getopt_long(argc, argv, "t:d:lcbarwgnxm", stat_opts,
1916                                 &optidx);
1917
1918                 if (c == -1)
1919                         break;
1920
1921                 switch (c) {
1922                 case 't':
1923                         timeout = atoi(optarg);
1924                         break;
1925                 case 'd':
1926                         delay = atoi(optarg);
1927                         break;
1928                 case 'o':
1929                         count = atoi(optarg);
1930                         break;
1931                 case 'l':
1932                         lnet = 1;
1933                         break;
1934                 case 'c':
1935                         lnet = 0;
1936                         break;
1937                 case 'b':
1938                         bwrt |= 1;
1939                         break;
1940                 case 'a':
1941                         bwrt |= 2;
1942                         break;
1943                 case 'r':
1944                         rdwr |= 1;
1945                         break;
1946                 case 'w':
1947                         rdwr |= 2;
1948                         break;
1949                 case 'g':
1950                         if (type == -1) {
1951                                 type = 1;
1952                                 break;
1953                         }
1954                         type |= 1;
1955                         break;
1956                 case 'n':
1957                         if (type == -1) {
1958                                 type = 2;
1959                                 break;
1960                         }
1961                         type |= 2;
1962                         break;
1963                 case 'x':
1964                         if (type == -1) {
1965                                 type = 4;
1966                                 break;
1967                         }
1968                         type |= 4;
1969                         break;
1970                 case 'm':
1971                         mbs = 1;
1972                         break;
1973
1974                 default:
1975                         lst_print_usage(argv[0]);
1976                         return -1;
1977                 }
1978         }
1979
1980         if (optind == argc) {
1981                 lst_print_usage(argv[0]);
1982                 return -1;
1983         }
1984
1985         if (timeout <= 0 || delay <= 0) {
1986                 fprintf(stderr, "Invalid timeout or delay value\n");
1987                 return -1;
1988         }
1989
1990         if (count < -1) {
1991             fprintf(stderr, "Invalid count value\n");
1992             return -1;
1993         }
1994
1995         /* extra count to get first data point */
1996         if (count != -1)
1997             count++;
1998
1999         INIT_LIST_HEAD(&head);
2000
2001         while (optind < argc) {
2002                 rc = lst_stat_req_param_alloc(argv[optind++], &srp, 1);
2003                 if (rc != 0)
2004                         goto out;
2005
2006                 list_add_tail(&srp->srp_link, &head);
2007         }
2008
2009         do {
2010                 time_t  now = time(NULL);
2011
2012                 if (now - last < delay) {
2013                         sleep(delay - now + last);
2014                         time(&now);
2015                 }
2016                 last = now;
2017
2018                 list_for_each_entry(srp, &head, srp_link) {
2019                         rc = lst_stat_ioctl(srp->srp_name,
2020                                             srp->srp_count, srp->srp_ids,
2021                                             timeout, &srp->srp_result[idx]);
2022                         if (rc == -1) {
2023                                 lst_print_error("stat", "Failed to stat %s: %s\n",
2024                                                 srp->srp_name, strerror(errno));
2025                                 goto out;
2026                         }
2027
2028                         lst_print_stat(srp->srp_name, srp->srp_result,
2029                                        idx, lnet, bwrt, rdwr, type, mbs);
2030
2031                         lst_reset_rpcent(&srp->srp_result[1 - idx]);
2032                 }
2033
2034                 idx = 1 - idx;
2035
2036                 if (count > 0)
2037                         count--;
2038         } while (count == -1 || count > 0);
2039
2040 out:
2041         while (!list_empty(&head)) {
2042                 srp = list_entry(head.next, lst_stat_req_param_t, srp_link);
2043
2044                 list_del(&srp->srp_link);
2045                 lst_stat_req_param_free(srp);
2046         }
2047
2048         return rc;
2049 }
2050
2051 int
2052 jt_lst_show_error(int argc, char **argv)
2053 {
2054         struct list_head       head;
2055         lst_stat_req_param_t  *srp;
2056         struct lstcon_rpc_ent *ent;
2057         struct sfw_counters   *sfwk;
2058         struct srpc_counters  *srpc;
2059         int                    show_rpc = 1;
2060         int                    optidx = 0;
2061         int                    rc = 0;
2062         int                    ecount;
2063         int                    c;
2064
2065         static const struct option show_error_opts[] = {
2066                 { .name = "session", .has_arg = no_argument, .val = 's' },
2067                 { .name = NULL, } };
2068
2069         if (session_key == 0) {
2070                 fprintf(stderr,
2071                         "Can't find env LST_SESSION or value is not valid\n");
2072                 return -1;
2073         }
2074
2075         while (1) {
2076                 c = getopt_long(argc, argv, "s", show_error_opts, &optidx);
2077
2078                 if (c == -1)
2079                         break;
2080
2081                 switch (c) {
2082                 case 's':
2083                         show_rpc  = 0;
2084                         break;
2085
2086                 default:
2087                         lst_print_usage(argv[0]);
2088                         return -1;
2089                 }
2090         }
2091
2092         if (optind == argc) {
2093                 lst_print_usage(argv[0]);
2094                 return -1;
2095         }
2096
2097         INIT_LIST_HEAD(&head);
2098
2099         while (optind < argc) {
2100                 rc = lst_stat_req_param_alloc(argv[optind++], &srp, 0);
2101                 if (rc != 0)
2102                         goto out;
2103
2104                 list_add_tail(&srp->srp_link, &head);
2105         }
2106
2107         list_for_each_entry(srp, &head, srp_link) {
2108                 rc = lst_stat_ioctl(srp->srp_name, srp->srp_count,
2109                                     srp->srp_ids, 10, &srp->srp_result[0]);
2110
2111                 if (rc == -1) {
2112                         lst_print_error(srp->srp_name, "Failed to show errors of %s: %s\n",
2113                                         srp->srp_name, strerror(errno));
2114                         goto out;
2115                 }
2116
2117                 fprintf(stdout, "%s:\n", srp->srp_name);
2118
2119                 ecount = 0;
2120
2121                 list_for_each_entry(ent, &srp->srp_result[0], rpe_link) {
2122                         if (ent->rpe_rpc_errno != 0) {
2123                                 ecount ++;
2124                                 fprintf(stderr, "RPC failure, can't show error on %s\n",
2125                                         libcfs_id2str(ent->rpe_peer));
2126                                 continue;
2127                         }
2128
2129                         if (ent->rpe_fwk_errno != 0) {
2130                                 ecount ++;
2131                                 fprintf(stderr, "Framework failure, can't show error on %s\n",
2132                                         libcfs_id2str(ent->rpe_peer));
2133                                 continue;
2134                         }
2135
2136                         sfwk = (struct sfw_counters *)&ent->rpe_payload[0];
2137                         srpc = (struct srpc_counters *)((char *)sfwk + sizeof(*sfwk));
2138
2139                         if (srpc->errors == 0 &&
2140                             sfwk->brw_errors == 0 && sfwk->ping_errors == 0)
2141                                 continue;
2142
2143                         if (!show_rpc  &&
2144                             sfwk->brw_errors == 0 && sfwk->ping_errors == 0)
2145                                 continue;
2146
2147                         ecount ++;
2148
2149                         fprintf(stderr, "%s: [Session %d brw errors, %d ping errors]%c",
2150                                 libcfs_id2str(ent->rpe_peer),
2151                                 sfwk->brw_errors, sfwk->ping_errors,
2152                                 show_rpc  ? ' ' : '\n');
2153
2154                         if (!show_rpc)
2155                                 continue;
2156
2157                         fprintf(stderr, "[RPC: %d errors, %d dropped, %d expired]\n",
2158                                 srpc->errors, srpc->rpcs_dropped, srpc->rpcs_expired);
2159                 }
2160
2161                 fprintf(stdout, "Total %d error nodes in %s\n", ecount, srp->srp_name);
2162         }
2163 out:
2164         while (!list_empty(&head)) {
2165                 srp = list_entry(head.next, lst_stat_req_param_t, srp_link);
2166
2167                 list_del(&srp->srp_link);
2168                 lst_stat_req_param_free(srp);
2169         }
2170
2171         return rc;
2172 }
2173
2174 int
2175 lst_add_batch_ioctl(char *name)
2176 {
2177         struct lstio_batch_add_args args = { 0 };
2178
2179         args.lstio_bat_key   = session_key;
2180         args.lstio_bat_nmlen = strlen(name);
2181         args.lstio_bat_namep = name;
2182
2183         return lst_ioctl (LSTIO_BATCH_ADD, &args, sizeof(args));
2184 }
2185
2186 int
2187 jt_lst_add_batch(int argc, char **argv)
2188 {
2189         char   *name;
2190         int     rc;
2191
2192         if (session_key == 0) {
2193                 fprintf(stderr,
2194                         "Can't find env LST_SESSION or value is not valid\n");
2195                 return -1;
2196         }
2197
2198         if (argc != 2) {
2199                 lst_print_usage(argv[0]);
2200                 return -1;
2201         }
2202
2203         name = argv[1];
2204         if (strlen(name) >= LST_NAME_SIZE) {
2205                 fprintf(stderr, "Name length is limited to %d\n",
2206                         LST_NAME_SIZE - 1);
2207                 return -1;
2208         }
2209
2210         rc = lst_add_batch_ioctl(name);
2211         if (rc == 0)
2212                 return 0;
2213
2214         lst_print_error("batch", "Failed to create batch: %s\n",
2215                         strerror(errno));
2216
2217         return -1;
2218 }
2219
2220 int
2221 lst_start_batch_ioctl(char *name, int timeout, struct list_head *resultp)
2222 {
2223         struct lstio_batch_run_args args = { 0 };
2224
2225         args.lstio_bat_key     = session_key;
2226         args.lstio_bat_timeout = timeout;
2227         args.lstio_bat_nmlen   = strlen(name);
2228         args.lstio_bat_namep   = name;
2229         args.lstio_bat_resultp = resultp;
2230
2231         return lst_ioctl(LSTIO_BATCH_START, &args, sizeof(args));
2232 }
2233
2234 int
2235 jt_lst_start_batch(int argc, char **argv)
2236 {
2237         struct list_head  head;
2238         char             *batch;
2239         int               optidx = 0;
2240         int               timeout = 0;
2241         int               count = 0;
2242         int               rc;
2243         int               c;
2244
2245         static const struct option start_batch_opts[] = {
2246                 { .name = "timeout", .has_arg = required_argument, .val = 't' },
2247                 { .name = NULL } };
2248
2249         if (session_key == 0) {
2250                 fprintf(stderr,
2251                         "Can't find env LST_SESSION or value is not valid\n");
2252                 return -1;
2253         }
2254
2255         while (1) {
2256                 c = getopt_long(argc, argv, "t:",
2257                                 start_batch_opts, &optidx);
2258
2259                 /* Detect the end of the options. */
2260                 if (c == -1)
2261                         break;
2262
2263                 switch (c) {
2264                 case 't':
2265                         timeout = atoi(optarg);
2266                         break;
2267                 default:
2268                         lst_print_usage(argv[0]);
2269                         return -1;
2270                 }
2271         }
2272
2273         if (optind == argc) {
2274                 batch = LST_DEFAULT_BATCH;
2275
2276         } else if (optind == argc - 1) {
2277                 batch = argv[optind];
2278
2279         } else {
2280                 lst_print_usage(argv[0]);
2281                 return -1;
2282         }
2283
2284         rc = lst_get_node_count(LST_OPC_BATCHCLI, batch, &count, NULL);
2285         if (rc != 0) {
2286                 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
2287                         batch, strerror(errno));
2288                 return -1;
2289         }
2290
2291         INIT_LIST_HEAD(&head);
2292
2293         rc = lst_alloc_rpcent(&head, count, 0);
2294         if (rc != 0) {
2295                 fprintf(stderr, "Out of memory\n");
2296                 return -1;
2297         }
2298
2299         rc = lst_start_batch_ioctl(batch, timeout, &head);
2300
2301         if (rc == 0) {
2302                 fprintf(stdout, "%s is running now\n", batch);
2303                 lst_free_rpcent(&head);
2304                 return 0;
2305         }
2306
2307         if (rc == -1) {
2308                 lst_print_error("batch", "Failed to start batch: %s\n",
2309                                 strerror(errno));
2310                 lst_free_rpcent(&head);
2311                 return rc;
2312         }
2313
2314         lst_print_transerr(&head, "Run batch");
2315
2316         lst_free_rpcent(&head);
2317
2318         return rc;
2319 }
2320
2321 int
2322 lst_stop_batch_ioctl(char *name, int force, struct list_head *resultp)
2323 {
2324         struct lstio_batch_stop_args args = { 0 };
2325
2326         args.lstio_bat_key     = session_key;
2327         args.lstio_bat_force   = force;
2328         args.lstio_bat_nmlen   = strlen(name);
2329         args.lstio_bat_namep   = name;
2330         args.lstio_bat_resultp = resultp;
2331
2332         return lst_ioctl(LSTIO_BATCH_STOP, &args, sizeof(args));
2333 }
2334
2335 int
2336 jt_lst_stop_batch(int argc, char **argv)
2337 {
2338         struct list_head  head;
2339         char             *batch;
2340         int               force = 0;
2341         int               optidx;
2342         int               count;
2343         int               rc;
2344         int               c;
2345
2346         static const struct option stop_batch_opts[] = {
2347                 { .name = "force", .has_arg = no_argument, .val = 'f' },
2348                 { .name = NULL } };
2349
2350         if (session_key == 0) {
2351                 fprintf(stderr,
2352                         "Can't find env LST_SESSION or value is not valid\n");
2353                 return -1;
2354         }
2355
2356         while (1) {
2357                 c = getopt_long(argc, argv, "f",
2358                                 stop_batch_opts, &optidx);
2359
2360                 /* Detect the end of the options. */
2361                 if (c == -1)
2362                         break;
2363
2364                 switch (c) {
2365                 case 'f':
2366                         force = 1;
2367                         break;
2368                 default:
2369                         lst_print_usage(argv[0]);
2370                         return -1;
2371                 }
2372         }
2373
2374         if (optind == argc) {
2375                 batch = LST_DEFAULT_BATCH;
2376
2377         } else if (optind == argc - 1) {
2378                 batch = argv[optind];
2379
2380         } else {
2381                 lst_print_usage(argv[0]);
2382                 return -1;
2383         }
2384
2385         rc = lst_get_node_count(LST_OPC_BATCHCLI, batch, &count, NULL);
2386         if (rc != 0) {
2387                 fprintf(stderr, "Failed to get count of nodes from %s: %s\n",
2388                         batch, strerror(errno));
2389                 return -1;
2390         }
2391
2392         INIT_LIST_HEAD(&head);
2393
2394         rc = lst_alloc_rpcent(&head, count, 0);
2395         if (rc != 0) {
2396                 fprintf(stderr, "Out of memory\n");
2397                 return -1;
2398         }
2399
2400         rc = lst_stop_batch_ioctl(batch, force, &head);
2401         if (rc != 0)
2402                 goto out;
2403
2404         while (1) {
2405                 lst_reset_rpcent(&head);
2406
2407                 rc = lst_query_batch_ioctl(batch, 0, 0, 30, &head);
2408                 if (rc != 0)
2409                         goto out;
2410
2411                 if (lstcon_tsbqry_stat_run(&trans_stat, 0)  == 0 &&
2412                     lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0)
2413                         break;
2414
2415                 fprintf(stdout, "%d batch in stopping\n",
2416                         lstcon_tsbqry_stat_run(&trans_stat, 0));
2417                 sleep(1);
2418         }
2419
2420         fprintf(stdout, "Batch is stopped\n");
2421         lst_free_rpcent(&head);
2422
2423         return 0;
2424 out:
2425         if (rc == -1) {
2426                 lst_print_error("batch", "Failed to stop batch: %s\n",
2427                                 strerror(errno));
2428                 lst_free_rpcent(&head);
2429                 return -1;
2430         }
2431
2432         lst_print_transerr(&head, "stop batch");
2433
2434         lst_free_rpcent(&head);
2435
2436         return rc;
2437 }
2438
2439 int
2440 lst_list_batch_ioctl(int len, char *name, int index)
2441 {
2442         struct lstio_batch_list_args args = { 0 };
2443
2444         args.lstio_bat_key   = session_key;
2445         args.lstio_bat_idx   = index;
2446         args.lstio_bat_nmlen = len;
2447         args.lstio_bat_namep = name;
2448
2449         return lst_ioctl(LSTIO_BATCH_LIST, &args, sizeof(args));
2450 }
2451
2452 int
2453 lst_info_batch_ioctl(char *batch, int test, int server,
2454                      struct lstcon_test_batch_ent *entp, int *idxp,
2455                      int *ndentp, struct lstcon_node_ent *dentsp)
2456 {
2457         struct lstio_batch_info_args args = { 0 };
2458
2459         args.lstio_bat_key     = session_key;
2460         args.lstio_bat_nmlen   = strlen(batch);
2461         args.lstio_bat_namep   = batch;
2462         args.lstio_bat_server  = server;
2463         args.lstio_bat_testidx = test;
2464         args.lstio_bat_entp    = entp;
2465         args.lstio_bat_idxp    = idxp;
2466         args.lstio_bat_ndentp  = ndentp;
2467         args.lstio_bat_dentsp  = dentsp;
2468
2469         return lst_ioctl(LSTIO_BATCH_INFO, &args, sizeof(args));
2470 }
2471
2472 int
2473 lst_list_batch_all(void)
2474 {
2475         char name[LST_NAME_SIZE];
2476         int  rc;
2477         int  i;
2478
2479         for (i = 0; ; i++) {
2480                 rc = lst_list_batch_ioctl(LST_NAME_SIZE, name, i);
2481                 if (rc == 0) {
2482                         fprintf(stdout, "%d) %s\n", i + 1, name);
2483                         continue;
2484                 }
2485
2486                 if (errno == ENOENT)
2487                         break;
2488
2489                 lst_print_error("batch", "Failed to list batch: %s\n",
2490                                 strerror(errno));
2491                 return rc;
2492         }
2493
2494         fprintf(stdout, "Total %d batches\n", i);
2495
2496         return 0;
2497 }
2498
2499 int
2500 lst_list_tsb_nodes(char *batch, int test, int server,
2501                    int count, int active, int invalid)
2502 {
2503         struct lstcon_node_ent *dents;
2504         int                index = 0;
2505         int                rc;
2506         int                c;
2507         int                i;
2508
2509         if (count == 0)
2510                 return 0;
2511
2512         /* verbose list, show nodes in batch or test */
2513         dents = malloc(count * sizeof(struct lstcon_node_ent));
2514         if (dents == NULL) {
2515                 fprintf(stdout, "Can't allocate memory\n");
2516                 return -1;
2517         }
2518
2519         rc = lst_info_batch_ioctl(batch, test, server,
2520                                   NULL, &index, &count, dents);
2521         if (rc != 0) {
2522                 free(dents);
2523                 lst_print_error((test > 0) ? "test" : "batch",
2524                                 (test > 0) ? "Failed to query test: %s\n" :
2525                                              "Failed to query batch: %s\n",
2526                                 strerror(errno));
2527                 return -1;
2528         }
2529
2530         for (i = 0, c = 0; i < count; i++) {
2531                 if ((!active  && dents[i].nde_state == LST_NODE_ACTIVE) ||
2532                     (!invalid && (dents[i].nde_state == LST_NODE_BUSY  ||
2533                                   dents[i].nde_state == LST_NODE_DOWN  ||
2534                                   dents[i].nde_state == LST_NODE_UNKNOWN)))
2535                         continue;
2536
2537                 fprintf(stdout, "\t%s: %s\n",
2538                         libcfs_id2str(dents[i].nde_id),
2539                         lst_node_state2str(dents[i].nde_state));
2540                 c++;
2541         }
2542
2543         fprintf(stdout, "Total %d nodes\n", c);
2544         free(dents);
2545
2546         return 0;
2547 }
2548
2549 int
2550 jt_lst_list_batch(int argc, char **argv)
2551 {
2552         struct lstcon_test_batch_ent ent;
2553         char *batch   = NULL;
2554         int   optidx  = 0;
2555         int   verbose = 0; /* list nodes in batch or test */
2556         int   invalid = 0;
2557         int   active  = 0;
2558         int   server  = 0;
2559         int   ntest   = 0;
2560         int   test    = 0;
2561         int   c       = 0;
2562         int   rc;
2563
2564         static const struct option list_batch_opts[] = {
2565                 { .name = "test",    .has_arg = required_argument, .val = 't' },
2566                 { .name = "invalid", .has_arg = no_argument,       .val = 'i' },
2567                 { .name = "active",  .has_arg = no_argument,       .val = 'a' },
2568                 { .name = "all",     .has_arg = no_argument,       .val = 'l' },
2569                 { .name = "server",  .has_arg = no_argument,       .val = 's' },
2570                 { .name = NULL, } };
2571
2572         if (session_key == 0) {
2573                 fprintf(stderr,
2574                         "Can't find env LST_SESSION or value is not valid\n");
2575                 return -1;
2576         }
2577
2578         while (1) {
2579                 c = getopt_long(argc, argv, "ailst:",
2580                                 list_batch_opts, &optidx);
2581
2582                 if (c == -1)
2583                         break;
2584
2585                 switch (c) {
2586                 case 'a':
2587                         verbose = active = 1;
2588                         break;
2589                 case 'i':
2590                         verbose = invalid = 1;
2591                         break;
2592                 case 'l':
2593                         verbose = active = invalid = 1;
2594                         break;
2595                 case 's':
2596                         server = 1;
2597                         break;
2598                 case 't':
2599                         test = atoi(optarg);
2600                         ntest = 1;
2601                         break;
2602                 default:
2603                         lst_print_usage(argv[0]);
2604                         return -1;
2605                 }
2606         }
2607
2608         if (optind == argc) {
2609                 /* list all batches */
2610                 rc = lst_list_batch_all();
2611                 return rc;
2612         }
2613
2614         if (ntest == 1 && test <= 0) {
2615                 fprintf(stderr, "Invalid test id, test id starts from 1\n");
2616                 return -1;
2617         }
2618
2619         if (optind != argc - 1) {
2620                 lst_print_usage(argv[0]);
2621                 return -1;
2622         }
2623
2624         batch = argv[optind];
2625
2626 loop:
2627         /* show detail of specified batch or test */
2628         rc = lst_info_batch_ioctl(batch, test, server,
2629                                   &ent, NULL, NULL, NULL);
2630         if (rc != 0) {
2631                 lst_print_error((test > 0) ? "test" : "batch",
2632                                 (test > 0) ? "Failed to query test: %s\n" :
2633                                              "Failed to query batch: %s\n",
2634                                 strerror(errno));
2635                 return -1;
2636         }
2637
2638         if (verbose) {
2639                 /* list nodes in test or batch */
2640                 rc = lst_list_tsb_nodes(batch, test, server,
2641                                         server ? ent.tbe_srv_nle.nle_nnode :
2642                                                  ent.tbe_cli_nle.nle_nnode,
2643                                         active, invalid);
2644                 return rc;
2645         }
2646
2647         /* only show number of hosts in batch or test */
2648         if (test == 0) {
2649                 fprintf(stdout, "Batch: %s Tests: %d State: %d\n",
2650                         batch, ent.u.tbe_batch.bae_ntest,
2651                         ent.u.tbe_batch.bae_state);
2652                 ntest = ent.u.tbe_batch.bae_ntest;
2653                 test = 1; /* starting from test 1 */
2654
2655         } else {
2656                 fprintf(stdout,
2657                         "\tTest %d(%s) (loop: %d, concurrency: %d)\n",
2658                         test, lst_test_type2name(ent.u.tbe_test.tse_type),
2659                         ent.u.tbe_test.tse_loop,
2660                         ent.u.tbe_test.tse_concur);
2661                 ntest --;
2662                 test ++;
2663         }
2664
2665         fprintf(stdout, LST_NODES_TITLE);
2666         fprintf(stdout, "client\t%d\t%d\t%d\t%d\t%d\n"
2667                         "server\t%d\t%d\t%d\t%d\t%d\n",
2668                 ent.tbe_cli_nle.nle_nactive,
2669                 ent.tbe_cli_nle.nle_nbusy,
2670                 ent.tbe_cli_nle.nle_ndown,
2671                 ent.tbe_cli_nle.nle_nunknown,
2672                 ent.tbe_cli_nle.nle_nnode,
2673                 ent.tbe_srv_nle.nle_nactive,
2674                 ent.tbe_srv_nle.nle_nbusy,
2675                 ent.tbe_srv_nle.nle_ndown,
2676                 ent.tbe_srv_nle.nle_nunknown,
2677                 ent.tbe_srv_nle.nle_nnode);
2678
2679         if (ntest != 0)
2680                 goto loop;
2681
2682         return 0;
2683 }
2684
2685 int
2686 lst_query_batch_ioctl(char *batch, int test, int server,
2687                       int timeout, struct list_head *head)
2688 {
2689         struct lstio_batch_query_args args = { 0 };
2690
2691         args.lstio_bat_key     = session_key;
2692         args.lstio_bat_testidx = test;
2693         args.lstio_bat_client  = !(server);
2694         args.lstio_bat_timeout = timeout;
2695         args.lstio_bat_nmlen   = strlen(batch);
2696         args.lstio_bat_namep   = batch;
2697         args.lstio_bat_resultp = head;
2698
2699         return lst_ioctl(LSTIO_BATCH_QUERY, &args, sizeof(args));
2700 }
2701
2702 void
2703 lst_print_tsb_verbose(struct list_head *head,
2704                       int active, int idle, int error)
2705 {
2706         struct lstcon_rpc_ent *ent;
2707
2708         list_for_each_entry(ent, head, rpe_link) {
2709                 if (ent->rpe_priv[0] == 0 && active)
2710                         continue;
2711
2712                 if (ent->rpe_priv[0] != 0 && idle)
2713                         continue;
2714
2715                 if (ent->rpe_fwk_errno == 0 && error)
2716                         continue;
2717
2718                 fprintf(stdout, "%s [%s]: %s\n",
2719                         libcfs_id2str(ent->rpe_peer),
2720                         lst_node_state2str(ent->rpe_state),
2721                         ent->rpe_rpc_errno != 0 ?
2722                                 strerror(ent->rpe_rpc_errno) :
2723                                 (ent->rpe_priv[0] > 0 ? "Running" : "Idle"));
2724         }
2725 }
2726
2727 int
2728 jt_lst_query_batch(int argc, char **argv)
2729 {
2730         struct lstcon_test_batch_ent ent;
2731         struct list_head head;
2732         char   *batch   = NULL;
2733         time_t  last    = 0;
2734         int     optidx  = 0;
2735         int     verbose = 0;
2736         int     server  = 0;
2737         int     timeout = 5; /* default 5 seconds */
2738         int     delay   = 5; /* default 5 seconds */
2739         int     loop    = 1; /* default 1 loop */
2740         int     active  = 0;
2741         int     error   = 0;
2742         int     idle    = 0;
2743         int     count   = 0;
2744         int     test    = 0;
2745         int     rc      = 0;
2746         int     c       = 0;
2747         int     i;
2748
2749         static const struct option query_batch_opts[] = {
2750                 { .name = "timeout", .has_arg = required_argument, .val = 'o' },
2751                 { .name = "delay",   .has_arg = required_argument, .val = 'd' },
2752                 { .name = "loop",    .has_arg = required_argument, .val = 'c' },
2753                 { .name = "test",    .has_arg = required_argument, .val = 't' },
2754                 { .name = "server",  .has_arg = no_argument,       .val = 's' },
2755                 { .name = "active",  .has_arg = no_argument,       .val = 'a' },
2756                 { .name = "idle",    .has_arg = no_argument,       .val = 'i' },
2757                 { .name = "error",   .has_arg = no_argument,       .val = 'e' },
2758                 { .name = "all",     .has_arg = no_argument,       .val = 'l' },
2759                 { .name = NULL, } };
2760
2761         if (session_key == 0) {
2762                 fprintf(stderr,
2763                         "Can't find env LST_SESSION or value is not valid\n");
2764                 return -1;
2765         }
2766
2767         while (1) {
2768                 c = getopt_long(argc, argv, "o:d:c:t:saiel",
2769                                 query_batch_opts, &optidx);
2770
2771                 /* Detect the end of the options. */
2772                 if (c == -1)
2773                         break;
2774
2775                 switch (c) {
2776                 case 'o':
2777                         timeout = atoi(optarg);
2778                         break;
2779                 case 'd':
2780                         delay = atoi(optarg);
2781                         break;
2782                 case 'c':
2783                         loop = atoi(optarg);
2784                         break;
2785                 case 't':
2786                         test = atoi(optarg);
2787                         break;
2788                 case 's':
2789                         server = 1;
2790                         break;
2791                 case 'a':
2792                         active = verbose = 1;
2793                         break;
2794                 case 'i':
2795                         idle = verbose = 1;
2796                         break;
2797                 case 'e':
2798                         error = verbose = 1;
2799                         break;
2800                 case 'l':
2801                         verbose = 1;
2802                         break;
2803                 default:
2804                         lst_print_usage(argv[0]);
2805                         return -1;
2806                 }
2807         }
2808
2809         if (test < 0 || timeout <= 0 || delay <= 0 || loop <= 0) {
2810                 lst_print_usage(argv[0]);
2811                 return -1;
2812         }
2813
2814         if (optind == argc) {
2815                 batch = LST_DEFAULT_BATCH;
2816
2817         } else if (optind == argc - 1) {
2818                 batch = argv[optind];
2819
2820         } else {
2821                 lst_print_usage(argv[0]);
2822                 return -1;
2823         }
2824
2825
2826         INIT_LIST_HEAD(&head);
2827
2828         if (verbose) {
2829                 rc = lst_info_batch_ioctl(batch, test, server,
2830                                           &ent, NULL, NULL, NULL);
2831                 if (rc != 0) {
2832                         fprintf(stderr, "Failed to query %s [%d]: %s\n",
2833                                 batch, test, strerror(errno));
2834                         return -1;
2835                 }
2836
2837                 count = server ? ent.tbe_srv_nle.nle_nnode :
2838                                  ent.tbe_cli_nle.nle_nnode;
2839                 if (count == 0) {
2840                         fprintf(stdout, "Batch or test is empty\n");
2841                         return 0;
2842                 }
2843         }
2844
2845         rc = lst_alloc_rpcent(&head, count, 0);
2846         if (rc != 0) {
2847                 fprintf(stderr, "Out of memory\n");
2848                 return rc;
2849         }
2850
2851         for (i = 0; i < loop; i++) {
2852                 time_t  now = time(NULL);
2853
2854                 if (now - last < delay) {
2855                         sleep(delay - now + last);
2856                         time(&now);
2857                 }
2858
2859                 last = now;
2860
2861                 rc = lst_query_batch_ioctl(batch, test,
2862                                            server, timeout, &head);
2863                 if (rc == -1) {
2864                         fprintf(stderr, "Failed to query batch: %s\n",
2865                                 strerror(errno));
2866                         break;
2867                 }
2868
2869                 if (verbose) {
2870                         /* Verbose mode */
2871                         lst_print_tsb_verbose(&head, active, idle, error);
2872                         continue;
2873                 }
2874
2875                 fprintf(stdout, "%s [%d] ", batch, test);
2876
2877                 if (lstcon_rpc_stat_failure(&trans_stat, 0) != 0) {
2878                         fprintf(stdout, "%d of %d nodes are unknown, ",
2879                                 lstcon_rpc_stat_failure(&trans_stat, 0),
2880                                 lstcon_rpc_stat_total(&trans_stat, 0));
2881                 }
2882
2883                 if (lstcon_rpc_stat_failure(&trans_stat, 0) == 0 &&
2884                     lstcon_tsbqry_stat_run(&trans_stat, 0)  == 0  &&
2885                     lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0) {
2886                         fprintf(stdout, "is stopped\n");
2887                         continue;
2888                 }
2889
2890                 if (lstcon_rpc_stat_failure(&trans_stat, 0) == 0 &&
2891                     lstcon_tsbqry_stat_idle(&trans_stat, 0) == 0 &&
2892                     lstcon_tsbqry_stat_failure(&trans_stat, 0) == 0) {
2893                         fprintf(stdout, "is running\n");
2894                         continue;
2895                 }
2896
2897                 fprintf(stdout, "stopped: %d , running: %d, failed: %d\n",
2898                                 lstcon_tsbqry_stat_idle(&trans_stat, 0),
2899                                 lstcon_tsbqry_stat_run(&trans_stat, 0),
2900                                 lstcon_tsbqry_stat_failure(&trans_stat, 0));
2901         }
2902
2903         lst_free_rpcent(&head);
2904
2905         return rc;
2906 }
2907
/*
 * Parse one strictly positive decimal integer starting at @str.
 *
 * On success the value is stored in *@out, *@endp points at the first
 * character after the number and 0 is returned.  Returns -1 when there are
 * no digits, or the value is not positive or does not fit in an int.
 */
static int
lst_parse_positive_int(const char *str, char **endp, int *out)
{
        /* largest int value, derived without needing <limits.h> */
        const long int_max = (long)(~0U >> 1);
        long       val;

        errno = 0;
        val = strtol(str, endp, 10);
        if (*endp == str || errno == ERANGE)
                return -1;

        if (val <= 0 || val > int_max)
                return -1;

        *out = (int)val;
        return 0;
}

/*
 * Parse a distribution specification of the form "DIST:SPAN".
 *
 * Both numbers must be positive decimal integers that fit in an int, the
 * ':' must directly follow DIST and nothing may follow SPAN.  Unlike an
 * atoi()-based parse, malformed strings such as "3x:2" or "3:2junk" and
 * out-of-range values are rejected instead of being silently accepted.
 *
 * @dstr  string to parse
 * @dist  receives DIST on success
 * @span  receives SPAN on success
 *
 * Returns 0 on success, -1 on any parse error; *@dist and *@span are only
 * written on success.
 */
int
lst_parse_distribute(char *dstr, int *dist, int *span)
{
        char *end = NULL;
        int   d;
        int   s;

        if (dstr == NULL)
                return -1;

        if (lst_parse_positive_int(dstr, &end, &d) != 0 || *end != ':')
                return -1;

        if (lst_parse_positive_int(end + 1, &end, &s) != 0 || *end != '\0')
                return -1;

        *dist = d;
        *span = s;

        return 0;
}
2925
2926 int
2927 lst_get_bulk_param(int argc, char **argv, struct lst_test_bulk_param *bulk)
2928 {
2929         char   *tok = NULL;
2930         char   *end = NULL;
2931         int     rc  = 0;
2932         int     i   = 0;
2933
2934         bulk->blk_size  = 4096;
2935         bulk->blk_opc   = LST_BRW_READ;
2936         bulk->blk_flags = LST_BRW_CHECK_NONE;
2937         bulk->blk_srv_off = bulk->blk_cli_off = 0;
2938
2939         while (i < argc) {
2940                 if (strcasestr(argv[i], "check=") == argv[i] ||
2941                     strcasestr(argv[i], "c=") == argv[i]) {
2942                         tok = strchr(argv[i], '=') + 1;
2943
2944                         if (strcasecmp(tok, "full") == 0) {
2945                                 bulk->blk_flags = LST_BRW_CHECK_FULL;
2946                         } else if (strcasecmp(tok, "simple") == 0) {
2947                                 bulk->blk_flags = LST_BRW_CHECK_SIMPLE;
2948                         } else {
2949                                 fprintf(stderr, "Unknow flag %s\n", tok);
2950                                 return -1;
2951                         }
2952
2953                 } else if (strcasestr(argv[i], "size=") == argv[i] ||
2954                            strcasestr(argv[i], "s=") == argv[i]) {
2955                         int max_size = sysconf(_SC_PAGESIZE) * LNET_MAX_IOV;
2956
2957                         tok = strchr(argv[i], '=') + 1;
2958
2959                         bulk->blk_size = strtol(tok, &end, 0);
2960                         if (bulk->blk_size <= 0) {
2961                                 fprintf(stderr, "Invalid size %s\n", tok);
2962                                 return -1;
2963                         }
2964
2965                         if (end == NULL)
2966                                 return 0;
2967
2968                         if (*end == 'k' || *end == 'K')
2969                                 bulk->blk_size *= 1024;
2970                         else if (*end == 'm' || *end == 'M')
2971                                 bulk->blk_size *= 1024 * 1024;
2972
2973                         if (bulk->blk_size > max_size) {
2974                                 fprintf(stderr, "Size exceed limitation: %d bytes\n",
2975                                         bulk->blk_size);
2976                                 return -1;
2977                         }
2978
2979                 } else if (strcasestr(argv[i], "off=") == argv[i]) {
2980                         int     off;
2981
2982                         tok = strchr(argv[i], '=') + 1;
2983
2984                         off = strtol(tok, &end, 0);
2985                         /* NB: align with sizeof(__u64) to simplify page
2986                          * checking implementation */
2987                         if (off < 0 || off % sizeof(__u64) != 0) {
2988                                 fprintf(stderr,
2989                                         "Invalid offset %s/%d, it should be "
2990                                         "postive value and multiple of %d\n",
2991                                         tok, off, (int)sizeof(__u64));
2992                                 return -1;
2993                         }
2994
2995                         /* NB: blk_srv_off is reserved so far */
2996                         bulk->blk_cli_off = bulk->blk_srv_off = off;
2997                         if (end == NULL)
2998                                 return 0;
2999
3000                 } else if (strcasecmp(argv[i], "read") == 0 ||
3001                            strcasecmp(argv[i], "r") == 0) {
3002                         bulk->blk_opc = LST_BRW_READ;
3003
3004                 } else if (strcasecmp(argv[i], "write") == 0 ||
3005                            strcasecmp(argv[i], "w") == 0) {
3006                         bulk->blk_opc = LST_BRW_WRITE;
3007
3008                 } else {
3009                         fprintf(stderr, "Unknow parameter: %s\n", argv[i]);
3010                         return -1;
3011                 }
3012
3013                 i++;
3014         }
3015
3016         return rc;
3017 }
3018
3019 int
3020 lst_get_test_param(char *test, int argc, char **argv, void **param, int *plen)
3021 {
3022         struct lst_test_bulk_param *bulk = NULL;
3023         int                    type;
3024
3025         type = lst_test_name2type(test);
3026         if (type < 0) {
3027                 fprintf(stderr, "Unknow test name %s\n", test);
3028                 return -1;
3029         }
3030
3031         switch (type) {
3032         case LST_TEST_PING:
3033                 break;
3034
3035         case LST_TEST_BULK:
3036                 bulk = malloc(sizeof(*bulk));
3037                 if (bulk == NULL) {
3038                         fprintf(stderr, "Out of memory\n");
3039                         return -1;
3040                 }
3041
3042                 memset(bulk, 0, sizeof(*bulk));
3043
3044                 if (lst_get_bulk_param(argc, argv, bulk) != 0) {
3045                         free(bulk);
3046                         return -1;
3047                 }
3048
3049                 *param = bulk;
3050                 *plen  = sizeof(*bulk);
3051
3052                 break;
3053
3054         default:
3055                 break;
3056         }
3057
3058         /* TODO: parse more parameter */
3059         return type;
3060 }
3061
3062 int
3063 lst_add_test_ioctl(char *batch, int type, int loop, int concur,
3064                    int dist, int span, char *sgrp, char *dgrp,
3065                    void *param, int plen, int *retp, struct list_head *resultp)
3066 {
3067         struct lstio_test_args args = { 0 };
3068
3069         args.lstio_tes_key        = session_key;
3070         args.lstio_tes_bat_nmlen  = strlen(batch);
3071         args.lstio_tes_bat_name   = batch;
3072         args.lstio_tes_type       = type;
3073         args.lstio_tes_oneside    = 0;
3074         args.lstio_tes_loop       = loop;
3075         args.lstio_tes_concur     = concur;
3076         args.lstio_tes_dist       = dist;
3077         args.lstio_tes_span       = span;
3078         args.lstio_tes_sgrp_nmlen = strlen(sgrp);
3079         args.lstio_tes_sgrp_name  = sgrp;
3080         args.lstio_tes_dgrp_nmlen = strlen(dgrp);
3081         args.lstio_tes_dgrp_name  = dgrp;
3082         args.lstio_tes_param_len  = plen;
3083         args.lstio_tes_param      = param;
3084         args.lstio_tes_retp       = retp;
3085         args.lstio_tes_resultp    = resultp;
3086
3087         return lst_ioctl(LSTIO_TEST_ADD, &args, sizeof(args));
3088 }
3089
3090 int
3091 jt_lst_add_test(int argc, char **argv)
3092 {
3093         struct list_head head;
3094         char *batch  = NULL;
3095         char *test   = NULL;
3096         char *dstr   = NULL;
3097         char *from   = NULL;
3098         char *to     = NULL;
3099         void *param  = NULL;
3100         int   optidx = 0;
3101         int   concur = 1;
3102         int   loop   = -1;
3103         int   dist   = 1;
3104         int   span   = 1;
3105         int   plen   = 0;
3106         int   fcount = 0;
3107         int   tcount = 0;
3108         int   ret    = 0;
3109         int   type;
3110         int   rc;
3111         int   c;
3112
3113         static const struct option add_test_opts[] = {
3114         { .name = "batch",       .has_arg = required_argument, .val = 'b' },
3115         { .name = "concurrency", .has_arg = required_argument, .val = 'c' },
3116         { .name = "distribute",  .has_arg = required_argument, .val = 'd' },
3117         { .name = "from",        .has_arg = required_argument, .val = 'f' },
3118         { .name = "to",          .has_arg = required_argument, .val = 't' },
3119         { .name = "loop",        .has_arg = required_argument, .val = 'l' },
3120         { .name = NULL } };
3121
3122         if (session_key == 0) {
3123                 fprintf(stderr,
3124                         "Can't find env LST_SESSION or value is not valid\n");
3125                 return -1;
3126         }
3127
3128         while (1) {
3129                 c = getopt_long(argc, argv, "b:c:d:f:l:t:",
3130                                 add_test_opts, &optidx);
3131
3132                 /* Detect the end of the options. */
3133                 if (c == -1)
3134                         break;
3135
3136                 switch (c) {
3137                 case 'b':
3138                         batch = optarg;
3139                         break;
3140                 case 'c':
3141                         concur = atoi(optarg);
3142                         break;
3143                 case 'd':
3144                         dstr = optarg;
3145                         break;
3146                 case 'f':
3147                         from = optarg;
3148                         break;
3149                 case 'l':
3150                         loop = atoi(optarg);
3151                         break;
3152                 case 't':
3153                         to = optarg;
3154                         break;
3155                 default:
3156                         lst_print_usage(argv[0]);
3157                         return -1;
3158                 }
3159         }
3160
3161         if (optind == argc || from == NULL || to == NULL) {
3162                 lst_print_usage(argv[0]);
3163                 return -1;
3164         }
3165
3166         if (concur <= 0 || concur > LST_MAX_CONCUR) {
3167                 fprintf(stderr, "Invalid concurrency of test: %d\n", concur);
3168                 return -1;
3169         }
3170
3171         if (batch == NULL)
3172                 batch = LST_DEFAULT_BATCH;
3173
3174         if (dstr != NULL) {
3175                 rc = lst_parse_distribute(dstr, &dist, &span);
3176                 if (rc != 0) {
3177                         fprintf(stderr, "Invalid distribution: %s\n", dstr);
3178                         return -1;
3179                 }
3180         }
3181
3182         test = argv[optind++];
3183
3184         argc -= optind;
3185         argv += optind;
3186
3187         type = lst_get_test_param(test, argc, argv, &param, &plen);
3188         if (type < 0) {
3189                 fprintf(stderr, "Failed to add test (%s)\n", test);
3190                 return -1;
3191         }
3192
3193         INIT_LIST_HEAD(&head);
3194
3195         rc = lst_get_node_count(LST_OPC_GROUP, from, &fcount, NULL);
3196         if (rc != 0) {
3197                 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
3198                         from, strerror(errno));
3199                 goto out;
3200         }
3201
3202         rc = lst_get_node_count(LST_OPC_GROUP, to, &tcount, NULL);
3203         if (rc != 0) {
3204                 fprintf(stderr, "Can't get count of nodes from %s: %s\n",
3205                         to, strerror(errno));
3206                 goto out;
3207         }
3208
3209         rc = lst_alloc_rpcent(&head, fcount > tcount ? fcount : tcount, 0);
3210         if (rc != 0) {
3211                 fprintf(stderr, "Out of memory\n");
3212                 goto out;
3213         }
3214
3215         rc = lst_add_test_ioctl(batch, type, loop, concur,
3216                                 dist, span, from, to, param, plen, &ret, &head);
3217
3218         if (rc == 0) {
3219                 fprintf(stdout, "Test was added successfully\n");
3220                 if (ret != 0) {
3221                         fprintf(stdout, "Server group contains userland test "
3222                                 "nodes, old version of tcplnd can't accept "
3223                                 "connection request\n");
3224                 }
3225
3226                 goto out;
3227         }
3228
3229         if (rc == -1) {
3230                 lst_print_error("test", "Failed to add test: %s\n",
3231                                 strerror(errno));
3232                 goto out;
3233         }
3234
3235         lst_print_transerr(&head, "add test");
3236 out:
3237         lst_free_rpcent(&head);
3238
3239         if (param != NULL)
3240                 free(param);
3241
3242         return rc;
3243 }
3244
3245 static command_t lst_cmdlist[] = {
3246         {"new_session",         jt_lst_new_session,     NULL,
3247          "Usage: lst new_session [--timeout TIME] [--force] [NAME]"                     },
3248         {"end_session",         jt_lst_end_session,     NULL,
3249          "Usage: lst end_session"                                                       },
3250         {"show_session",        jt_lst_show_session,    NULL,
3251          "Usage: lst show_session"                                                      },
3252         {"ping",                jt_lst_ping ,           NULL,
3253          "Usage: lst ping  [--group NAME] [--batch NAME] [--session] [--nodes IDS]"     },
3254         {"add_group",           jt_lst_add_group,       NULL,
3255          "Usage: lst group NAME IDs [IDs]..."                                           },
3256         {"del_group",           jt_lst_del_group,       NULL,
3257          "Usage: lst del_group NAME"                                                    },
3258         {"update_group",        jt_lst_update_group,    NULL,
3259          "Usage: lst update_group NAME [--clean] [--refresh] [--remove IDs]"            },
3260         {"list_group",          jt_lst_list_group,      NULL,
3261           "Usage: lst list_group [--active] [--busy] [--down] [--unknown] GROUP ..."    },
3262         {"stat",                jt_lst_stat,            NULL,
3263          "Usage: lst stat [--bw] [--rate] [--read] [--write] [--max] [--min] [--avg] "
3264          " [--mbs] [--timeout #] [--delay #] [--count #] GROUP [GROUP]"                 },
3265         {"show_error",          jt_lst_show_error,      NULL,
3266          "Usage: lst show_error NAME | IDS ..."                                         },
3267         {"add_batch",           jt_lst_add_batch,       NULL,
3268          "Usage: lst add_batch NAME"                                                    },
3269         {"run",                 jt_lst_start_batch,     NULL,
3270          "Usage: lst run [--timeout TIME] [NAME]"                                       },
3271         {"stop",                jt_lst_stop_batch,      NULL,
3272          "Usage: lst stop [--force] BATCH_NAME"                                         },
3273         {"list_batch",          jt_lst_list_batch,      NULL,
3274          "Usage: lst list_batch NAME [--test ID] [--server]"                            },
3275         {"query",               jt_lst_query_batch,     NULL,
3276          "Usage: lst query [--test ID] [--server] [--timeout TIME] NAME"                },
3277         {"add_test",            jt_lst_add_test,        NULL,
3278          "Usage: lst add_test [--batch BATCH] [--loop #] [--concurrency #] "
3279          " [--distribute #:#] [--from GROUP] [--to GROUP] TEST..."                      },
3280         {"help",                Parser_help,            0,     "help"                   },
3281         {"--list-commands",     lst_list_commands,      0,     "list commands"          },
3282         {0,                     0,                      0,      NULL                    }
3283 };
3284
3285 int
3286 lst_initialize(void)
3287 {
3288         char   *key;
3289         char   *feats;
3290
3291         feats = getenv("LST_FEATURES");
3292         if (feats != NULL)
3293                 session_features = strtol(feats, NULL, 16);
3294
3295         if ((session_features & ~LST_FEATS_MASK) != 0) {
3296                 fprintf(stderr,
3297                         "Unsupported session features %x, "
3298                         "only support these features so far: %x\n",
3299                         (session_features & ~LST_FEATS_MASK), LST_FEATS_MASK);
3300                 return -1;
3301         }
3302
3303         key = getenv("LST_SESSION");
3304
3305         if (key == NULL) {
3306                 session_key = 0;
3307                 return 0;
3308         }
3309
3310         session_key = atoi(key);