4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License version 2 for more details. A copy is
14 * included in the COPYING file that accompanied this code.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 * Copyright (c) 2012, 2016, Intel Corporation.
26 * lustre/utils/lustre_lfsck.c
28 * Lustre user-space tools for LFSCK.
30 * Author: Fan Yong <yong.fan@whamcloud.com>
#include <errno.h>
#include <limits.h>
#include <stdlib.h>
#include <sys/ioctl.h>

#include <lustre/lustre_lfsck_user.h>
#include <lnet/lnetctl.h>
#include <lustre_ioctl.h>
/* Needs to be last to avoid clashes */
#include <libcfs/util/ioctl.h>
#include <libcfs/util/param.h>
/*
 * Long options understood by jt_lfsck_start().
 *
 * Options spelled with underscores also have a dash-spelled alias that maps
 * to the same short option. The final all-zero entry is the terminator that
 * getopt_long() requires to find the end of the table.
 */
static const struct option long_opt_start[] = {
	{ "device",              required_argument, NULL, 'M' },
	{ "all",                 no_argument,       NULL, 'A' },
	{ "create_ostobj",       optional_argument, NULL, 'c' },
	{ "create-ostobj",       optional_argument, NULL, 'c' },
	{ "create_mdtobj",       optional_argument, NULL, 'C' },
	{ "create-mdtobj",       optional_argument, NULL, 'C' },
	{ "delay_create_ostobj", optional_argument, NULL, 'd' },
	{ "delay-create-ostobj", optional_argument, NULL, 'd' },
	{ "error",               required_argument, NULL, 'e' },
	{ "help",                no_argument,       NULL, 'h' },
	{ "dryrun",              optional_argument, NULL, 'n' },
	{ "orphan",              no_argument,       NULL, 'o' },
	{ "reset",               no_argument,       NULL, 'r' },
	{ "speed",               required_argument, NULL, 's' },
	{ "type",                required_argument, NULL, 't' },
	{ "window_size",         required_argument, NULL, 'w' },
	{ "window-size",         required_argument, NULL, 'w' },
	{ NULL,                  0,                 NULL, 0 }
};
/*
 * Long options understood by jt_lfsck_stop().
 * The final all-zero entry terminates the table for getopt_long().
 */
static const struct option long_opt_stop[] = {
	{ "device", required_argument, NULL, 'M' },
	{ "all",    no_argument,       NULL, 'A' },
	{ "help",   no_argument,       NULL, 'h' },
	{ NULL,     0,                 NULL, 0 }
};
/*
 * Long options understood by jt_lfsck_query().
 * The final all-zero entry terminates the table for getopt_long().
 */
static const struct option long_opt_query[] = {
	{ "device", required_argument, NULL, 'M' },
	{ "type",   required_argument, NULL, 't' },
	{ "help",   no_argument,       NULL, 'h' },
	{ "wait",   no_argument,       NULL, 'w' },
	{ NULL,     0,                 NULL, 0 }
};
87 struct lfsck_type_name {
89 enum lfsck_type ltn_type;
92 static struct lfsck_type_name lfsck_types_names[] = {
93 { "scrub", LFSCK_TYPE_SCRUB },
94 { "layout", LFSCK_TYPE_LAYOUT },
95 { "namespace", LFSCK_TYPE_NAMESPACE },
96 { "default", LFSCK_TYPES_DEF },
97 { "all", LFSCK_TYPES_SUPPORTED },
101 static enum lfsck_type lfsck_name2type(const char *name)
105 for (i = 0; lfsck_types_names[i].ltn_name != NULL; i++) {
106 if (strcmp(lfsck_types_names[i].ltn_name, name) == 0)
107 return lfsck_types_names[i].ltn_type;
112 static const char *lfsck_type2name(__u16 type)
116 for (i = 0; lfsck_types_names[i].ltn_name != NULL; i++) {
117 if (type == lfsck_types_names[i].ltn_type)
118 return lfsck_types_names[i].ltn_name;
124 static void usage_start(void)
126 fprintf(stderr, "start LFSCK\n"
128 "lfsck_start [-M | --device {MDT,OST}_device]\n"
129 " [-A | --all] [-c | --create_ostobj [on | off]]\n"
130 " [-C | --create_mdtobj [on | off]]\n"
131 " [-d | --delay_create_ostobj [on | off]]\n"
132 " [-e | --error {continue | abort}] [-h | --help]\n"
133 " [-n | --dryrun [on | off]] [-o | --orphan]\n"
134 " [-r | --reset] [-s | --speed ops_per_sec_limit]\n"
135 " [-t | --type check_type[,check_type...]]\n"
136 " [-w | --window_size size]\n"
138 "-M: device to start LFSCK/scrub on\n"
139 "-A: start LFSCK on all nodes via the specified MDT device "
140 "(see \"-M\" option) by single LFSCK command\n"
141 "-c: create the lost OST-object for dangling LOV EA "
142 "(default 'off', or 'on')\n"
143 "-C: create the lost MDT-object for dangling name entry "
144 "(default 'off', or 'on')\n"
145 "-d: delay create the lost OST-object for dangling LOV EA "
146 "until orphan OST-objects handled (default 'off', or 'on')\n"
147 "-e: error handle mode (default 'continue', or 'abort')\n"
148 "-h: this help message\n"
149 "-n: check with no modification (default 'off', or 'on')\n"
150 "-o: repair orphan OST-objects\n"
151 "-r: reset scanning to the start of the device\n"
152 "-s: maximum items to be scanned per second "
153 "(default '%d' = no limit)\n"
154 "-t: check type(s) to be performed (default all)\n"
155 "-w: window size for async requests pipeline\n",
156 LFSCK_SPEED_NO_LIMIT);
/* Print the synopsis and option summary of "lfsck_stop" to stderr. */
static void usage_stop(void)
{
	fprintf(stderr, "stop LFSCK\n"
		"usage:\n"
		"lfsck_stop [-M | --device {MDT,OST}_device]\n"
		"           [-A | --all] [-h | --help]\n"
		"options:\n"
		"-M: device to stop LFSCK/scrub on\n"
		"-A: stop LFSCK on all nodes via the specified MDT device "
		"(see \"-M\" option) by single LFSCK command\n"
		"-h: this help message\n");
}
/* Print the synopsis and option summary of "lfsck_query" to stderr. */
static void usage_query(void)
{
	fprintf(stderr, "check the LFSCK global status\n"
		"usage:\n"
		"lfsck_query [-M | --device MDT_device] [-h | --help]\n"
		"            [-t | --type check_type[,check_type...]]\n"
		"            [-w | --wait]\n"
		"options:\n"
		"-M: device to query LFSCK on\n"
		"-t: LFSCK type(s) to be queried (default is all)\n"
		"-h: this help message\n"
		"-w: do not return until LFSCK not running\n");
}
186 static int lfsck_pack_dev(struct obd_ioctl_data *data, char *device, char *arg)
188 int len = strlen(arg) + 1;
190 if (len > MAX_OBD_NAME) {
191 fprintf(stderr, "device name is too long. "
192 "Valid length should be less than %d\n", MAX_OBD_NAME);
196 memcpy(device, arg, len);
197 data->ioc_inlbuf4 = device;
198 data->ioc_inllen4 = len;
199 data->ioc_dev = OBD_DEV_BY_DEVNAME;
203 static int lfsck_get_dev_name(struct obd_ioctl_data *data, char *device,
204 int types, bool multipe_devices)
206 glob_t param = { 0 };
211 rc = cfs_get_param_paths(¶m, "mdd/*-MDT*");
213 if (multipe_devices || errno != ENOENT ||
214 types & LFSCK_TYPE_NAMESPACE) {
215 fprintf(stderr, "Fail to get device name: rc = %d\n."
216 "You can specify the device explicitly "
217 "via '-M' option.\n", rc);
221 rc = cfs_get_param_paths(¶m, "obdfilter/*-OST*");
223 fprintf(stderr, "Fail to get device name: rc = %d\n."
224 "You can specify the device explicitly "
225 "via '-M' option.\n", rc);
230 if (param.gl_pathc == 1)
233 if (!multipe_devices) {
235 "Detect multiple devices on current node. "
236 "Please specify the device explicitly "
237 "via '-M' option or '-A' option for all.\n");
242 ptr = strrchr(param.gl_pathv[0], '-');
243 LASSERT(ptr != NULL);
245 for (i = 1; i < param.gl_pathc; i++) {
246 char *ptr2 = strrchr(param.gl_pathv[i], '-');
248 LASSERT(ptr2 != NULL);
250 if ((ptr - param.gl_pathv[0]) != (ptr2 - param.gl_pathv[i]) ||
251 strncmp(param.gl_pathv[0], param.gl_pathv[i],
252 (ptr - param.gl_pathv[0])) != 0) {
254 "Detect multiple filesystems on current node. "
255 "Please specify the device explicitly "
256 "via '-M' option.\n");
263 rc = lfsck_pack_dev(data, device, basename(param.gl_pathv[0]));
266 cfs_free_param_data(¶m);
271 int jt_lfsck_start(int argc, char **argv)
273 struct obd_ioctl_data data;
274 char rawbuf[MAX_IOC_BUFLEN], *buf = rawbuf;
275 char device[MAX_OBD_NAME];
276 struct lfsck_start start;
277 char *optstring = "Ac::C::d::e:hM:n::ors:t:w:";
278 int opt, index, rc, val, i;
280 memset(&data, 0, sizeof(data));
281 memset(&start, 0, sizeof(start));
282 memset(device, 0, MAX_OBD_NAME);
283 start.ls_version = LFSCK_VERSION_V1;
284 start.ls_active = LFSCK_TYPES_ALL;
286 /* Reset the 'optind' for the case of getopt_long() called multiple
287 * times under the same lctl. */
289 while ((opt = getopt_long(argc, argv, optstring, long_opt_start,
293 start.ls_flags |= LPF_ALL_TGT | LPF_BROADCAST;
296 if (optarg == NULL || strcmp(optarg, "on") == 0) {
297 start.ls_flags |= LPF_CREATE_OSTOBJ;
298 } else if (strcmp(optarg, "off") != 0) {
299 fprintf(stderr, "invalid switch: -c '%s'. "
300 "valid switches are:\n"
301 "empty ('on'), or 'off' without space. "
303 "'-c', '-con', '-coff'\n", optarg);
306 start.ls_valid |= LSV_CREATE_OSTOBJ;
309 if (optarg == NULL || strcmp(optarg, "on") == 0) {
310 start.ls_flags |= LPF_CREATE_MDTOBJ;
311 } else if (strcmp(optarg, "off") != 0) {
312 fprintf(stderr, "invalid switch: -C '%s'. "
313 "valid switches are:\n"
314 "empty ('on'), or 'off' without space. "
316 "'-C', '-Con', '-Coff'\n", optarg);
319 start.ls_valid |= LSV_CREATE_MDTOBJ;
322 if (optarg == NULL || strcmp(optarg, "on") == 0) {
323 start.ls_flags |= LPF_DELAY_CREATE_OSTOBJ;
324 } else if (strcmp(optarg, "off") != 0) {
325 fprintf(stderr, "invalid switch: -c '%s'. "
326 "valid switches are:\n"
327 "empty ('on'), or 'off' without space. "
329 "'-c', '-con', '-coff'\n", optarg);
332 start.ls_valid |= LSV_DELAY_CREATE_OSTOBJ;
335 if (strcmp(optarg, "abort") == 0) {
336 start.ls_flags |= LPF_FAILOUT;
337 } else if (strcmp(optarg, "continue") != 0) {
338 fprintf(stderr, "invalid error mode: -e '%s'."
340 "'continue' or 'abort'.\n", optarg);
343 start.ls_valid |= LSV_ERROR_HANDLE;
349 rc = lfsck_pack_dev(&data, device, optarg);
354 if (optarg == NULL || strcmp(optarg, "on") == 0) {
355 start.ls_flags |= LPF_DRYRUN;
356 } else if (strcmp(optarg, "off") != 0) {
357 fprintf(stderr, "invalid switch: -n '%s'. "
358 "valid switches are:\n"
359 "empty ('on'), or 'off' without space. "
361 "'-n', '-non', '-noff'\n", optarg);
364 start.ls_valid |= LSV_DRYRUN;
367 start.ls_flags |= LPF_ALL_TGT | LPF_BROADCAST |
371 start.ls_flags |= LPF_RESET;
375 start.ls_speed_limit = val;
376 start.ls_valid |= LSV_SPEED_LIMIT;
381 if (start.ls_active == LFSCK_TYPES_ALL)
383 while ((typename = strsep(&optarg, ",")) != NULL) {
384 enum lfsck_type type;
386 type = lfsck_name2type(typename);
389 start.ls_active |= type;
393 fprintf(stderr, "invalid check type -t '%s'. "
394 "valid types are:\n", typename);
395 for (i = 0; lfsck_types_names[i].ltn_name != NULL; i++)
396 fprintf(stderr, "%s%s", i != 0 ? "," : "",
397 lfsck_types_names[i].ltn_name);
398 fprintf(stderr, "\n");
403 if (val < 1 || val > LFSCK_ASYNC_WIN_MAX) {
405 "Invalid async window size that "
406 "may cause memory issues. The valid "
407 "range is [1 - %u].\n",
408 LFSCK_ASYNC_WIN_MAX);
412 start.ls_async_windows = val;
413 start.ls_valid |= LSV_ASYNC_WINDOWS;
416 fprintf(stderr, "Invalid option, '-h' for help.\n");
421 if (start.ls_active == LFSCK_TYPES_ALL)
422 start.ls_active = LFSCK_TYPES_DEF;
424 if (data.ioc_inlbuf4 == NULL) {
425 rc = lfsck_get_dev_name(&data, device, start.ls_active,
426 start.ls_flags & LPF_ALL_TGT);
431 data.ioc_inlbuf1 = (char *)&start;
432 data.ioc_inllen1 = sizeof(start);
433 memset(buf, 0, sizeof(rawbuf));
434 rc = obd_ioctl_pack(&data, &buf, sizeof(rawbuf));
436 fprintf(stderr, "Fail to pack ioctl data: rc = %d.\n", rc);
440 rc = l_ioctl(OBD_DEV_ID, OBD_IOC_START_LFSCK, buf);
442 perror("Fail to start LFSCK");
446 obd_ioctl_unpack(&data, buf, sizeof(rawbuf));
447 printf("Started LFSCK on the device %s: scrub", device);
448 for (i = 0; lfsck_types_names[i].ltn_name != NULL; i++) {
449 if (start.ls_active & lfsck_types_names[i].ltn_type) {
450 printf(" %s", lfsck_types_names[i].ltn_name);
451 start.ls_active &= ~lfsck_types_names[i].ltn_type;
454 if (start.ls_active != 0)
455 printf(" unknown(0x%x)", start.ls_active);
461 int jt_lfsck_stop(int argc, char **argv)
463 struct obd_ioctl_data data;
464 char rawbuf[MAX_IOC_BUFLEN], *buf = rawbuf;
465 char device[MAX_OBD_NAME];
466 struct lfsck_stop stop;
467 char *optstring = "AhM:";
470 memset(&data, 0, sizeof(data));
471 memset(&stop, 0, sizeof(stop));
472 memset(device, 0, MAX_OBD_NAME);
474 /* Reset the 'optind' for the case of getopt_long() called multiple
475 * times under the same lctl. */
477 while ((opt = getopt_long(argc, argv, optstring, long_opt_stop,
481 stop.ls_flags |= LPF_ALL_TGT | LPF_BROADCAST;
487 rc = lfsck_pack_dev(&data, device, optarg);
492 fprintf(stderr, "Invalid option, '-h' for help.\n");
497 if (data.ioc_inlbuf4 == NULL) {
498 rc = lfsck_get_dev_name(&data, device, 0,
499 stop.ls_flags & LPF_ALL_TGT);
504 data.ioc_inlbuf1 = (char *)&stop;
505 data.ioc_inllen1 = sizeof(stop);
506 memset(buf, 0, sizeof(rawbuf));
507 rc = obd_ioctl_pack(&data, &buf, sizeof(rawbuf));
509 fprintf(stderr, "Fail to pack ioctl data: rc = %d.\n", rc);
513 rc = l_ioctl(OBD_DEV_ID, OBD_IOC_STOP_LFSCK, buf);
515 perror("Fail to stop LFSCK");
519 printf("Stopped LFSCK on the device %s.\n", device);
523 int jt_lfsck_query(int argc, char **argv)
525 struct obd_ioctl_data data = { 0 };
526 char rawbuf[MAX_IOC_BUFLEN], *buf = rawbuf;
527 char device[MAX_OBD_NAME] = "";
528 struct lfsck_query query = { .lu_types = LFSCK_TYPES_ALL };
529 int opt, index, rc, i;
530 enum lfsck_type type;
532 while ((opt = getopt_long(argc, argv, "hM:t:w", long_opt_query,
539 rc = lfsck_pack_dev(&data, device, optarg);
546 if (query.lu_types == LFSCK_TYPES_ALL)
548 while ((typename = strsep(&optarg, ",")) != NULL) {
549 type = lfsck_name2type(typename);
552 query.lu_types |= type;
557 fprintf(stderr, "invalid LFSCK type -t '%s'. "
558 "valid types are:\n", typename);
559 for (i = 0; lfsck_types_names[i].ltn_name != NULL; i++)
560 fprintf(stderr, "%s%s", i != 0 ? "," : "",
561 lfsck_types_names[i].ltn_name);
562 fprintf(stderr, "\n");
566 query.lu_flags |= LPF_WAIT;
569 fprintf(stderr, "Invalid option, '-h' for help.\n");
575 if (data.ioc_inlbuf4 == NULL) {
576 rc = lfsck_get_dev_name(&data, device, 0, true);
581 data.ioc_inlbuf1 = (char *)&query;
582 data.ioc_inllen1 = sizeof(query);
583 memset(buf, 0, sizeof(rawbuf));
584 rc = obd_ioctl_pack(&data, &buf, sizeof(rawbuf));
586 fprintf(stderr, "Fail to pack ioctl data: rc = %d.\n", rc);
590 rc = l_ioctl(OBD_DEV_ID, OBD_IOC_QUERY_LFSCK, buf);
592 perror("Fail to query LFSCK");
596 obd_ioctl_unpack(&data, buf, sizeof(rawbuf));
597 for (i = 0, type = 1 << i; i < LFSCK_TYPE_BITS; i++, type = 1 << i) {
601 if (!(query.lu_types & type))
604 name = lfsck_type2name(type);
605 for (j = 0; j <= LS_MAX; j++)
606 printf("%s_mdts_%s: %d\n", name,
607 lfsck_status2name(j), query.lu_mdts_count[i][j]);
609 for (j = 0; j <= LS_MAX; j++)
610 printf("%s_osts_%s: %d\n", name,
611 lfsck_status2name(j), query.lu_osts_count[i][j]);
613 printf("%s_repaired: %llu\n", name, query.lu_repaired[i]);