4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.gnu.org/licenses/gpl-2.0.html
23 * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2011, 2016, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
30 * Lustre is a trademark of Sun Microsystems, Inc.
32 * lustre/utils/liblustreapi.c
34 * Author: Peter J. Braam <braam@clusterfs.com>
35 * Author: Phil Schwan <phil@clusterfs.com>
36 * Author: Robert Read <rread@clusterfs.com>
49 #include <sys/ioctl.h>
56 #include <sys/statfs.h>
57 #include <sys/syscall.h>
59 #include <sys/types.h>
60 #include <sys/xattr.h>
63 #include <libgen.h> /* for dirname() */
64 #ifdef HAVE_LINUX_UNISTD_H
65 #include <linux/unistd.h>
71 #include <libcfs/util/param.h>
72 #include <libcfs/util/string.h>
73 #include <lnet/lnetctl.h>
74 #include <lustre/lustreapi.h>
75 #include <lustre/lustre_ostid.h>
76 #include <lustre_ioctl.h>
77 #include "lustreapi_internal.h"
/* Verbosity threshold that llapi_error() and llapi_printf() compare the
 * masked message level against. */
79 static int llapi_msg_level = LLAPI_MSG_MAX;
/* Table of MDT directory hash names; the first entry is "none". */
81 char *mdt_hash_name[] = { "none",
82 LMV_HASH_NAME_ALL_CHARS,
83 LMV_HASH_NAME_FNV_1A_64 };
/* Set the message verbosity threshold.  Values below LLAPI_MSG_OFF are
 * stored as LLAPI_MSG_OFF and values above LLAPI_MSG_MAX as LLAPI_MSG_MAX. */
85 void llapi_msg_set_level(int level)
87 /* ensure level is in the good range */
88 if (level < LLAPI_MSG_OFF)
89 llapi_msg_level = LLAPI_MSG_OFF;
90 else if (level > LLAPI_MSG_MAX)
91 llapi_msg_level = LLAPI_MSG_MAX;
93 llapi_msg_level = level;
/* Return the current message verbosity threshold. */
96 int llapi_msg_get_level(void)
98 return llapi_msg_level;
/* Default error callback: writes the formatted message to stderr.  When the
 * LLAPI_MSG_NO_ERRNO bit is set in level the message is ended with a bare
 * newline; the other fprintf() appends strerror(err) and the numeric err. */
101 static void error_callback_default(enum llapi_message_level level, int err,
102 const char *fmt, va_list ap)
104 vfprintf(stderr, fmt, ap);
105 if (level & LLAPI_MSG_NO_ERRNO)
106 fprintf(stderr, "\n");
108 fprintf(stderr, ": %s (%d)\n", strerror(err), err);
/* Default info callback: writes the formatted message to stdout.  The
 * visible body does not reference level or err. */
111 static void info_callback_default(enum llapi_message_level level, int err,
112 const char *fmt, va_list ap)
114 vfprintf(stdout, fmt, ap);
/* Currently installed logging callbacks, initialised to
 * error_callback_default and info_callback_default. */
117 static llapi_log_callback_t llapi_error_callback = error_callback_default;
118 static llapi_log_callback_t llapi_info_callback = info_callback_default;
121 /* llapi_error will preserve errno */
/* Report an error through the installed error callback.  errno is sampled
 * into tmp_errno on entry.  The message is gated on
 * (level & LLAPI_MSG_MASK) versus llapi_msg_level, and err is handed to the
 * callback as abs(err), so either sign may be passed in. */
122 void llapi_error(enum llapi_message_level level, int err, const char *fmt, ...)
125 int tmp_errno = errno;
127 if ((level & LLAPI_MSG_MASK) > llapi_msg_level)
131 llapi_error_callback(level, abs(err), fmt, args);
136 /* llapi_printf will preserve errno */
/* Emit an informational message through the installed info callback.  errno
 * is sampled into tmp_errno on entry, the message is gated on
 * (level & LLAPI_MSG_MASK) versus llapi_msg_level, and the callback always
 * receives 0 as its err argument. */
137 void llapi_printf(enum llapi_message_level level, const char *fmt, ...)
140 int tmp_errno = errno;
142 if ((level & LLAPI_MSG_MASK) > llapi_msg_level)
146 llapi_info_callback(level, 0, fmt, args);
152 * Set a custom error logging function. Passing in NULL will reset the logging
153 * callback to its default value.
155 * This function returns the value of the old callback.
/* Replace the error callback.  The previous callback is captured in old
 * before llapi_error_callback is overwritten with either cb or
 * error_callback_default. */
157 llapi_log_callback_t llapi_error_callback_set(llapi_log_callback_t cb)
159 llapi_log_callback_t old = llapi_error_callback;
162 llapi_error_callback = cb;
164 llapi_error_callback = error_callback_default;
170 * Set a custom info logging function. Passing in NULL will reset the logging
171 * callback to its default value.
173 * This function returns the value of the old callback.
/* Replace the info callback.  The previous callback is captured in old
 * before llapi_info_callback is overwritten with either cb or
 * info_callback_default. */
175 llapi_log_callback_t llapi_info_callback_set(llapi_log_callback_t cb)
177 llapi_log_callback_t old = llapi_info_callback;
180 llapi_info_callback = cb;
182 llapi_info_callback = info_callback_default;
/*
 * Return floor(frac * units / frac_d) without overflowing 64 bits.
 *
 * Requires frac < frac_d and frac_d <= 10^18, so the running remainder
 * (always below 3 * frac_d) fits in an unsigned long long.  The product is
 * built one bit of units at a time, most significant bit first.
 */
static unsigned long long llapi_size_scale_frac(unsigned long long frac,
						unsigned long long frac_d,
						unsigned long long units)
{
	unsigned long long quot = 0, rem = 0;
	int bit;

	for (bit = 63; bit >= 0; bit--) {
		quot <<= 1;
		rem <<= 1;
		if ((units >> bit) & 1)
			rem += frac;
		while (rem >= frac_d) {
			rem -= frac_d;
			quot++;
		}
	}

	return quot;
}

/**
 * Parse a human-readable size such as "4096", "0x1000", "1.5M" or "2g".
 *
 * The integer part is read with strtoull() (base auto-detected).  An optional
 * decimal fraction and an optional single-character unit suffix may follow:
 * b (512-byte blocks, or bytes when \a bytes_spec is set), k/K, m/M, g/G,
 * t/T, p/P, e/E (powers of 1024).
 *
 * \param optarg      NUL-terminated text to parse; a leading '-' is rejected
 * \param size        receives the size in bytes
 * \param size_units  in: multiplier applied when no suffix is given; it is
 *                    to be initialized (or zeroed) by the caller, and 0 is
 *                    treated as 1.  out: the multiplier actually applied
 * \param bytes_spec  non-zero if a 'b' suffix means bytes rather than
 *                    512-byte blocks
 *
 * \retval 0   success
 * \retval -1  malformed input, or the value does not fit in 64 bits; the
 *             outputs are left unmodified
 */
int llapi_parse_size(const char *optarg, unsigned long long *size,
		     unsigned long long *size_units, int bytes_spec)
{
	/* 10^18 is the largest power of ten the scaling helper can handle;
	 * further digits cannot change a byte count by more than 1 anyway. */
	enum { FRAC_DIGITS_MAX = 18 };
	unsigned long long frac = 0, frac_d = 1;
	unsigned long long whole, units, frac_part;
	char *num_end;
	const char *end;

	if (strncmp(optarg, "-", 1) == 0)
		return -1;

	units = *size_units != 0 ? *size_units : 1;

	whole = strtoull(optarg, &num_end, 0);
	end = num_end;
	if (*end == '.') {
		int digits = 0;

		/* Read the digits by hand: strtoull() would also accept
		 * white space and a sign here ("1.-5"), and counting digits
		 * in a 64-bit power of ten wraps to 0 for very long input. */
		for (end++; *end >= '0' && *end <= '9'; end++) {
			if (digits < FRAC_DIGITS_MAX) {
				frac = frac * 10 + (unsigned)(*end - '0');
				frac_d *= 10;
				digits++;
			}
		}
	}

	if (*end != '\0') {
		int shift;

		/* only a single trailing unit character is allowed */
		if (end[1] != '\0')
			return -1;

		switch (*end) {
		case 'b':
			shift = bytes_spec ? 0 : 9;
			break;
		case 'k':
		case 'K':
			shift = 10;
			break;
		case 'm':
		case 'M':
			shift = 20;
			break;
		case 'g':
		case 'G':
			shift = 30;
			break;
		case 't':
		case 'T':
			shift = 40;
			break;
		case 'p':
		case 'P':
			shift = 50;
			break;
		case 'e':
		case 'E':
			shift = 60;
			break;
		default:
			return -1;
		}

		/* the integer part must not lose bits when scaled */
		if (shift > 0 && (whole >> (64 - shift)) != 0)
			return -1;

		units = 1ULL << shift;
	}

	/* guards the caller-supplied default multiplier as well */
	if (whole > ~0ULL / units)
		return -1;
	whole *= units;

	frac_part = llapi_size_scale_frac(frac, frac_d, units);
	if (frac_part > ~0ULL - whole)
		return -1;

	*size = whole + frac_part;
	*size_units = units;

	return 0;
}
256 /* XXX: llapi_xxx() functions return negative values upon failure */
/* Validate striping parameters.  The visible checks run in this order:
 * stripe_size alignment, stripe_offset validity, stripe_count validity and
 * the stripe_size upper bound; each failure is reported via llapi_error().
 * page_size starts at LOV_MIN_STRIPE_SIZE and is raised (with a warning) when
 * getpagesize() is larger.  stripe_pattern is not referenced by any line
 * visible here. */
258 int llapi_stripe_limit_check(unsigned long long stripe_size, int stripe_offset,
259 int stripe_count, int stripe_pattern)
263 /* 64 KB is the largest common page size I'm aware of (on ia64), but
264 * check the local page size just in case. */
265 page_size = LOV_MIN_STRIPE_SIZE;
266 if (getpagesize() > page_size) {
267 page_size = getpagesize();
268 llapi_err_noerrno(LLAPI_MSG_WARN,
269 "warning: your page size (%u) is "
270 "larger than expected (%u)", page_size,
271 LOV_MIN_STRIPE_SIZE);
273 if (!llapi_stripe_size_is_aligned(stripe_size)) {
/* NOTE(review): page_size is printed with %d here but with %u in the
 * warning earlier in this function - confirm its declared type. */
275 llapi_error(LLAPI_MSG_ERROR, rc, "error: bad stripe_size %llu, "
276 "must be an even multiple of %d bytes",
277 stripe_size, page_size);
280 if (!llapi_stripe_index_is_valid(stripe_offset)) {
282 llapi_error(LLAPI_MSG_ERROR, rc, "error: bad stripe offset %d",
286 if (!llapi_stripe_count_is_valid(stripe_count)) {
288 llapi_error(LLAPI_MSG_ERROR, rc, "error: bad stripe count %d",
292 if (llapi_stripe_size_is_too_big(stripe_size)) {
/* NOTE(review): the text says "warning:" although it is logged at
 * LLAPI_MSG_ERROR level. */
294 llapi_error(LLAPI_MSG_ERROR, rc,
295 "warning: stripe size 4G or larger "
296 "is not currently supported and would wrap");
303 * Trim a trailing newline from a string, if it exists.
305 int llapi_chomp_string(char *buf)
321 * Wrapper to grab parameter settings for lov.*-clilov-*.* values
/* Fetch the LOV device uuid for path with llapi_file_get_lov_uuid(), then
 * look up parameter param under "lov" for exactly that device name
 * (FILTER_BY_EXACT) via get_lustre_param_value(). */
323 static int get_param_lov(const char *path, const char *param,
324 char *buf, size_t buf_size)
326 struct obd_uuid uuid;
329 rc = llapi_file_get_lov_uuid(path, &uuid);
333 return get_lustre_param_value("lov", uuid.uuid, FILTER_BY_EXACT, param,
338 * Wrapper to grab parameter settings for lmv.*-clilmv-*.* values
/* Fetch the LMV device uuid for path with llapi_file_get_lmv_uuid(), then
 * look up parameter param under "lmv" for exactly that device name
 * (FILTER_BY_EXACT) via get_lustre_param_value(). */
340 static int get_param_lmv(const char *path, const char *param,
341 char *buf, size_t buf_size)
343 struct obd_uuid uuid;
346 rc = llapi_file_get_lmv_uuid(path, &uuid);
350 return get_lustre_param_value("lmv", uuid.uuid, FILTER_BY_EXACT, param,
/* Return the metadata buffer size to use for path.  The llite instance name
 * is obtained with llapi_getname() and its "max_easize" parameter is read;
 * the final return yields rc when it is positive and otherwise md_size, the
 * size of a LOV_USER_MAGIC_V3 lov_user_md with LOV_MAX_STRIPE_COUNT stripes. */
354 static int get_mds_md_size(const char *path)
356 char buf[PATH_MAX], inst[PATH_MAX];
357 int md_size = lov_user_md_size(LOV_MAX_STRIPE_COUNT, LOV_USER_MAGIC_V3);
360 rc = llapi_getname(path, inst, sizeof(inst));
364 /* Get the max ea size from llite parameters. */
365 rc = get_lustre_param_value("llite", inst, FILTER_BY_EXACT,
366 "max_easize", buf, sizeof(buf));
372 return rc > 0 ? rc : md_size;
/* Read the "uuid" parameter of the LMV device backing path into buf
 * (at most bufsize bytes) and return get_param_lmv()'s result. */
375 int llapi_get_agent_uuid(char *path, char *buf, size_t bufsize)
377 return get_param_lmv(path, "uuid", buf, bufsize);
381 * if pool is NULL, search ostname in target_obd
382 * if pool is not NULL:
383 * if pool not found returns errno < 0
384 * if ostname is NULL, returns 1 if pool is not empty and 0 if pool empty
385 * if ostname is not NULL, returns 1 if OST is in pool and 0 if not
/* Search for an OST in a filesystem's target_obd list or in a pool; the
 * return-value rules are listed in the comment preceding this function.
 * The path of the file to scan is assembled in buffer, the file is opened
 * with fopen() and then read line by line with fgets() into the same buffer.
 * Matching is a prefix comparison (strncmp over len characters).
 * NOTE(review): "¶m" in the poolpath(), get_lustre_param_path() and
 * cfs_free_param_data() calls looks like a mangled "&param" - confirm
 * against the upstream file. */
387 int llapi_search_ost(char *fsname, char *poolname, char *ostname)
389 char buffer[PATH_MAX];
395 /* You need one or the other */
396 if (poolname == NULL && fsname == NULL)
400 len = strlen(ostname);
402 if (poolname == NULL && len == 0)
405 /* Search by poolname and fsname if is not NULL */
406 if (poolname != NULL) {
407 rc = poolpath(¶m, fsname, NULL);
409 snprintf(buffer, sizeof(buffer), "%s/%s",
410 param.gl_pathv[0], poolname);
412 } else if (fsname != NULL) {
413 rc = get_lustre_param_path("lov", fsname,
415 "target_obd", ¶m);
417 strncpy(buffer, param.gl_pathv[0],
423 cfs_free_param_data(¶m);
427 fd = fopen(buffer, "r");
431 while (fgets(buffer, sizeof(buffer), fd) != NULL) {
432 if (poolname == NULL) {
434 /* Search for an ostname in the list of OSTs
435 Line format is IDX: fsname-OSTxxxx_UUID STATUS */
/* the OST name starts right after the first space on the line */
436 ptr = strchr(buffer, ' ');
438 (strncmp(ptr + 1, ostname, len) == 0)) {
443 /* Search for an ostname in a pool,
444 (or an existing non-empty pool if no ostname) */
445 if ((ostname == NULL) ||
446 (strncmp(buffer, ostname, len) == 0)) {
457 * Open a Lustre file.
459 * \param name the name of the file to be opened
460 * \param flags access mode, see flags in open(2)
461 * \param mode permission of the file if it is created, see mode in open(2)
462 * \param param stripe pattern of the newly created file
464 * \retval file descriptor of opened file
465 * \retval negative errno on failure
/* Open (and, depending on flags, create) a file with an explicit striping
 * layout.  Visible steps: resolve the Lustre fsname for name, validate the
 * stripe parameters, validate the optional pool, validate the optional
 * explicit OST list, allocate a zeroed lov_user_md of the right size, open
 * the file with O_LOV_DELAY_CREATE, fill in the layout and apply it with the
 * LL_IOC_LOV_SETSTRIPE ioctl.
 * The layout magic starts as LOV_USER_MAGIC_V1, becomes LOV_USER_MAGIC_V3
 * when a pool name is given and LOV_USER_MAGIC_SPECIFIC when
 * param->lsp_is_specific is set. */
467 int llapi_file_open_param(const char *name, int flags, mode_t mode,
468 const struct llapi_stripe_param *param)
470 char fsname[MAX_OBD_NAME + 1] = { 0 };
/* NOTE(review): param is dereferenced here, before any check. */
471 char *pool_name = param->lsp_pool;
472 struct lov_user_md *lum = NULL;
473 size_t lum_size = sizeof(*lum);
476 /* Make sure we are on a Lustre file system */
477 rc = llapi_search_fsname(name, fsname);
479 llapi_error(LLAPI_MSG_ERROR, rc,
480 "'%s' is not on a Lustre filesystem",
485 /* Check if the stripe pattern is sane. */
486 rc = llapi_stripe_limit_check(param->lsp_stripe_size,
487 param->lsp_stripe_offset,
488 param->lsp_stripe_count,
489 param->lsp_stripe_pattern);
493 /* Make sure we have a good pool */
494 if (pool_name != NULL) {
495 /* in case user gives the full pool name <fsname>.<poolname>,
496 * strip the fsname */
497 char *ptr = strchr(pool_name, '.');
500 if (strcmp(pool_name, fsname) != 0) {
502 llapi_err_noerrno(LLAPI_MSG_ERROR,
503 "Pool '%s' is not on filesystem '%s'",
510 /* Make sure the pool exists and is non-empty */
511 rc = llapi_search_ost(fsname, pool_name, NULL);
513 char *err = rc == 0 ? "has no OSTs" : "does not exist";
515 llapi_err_noerrno(LLAPI_MSG_ERROR, "pool '%s.%s' %s",
516 fsname, pool_name, err);
/* a pool name needs the larger v3 layout structure */
520 lum_size = sizeof(struct lov_user_md_v3);
523 /* sanity check of target list */
524 if (param->lsp_is_specific) {
525 char ostname[MAX_OBD_NAME + 1];
529 for (i = 0; i < param->lsp_stripe_count; i++) {
530 snprintf(ostname, sizeof(ostname), "%s-OST%04x_UUID",
531 fsname, param->lsp_osts[i]);
532 rc = llapi_search_ost(fsname, pool_name, ostname);
537 llapi_error(LLAPI_MSG_ERROR, rc,
538 "%s: cannot find OST %s in %s",
545 /* Make sure stripe offset is in OST list. */
546 if (param->lsp_osts[i] == param->lsp_stripe_offset)
550 llapi_error(LLAPI_MSG_ERROR, -EINVAL,
551 "%s: stripe offset '%d' is not in the "
553 __func__, param->lsp_stripe_offset);
/* room for one lmm_objects[] entry per requested stripe */
557 lum_size = lov_user_md_size(param->lsp_stripe_count,
558 LOV_USER_MAGIC_SPECIFIC);
561 lum = calloc(1, lum_size);
566 fd = open(name, flags | O_LOV_DELAY_CREATE, mode);
568 if (errno == EISDIR && !(flags & O_DIRECTORY)) {
569 flags = O_DIRECTORY | O_RDONLY;
576 llapi_error(LLAPI_MSG_ERROR, rc, "unable to open '%s'", name);
581 /* Initialize IOCTL striping pattern structure */
582 lum->lmm_magic = LOV_USER_MAGIC_V1;
583 lum->lmm_pattern = param->lsp_stripe_pattern;
584 lum->lmm_stripe_size = param->lsp_stripe_size;
585 lum->lmm_stripe_count = param->lsp_stripe_count;
586 lum->lmm_stripe_offset = param->lsp_stripe_offset;
587 if (pool_name != NULL) {
588 struct lov_user_md_v3 *lumv3 = (void *)lum;
590 lumv3->lmm_magic = LOV_USER_MAGIC_V3;
/* NOTE(review): strncpy() does not terminate when pool_name is at least
 * LOV_MAXPOOLNAME long; presumably the field is larger and the calloc()
 * above supplies the terminator - confirm. */
591 strncpy(lumv3->lmm_pool_name, pool_name, LOV_MAXPOOLNAME);
593 if (param->lsp_is_specific) {
594 struct lov_user_md_v3 *lumv3 = (void *)lum;
597 lumv3->lmm_magic = LOV_USER_MAGIC_SPECIFIC;
598 if (pool_name == NULL) {
599 /* LOV_USER_MAGIC_SPECIFIC uses v3 format plus specified
600 * OST list, therefore if pool is not specified we have
601 * to pack a null pool name for placeholder. */
602 memset(lumv3->lmm_pool_name, 0, LOV_MAXPOOLNAME);
605 for (i = 0; i < param->lsp_stripe_count; i++)
606 lumv3->lmm_objects[i].l_ost_idx = param->lsp_osts[i];
609 if (ioctl(fd, LL_IOC_LOV_SETSTRIPE, lum) != 0) {
/* EEXIST and EALREADY keep the friendlier default text */
610 char *errmsg = "stripe already set";
613 if (errno != EEXIST && errno != EALREADY)
614 errmsg = strerror(errno);
616 llapi_err_noerrno(LLAPI_MSG_ERROR,
617 "error on ioctl %#jx for '%s' (%d): %s",
618 (uintmax_t)LL_IOC_LOV_SETSTRIPE, name, fd,
/* Convenience wrapper: packs the scalar striping arguments and pool_name
 * into a struct llapi_stripe_param and forwards to llapi_file_open_param().
 * NOTE(review): "¶m" in the return statement looks like a mangled
 * "&param" - confirm against the upstream file. */
630 int llapi_file_open_pool(const char *name, int flags, int mode,
631 unsigned long long stripe_size, int stripe_offset,
632 int stripe_count, int stripe_pattern, char *pool_name)
634 const struct llapi_stripe_param param = {
635 .lsp_stripe_size = stripe_size,
636 .lsp_stripe_count = stripe_count,
637 .lsp_stripe_pattern = stripe_pattern,
638 .lsp_stripe_offset = stripe_offset,
639 .lsp_pool = pool_name
641 return llapi_file_open_param(name, flags, mode, ¶m);
/* Same as llapi_file_open_pool() with no pool (pool_name is NULL). */
644 int llapi_file_open(const char *name, int flags, int mode,
645 unsigned long long stripe_size, int stripe_offset,
646 int stripe_count, int stripe_pattern)
648 return llapi_file_open_pool(name, flags, mode, stripe_size,
649 stripe_offset, stripe_count,
650 stripe_pattern, NULL);
/* Create name with the given striping by calling llapi_file_open_pool()
 * with O_CREAT | O_WRONLY and mode 0644. */
653 int llapi_file_create(const char *name, unsigned long long stripe_size,
654 int stripe_offset, int stripe_count, int stripe_pattern)
658 fd = llapi_file_open_pool(name, O_CREAT | O_WRONLY, 0644, stripe_size,
659 stripe_offset, stripe_count, stripe_pattern,
/* Pool-aware variant of llapi_file_create(): calls llapi_file_open_pool()
 * with O_CREAT | O_WRONLY and mode 0644. */
668 int llapi_file_create_pool(const char *name, unsigned long long stripe_size,
669 int stripe_offset, int stripe_count,
670 int stripe_pattern, char *pool_name)
674 fd = llapi_file_open_pool(name, O_CREAT | O_WRONLY, 0644, stripe_size,
675 stripe_offset, stripe_count, stripe_pattern,
/* Set the default LMV (directory) striping on directory name.  An
 * lmv_user_md is filled with LMV_USER_MAGIC, the offset, count and hash type
 * (stripe_pattern) plus the optional pool name, the directory is opened
 * read-only and LL_IOC_LMV_SET_DEFAULT_STRIPE is issued on it. */
684 int llapi_dir_set_default_lmv_stripe(const char *name, int stripe_offset,
685 int stripe_count, int stripe_pattern,
686 const char *pool_name)
688 struct lmv_user_md lum = { 0 };
692 lum.lum_magic = LMV_USER_MAGIC;
693 lum.lum_stripe_offset = stripe_offset;
694 lum.lum_stripe_count = stripe_count;
695 lum.lum_hash_type = stripe_pattern;
696 if (pool_name != NULL) {
/* the name must fit together with its terminating NUL */
697 if (strlen(pool_name) >= sizeof(lum.lum_pool_name)) {
698 llapi_err_noerrno(LLAPI_MSG_ERROR,
699 "error LL_IOC_LMV_SET_DEFAULT_STRIPE '%s'"
700 ": too large pool name: %s", name, pool_name);
703 strncpy(lum.lum_pool_name, pool_name,
704 sizeof(lum.lum_pool_name));
707 fd = open(name, O_DIRECTORY | O_RDONLY);
710 llapi_error(LLAPI_MSG_ERROR, rc, "unable to open '%s'", name);
714 rc = ioctl(fd, LL_IOC_LMV_SET_DEFAULT_STRIPE, &lum);
716 char *errmsg = "stripe already set";
718 if (errno != EEXIST && errno != EALREADY)
719 errmsg = strerror(errno);
/* NOTE(review): the message names LL_IOC_LMV_SETSTRIPE although the ioctl
 * issued above is LL_IOC_LMV_SET_DEFAULT_STRIPE. */
721 llapi_err_noerrno(LLAPI_MSG_ERROR,
722 "error on LL_IOC_LMV_SETSTRIPE '%s' (%d): %s",
729 int llapi_dir_create_pool(const char *name, int mode, int stripe_offset,
730 int stripe_count, int stripe_pattern,
731 const char *pool_name)
733 struct lmv_user_md lmu = { 0 };
734 struct obd_ioctl_data data = { 0 };
737 char *dirpath = NULL;
738 char *namepath = NULL;
744 dirpath = strdup(name);
745 namepath = strdup(name);
746 if (!dirpath || !namepath)
749 lmu.lum_magic = LMV_USER_MAGIC;
750 lmu.lum_stripe_offset = stripe_offset;
751 lmu.lum_stripe_count = stripe_count;
752 lmu.lum_hash_type = stripe_pattern;
753 if (pool_name != NULL) {
754 if (strlen(pool_name) > LOV_MAXPOOLNAME) {
755 llapi_err_noerrno(LLAPI_MSG_ERROR,
756 "error LL_IOC_LMV_SETSTRIPE '%s' : too large"
757 "pool name: %s", name, pool_name);
761 memcpy(lmu.lum_pool_name, pool_name, strlen(pool_name));
764 filename = basename(namepath);
765 dir = dirname(dirpath);
767 data.ioc_inlbuf1 = (char *)filename;
768 data.ioc_inllen1 = strlen(filename) + 1;
769 data.ioc_inlbuf2 = (char *)&lmu;
770 data.ioc_inllen2 = sizeof(struct lmv_user_md);
771 data.ioc_type = mode;
772 rc = obd_ioctl_pack(&data, &buf, sizeof(rawbuf));
774 llapi_error(LLAPI_MSG_ERROR, rc,
775 "error: LL_IOC_LMV_SETSTRIPE pack failed '%s'.",
780 fd = open(dir, O_DIRECTORY | O_RDONLY);
783 llapi_error(LLAPI_MSG_ERROR, rc, "unable to open '%s'", name);
787 if (ioctl(fd, LL_IOC_LMV_SETSTRIPE, buf)) {
788 char *errmsg = "stripe already set";
790 if (errno != EEXIST && errno != EALREADY)
791 errmsg = strerror(errno);
793 llapi_err_noerrno(LLAPI_MSG_ERROR,
794 "error on LL_IOC_LMV_SETSTRIPE '%s' (%d): %s",
804 int llapi_direntry_remove(char *dname)
806 char *dirpath = NULL;
807 char *namepath = NULL;
813 dirpath = strdup(dname);
814 namepath = strdup(dname);
815 if (!dirpath || !namepath)
818 filename = basename(namepath);
820 dir = dirname(dirpath);
822 fd = open(dir, O_DIRECTORY | O_RDONLY);
825 llapi_error(LLAPI_MSG_ERROR, rc, "unable to open '%s'",
830 if (ioctl(fd, LL_IOC_REMOVE_ENTRY, filename)) {
831 char *errmsg = strerror(errno);
832 llapi_err_noerrno(LLAPI_MSG_ERROR,
833 "error on ioctl %#jx for '%s' (%d): %s",
834 (uintmax_t)LL_IOC_LMV_SETSTRIPE, filename,
846 * Find the fsname, the full path, and/or an open fd.
847 * Either the fsname or path must not be NULL
/* Scan PROC_MOUNTS for Lustre mounts and report, according to the WANT_*
 * bits in want: the filesystem name (copied into fsname), the mount point
 * (copied into path) and/or an open directory fd on the mount point.
 * With WANT_INDEX only the index-th Lustre mount is considered.  When path
 * is NULL or empty the first acceptable mount is taken; otherwise the mount
 * whose directory is the longest prefix of path is kept. */
849 int get_root_path(int want, char *fsname, int *outfd, char *path, int index)
852 char buf[PATH_MAX], mntdir[PATH_MAX];
855 int idx = 0, len = 0, mntlen, fd;
858 /* get the mount point */
859 fp = setmntent(PROC_MOUNTS, "r");
862 llapi_error(LLAPI_MSG_ERROR, rc,
863 "setmntent(%s) failed", PROC_MOUNTS);
867 if (getmntent_r(fp, &mnt, buf, sizeof(buf)) == NULL)
870 if (!llapi_is_lustre_mnt(&mnt))
873 if ((want & WANT_INDEX) && (idx++ != index))
876 mntlen = strlen(mnt.mnt_dir);
/* the filesystem name follows the run of '/' characters in mnt_fsname */
877 ptr = strchr(mnt.mnt_fsname, '/');
878 while (ptr && *ptr == '/')
880 /* thanks to the call to llapi_is_lustre_mnt() above,
881 * we are sure that mnt.mnt_fsname contains ":/",
882 * so ptr should never be NULL */
886 while (*ptr_end != '/' && *ptr_end != '\0')
889 /* Check the fsname for a match, if given */
/* NOTE(review): only the first (ptr_end - ptr) characters are compared, so
 * an fsname that merely begins with the mounted name also compares equal;
 * confirm whether a length check is wanted. */
890 if (!(want & WANT_FSNAME) && fsname != NULL &&
891 (strlen(fsname) > 0) &&
892 (strncmp(ptr, fsname, ptr_end - ptr) != 0))
895 /* If the path isn't set return the first one we find */
896 if (path == NULL || strlen(path) == 0) {
897 strncpy(mntdir, mnt.mnt_dir, strlen(mnt.mnt_dir));
898 mntdir[strlen(mnt.mnt_dir)] = '\0';
899 if ((want & WANT_FSNAME) && fsname != NULL) {
900 strncpy(fsname, ptr, ptr_end - ptr);
901 fsname[ptr_end - ptr] = '\0';
905 /* Otherwise find the longest matching path */
/* NOTE(review): this is a plain prefix test with no check that the match
 * ends on a path-component boundary - confirm. */
906 } else if ((strlen(path) >= mntlen) && (mntlen >= len) &&
907 (strncmp(mnt.mnt_dir, path, mntlen) == 0)) {
908 strncpy(mntdir, mnt.mnt_dir, strlen(mnt.mnt_dir));
909 mntdir[strlen(mnt.mnt_dir)] = '\0';
911 if ((want & WANT_FSNAME) && fsname != NULL) {
912 strncpy(fsname, ptr, ptr_end - ptr);
913 fsname[ptr_end - ptr] = '\0';
922 if ((want & WANT_PATH) && path != NULL) {
923 strncpy(path, mntdir, strlen(mntdir));
924 path[strlen(mntdir)] = '\0';
926 if (want & WANT_FD) {
927 fd = open(mntdir, O_RDONLY | O_DIRECTORY | O_NONBLOCK);
930 llapi_error(LLAPI_MSG_ERROR, rc,
931 "error opening '%s'", mntdir);
937 } else if (want & WANT_ERROR)
938 llapi_err_noerrno(LLAPI_MSG_ERROR,
939 "can't find fs root for '%s': %d",
940 (want & WANT_PATH) ? fsname : path, rc);
945 * search lustre mounts
947 * Calling this function will return to the user the mount point, mntdir, and
948 * the file system name, fsname, if the user passed a buffer to this routine.
950 * The user inputs are pathname and index. If the pathname is supplied then
951 * the value of the index will be ignored. The pathname will return data if
952 * the pathname is located on a lustre mount. Index is used to pick which
953 * mount point you want in the case of multiple mounted lustre file systems.
954 * See function lfs_osts in lfs.c for an example of the index use.
/* Front end to get_root_path().  The request starts as WANT_PATH with
 * idx = -1; the branch on an empty or NULL pathname and the strcpy() of
 * pathname into mntdir prepare the arguments for the final call.
 * NOTE(review): the strcpy() is unbounded, so mntdir must be large enough
 * to hold pathname. */
956 int llapi_search_mounts(const char *pathname, int index, char *mntdir,
959 int want = WANT_PATH, idx = -1;
961 if (!pathname || pathname[0] == '\0') {
965 strcpy(mntdir, pathname);
969 return get_root_path(want, fsname, NULL, mntdir, idx);
972 /* Given a path, find the corresponding Lustre fsname */
/* pathname is canonicalised with realpath().  The fallback code builds an
 * absolute name in buf (getcwd() + "/" + pathname for relative input) and
 * retries realpath(), also on the name cut at its last '/'.  The resolved
 * path is then handed to get_root_path() with WANT_FSNAME | WANT_ERROR. */
973 int llapi_search_fsname(const char *pathname, char *fsname)
978 path = realpath(pathname, NULL);
980 char buf[PATH_MAX], *ptr;
983 if (pathname[0] != '/') {
984 /* Need an absolute path, but realpath() only works for
985 * pathnames that actually exist. We go through the
986 * extra hurdle of dirname(getcwd() + pathname) in
987 * case the relative pathname contains ".." in it. */
/* two bytes are held back for the "/" appended next */
988 if (getcwd(buf, sizeof(buf) - 2) == NULL)
990 rc = strlcat(buf, "/", sizeof(buf));
991 if (rc >= sizeof(buf))
994 rc = strlcat(buf, pathname, sizeof(buf));
995 if (rc >= sizeof(buf))
997 path = realpath(buf, NULL);
999 ptr = strrchr(buf, '/');
1003 path = realpath(buf, NULL);
1006 llapi_error(LLAPI_MSG_ERROR, rc,
1007 "pathname '%s' cannot expand",
1013 rc = get_root_path(WANT_FSNAME | WANT_ERROR, fsname, NULL, path, -1);
/* Ask get_root_path() for the mount point (WANT_PATH) matching fsname; the
 * result is written into pathname. */
1018 int llapi_search_rootpath(char *pathname, const char *fsname)
1020 return get_root_path(WANT_PATH, (char *)fsname, NULL, pathname, -1);
1023 int llapi_getname(const char *path, char *buf, size_t size)
1025 struct obd_uuid uuid_buf;
1026 char *uuid = uuid_buf.uuid;
1029 memset(&uuid_buf, 0, sizeof(uuid_buf));
1030 rc = llapi_file_get_lov_uuid(path, &uuid_buf);
1034 /* We want to turn lustre-clilov-ffff88002738bc00 into
1035 * lustre-ffff88002738bc00. */
1037 nr = snprintf(buf, size, "%.*s-%s",
1038 (int) (strlen(uuid) - 24), uuid,
1039 uuid + strlen(uuid) - 16);
1048 * Get the list of pool members.
1049 * \param poolname string of format \<fsname\>.\<poolname\>
1050 * \param members caller-allocated array of char*
1051 * \param list_size size of the members array
1052 * \param buffer caller-allocated buffer for storing OST names
1053 * \param buffer_size size of the buffer
1055 * \return number of members retrieved for this pool
1056 * \retval -error failure
/* poolname ("FSNAME.POOLNAME") is copied into fsname and searched for the
 * '.' that separates the pool part.  The pool's parameter file is located
 * with poolpath() and read line by line: each line, with its newline located
 * via strchr(), is copied into buffer at offset used, its address is stored
 * in members[] and used advances by the string length plus one.  The loop
 * checks nb_entries against list_size and the remaining space against
 * buffer_size before storing. */
1058 int llapi_get_poolmembers(const char *poolname, char **members,
1059 int list_size, char *buffer, int buffer_size)
1061 char fsname[PATH_MAX];
1070 /* name is FSNAME.POOLNAME */
1071 if (strlen(poolname) >= sizeof(fsname))
1073 strlcpy(fsname, poolname, sizeof(fsname));
1074 pool = strchr(fsname, '.');
1081 rc = poolpath(&pathname, fsname, NULL);
1083 llapi_error(LLAPI_MSG_ERROR, rc,
1084 "Lustre filesystem '%s' not found",
1089 llapi_printf(LLAPI_MSG_NORMAL, "Pool: %s.%s\n", fsname, pool);
1090 rc = snprintf(buf, sizeof(buf), "%s/%s", pathname.gl_pathv[0], pool);
1091 cfs_free_param_data(&pathname);
/* snprintf() returns the untruncated length, so this detects truncation */
1092 if (rc >= sizeof(buf))
1094 fd = fopen(buf, "r");
1097 llapi_error(LLAPI_MSG_ERROR, rc, "cannot open %s", buf);
1102 while (fgets(buf, sizeof(buf), fd) != NULL) {
1103 if (nb_entries >= list_size) {
1107 buf[sizeof(buf) - 1] = '\0';
1109 tmp = strchr(buf, '\n');
1112 if (used + strlen(buf) + 1 > buffer_size) {
1117 strcpy(buffer + used, buf);
1118 members[nb_entries] = buffer + used;
1119 used += strlen(buf) + 1;
1129 * Get the list of pools in a filesystem.
1130 * \param name filesystem name or path
1131 * \param poollist caller-allocated array of char*
1132 * \param list_size size of the poollist array
1133 * \param buffer caller-allocated buffer for storing pool names
1134 * \param buffer_size size of the buffer
1136 * \return number of pools retrieved for this filesystem
1137 * \retval -error failure
/* name is treated as a pathname when it contains a '/', otherwise as a
 * filesystem name.  A pathname is canonicalised with realpath() into rname
 * before poolpath() is called.  The pool directory (pathname.gl_pathv[0]) is
 * then read with readdir_r(); every entry except "." and ".." is written to
 * buffer as "<fsname>.<pool>" and its address recorded in poollist[].
 * The final return yields rc when it is non-zero, otherwise nb_entries. */
1139 int llapi_get_poollist(const char *name, char **poollist, int list_size,
1140 char *buffer, int buffer_size)
1142 char rname[PATH_MAX];
1148 struct dirent *cookie = NULL;
1150 unsigned int nb_entries = 0;
1151 unsigned int used = 0;
1154 /* initialize output array */
1155 for (i = 0; i < list_size; i++)
1158 /* is name a pathname ? */
1159 ptr = strchr(name, '/');
1161 /* only absolute pathname is supported */
1165 if (!realpath(name, rname)) {
1167 llapi_error(LLAPI_MSG_ERROR, rc, "invalid path '%s'",
1172 fsname = strdup(rname);
1176 rc = poolpath(&pathname, NULL, rname);
1178 /* name is FSNAME */
1179 fsname = strdup(name);
1182 rc = poolpath(&pathname, fsname, NULL);
1185 llapi_error(LLAPI_MSG_ERROR, rc,
1186 "Lustre filesystem '%s' not found", name);
1190 llapi_printf(LLAPI_MSG_NORMAL, "Pools from %s:\n", fsname);
1191 dir = opendir(pathname.gl_pathv[0]);
1194 llapi_error(LLAPI_MSG_ERROR, rc,
1195 "Could not open pool list for '%s'",
1201 rc = readdir_r(dir, &pool, &cookie);
1204 llapi_error(LLAPI_MSG_ERROR, rc,
1205 "Error reading pool list for '%s'", name);
1207 } else if ((rc == 0) && (cookie == NULL)) {
1208 /* end of directory */
1212 /* ignore . and .. */
1213 if (!strcmp(pool.d_name, ".") || !strcmp(pool.d_name, ".."))
1216 /* check output bounds */
1217 if (nb_entries >= list_size) {
1222 /* +2 for '.' and final '\0' */
1223 if (used + strlen(pool.d_name) + strlen(fsname) + 2
/* space for this entry was checked by the comparison above */
1229 sprintf(buffer + used, "%s.%s", fsname, pool.d_name);
1230 poollist[nb_entries] = buffer + used;
1231 used += strlen(pool.d_name) + strlen(fsname) + 2;
1238 cfs_free_param_data(&pathname);
1241 return rc != 0 ? rc : nb_entries;
/* Print either the pools of a filesystem or the members of one pool.
 * A name that does not start with '/' is duplicated and searched for a '.'
 * (the pool separator), and the parameter lookup switches to
 * FILTER_BY_FS_NAME.  The "numobd" value of the LOV device sizes a single
 * allocation that holds obdcount obd_uuid-sized slots followed by obdcount
 * string pointers (list points just past the slots).  Depending on the form
 * of name, llapi_get_poollist() or llapi_get_poolmembers() fills the list,
 * a result of -EOVERFLOW jumps back to retry_get_pools, and each returned
 * entry is printed with llapi_printf(). */
1244 /* wrapper for lfs.c and obd.c */
1245 int llapi_poollist(const char *name)
1247 /* list of pool names (assume that pool count is smaller
1249 char **list, *buffer = NULL, *fsname = (char *)name;
1250 char *poolname = NULL, *tmp = NULL, data[16];
1251 enum param_filter type = FILTER_BY_PATH;
1252 int obdcount, bufsize, rc, nb, i;
1257 if (name[0] != '/') {
1258 fsname = strdup(name);
1262 poolname = strchr(fsname, '.');
1265 type = FILTER_BY_FS_NAME;
1268 rc = get_lustre_param_value("lov", fsname, type, "numobd",
1269 data, sizeof(data));
1272 obdcount = atoi(data);
1274 /* Allocate space for each fsname-OST0000_UUID, 1 per OST,
1275 * and also an array to store the pointers for all that
1276 * allocated space. */
1278 bufsize = sizeof(struct obd_uuid) * obdcount;
1279 buffer = realloc(tmp, bufsize + sizeof(*list) * obdcount);
1280 if (buffer == NULL) {
1284 list = (char **) (buffer + bufsize);
1287 /* name is a path or fsname */
1288 nb = llapi_get_poollist(name, list, obdcount,
1291 /* name is a pool name (<fsname>.<poolname>) */
1292 nb = llapi_get_poolmembers(name, list, obdcount,
1296 if (nb == -EOVERFLOW) {
1299 goto retry_get_pools;
1302 for (i = 0; i < nb; i++)
1303 llapi_printf(LLAPI_MSG_NORMAL, "%s\n", list[i]);
1304 rc = (nb < 0 ? nb : 0);
1308 if (fsname != NULL && type == FILTER_BY_FS_NAME)
/* Callback type used by llapi_semantic_traverse() for its sem_init and
 * sem_fini hooks. */
1313 typedef int (semantic_func_t)(char *path, DIR *parent, DIR **d,
1314 void *data, struct dirent64 *de);
/* Sentinel stored in fp_obd_index and fp_mdt_index by common_param_init(). */
1316 #define OBD_NOT_FOUND (-1)
/* Prepare a find_param for a traversal rooted at path.
 * fp_lum_size is get_mds_md_size(path), raised to at least PATH_MAX + 1, and
 * fp_lmd is a zeroed buffer of sizeof(lstat_t) + fp_lum_size bytes.
 * fp_lmv_md is a zeroed LMV_MAGIC_V1-sized buffer for an initial 256 stripes.
 * The OBD lookup state is reset; fp_mdt_index is reset only when fp_migrate
 * is not set. */
1318 static int common_param_init(struct find_param *param, char *path)
1320 int lum_size = get_mds_md_size(path);
1322 if (lum_size < PATH_MAX + 1)
1323 lum_size = PATH_MAX + 1;
1325 param->fp_lum_size = lum_size;
1326 param->fp_lmd = calloc(1, sizeof(lstat_t) + param->fp_lum_size);
1327 if (param->fp_lmd == NULL) {
1328 llapi_error(LLAPI_MSG_ERROR, -ENOMEM,
1329 "error: allocation of %zu bytes for ioctl",
1330 sizeof(lstat_t) + param->fp_lum_size);
1334 param->fp_lmv_stripe_count = 256;
1335 param->fp_lmv_md = calloc(1,
1336 lmv_user_md_size(param->fp_lmv_stripe_count,
1338 if (param->fp_lmv_md == NULL) {
1339 llapi_error(LLAPI_MSG_ERROR, -ENOMEM,
1340 "error: allocation of %d bytes for ioctl",
1341 lmv_user_md_size(param->fp_lmv_stripe_count,
1346 param->fp_got_uuids = 0;
1347 param->fp_obd_indexes = NULL;
1348 param->fp_obd_index = OBD_NOT_FOUND;
1349 if (!param->fp_migrate)
1350 param->fp_mdt_index = OBD_NOT_FOUND;
/* Release the buffers owned by param: fp_obd_indexes, fp_lmd and
 * fp_lmv_md. */
1354 static void find_param_fini(struct find_param *param)
1356 if (param->fp_obd_indexes)
1357 free(param->fp_obd_indexes);
1360 free(param->fp_lmd);
1362 if (param->fp_lmv_md)
1363 free(param->fp_lmv_md);
/* Callback with the semantic_func_t parameter list; data is interpreted as
 * the traversal's struct find_param. */
1366 static int cb_common_fini(char *path, DIR *parent, DIR **dirp, void *data,
1367 struct dirent64 *de)
1369 struct find_param *param = data;
1375 /* set errno upon failure */
/* Open the directory that contains path.  dirname() is applied to a
 * strdup()'d copy of path, so the caller's string is not modified. */
1376 static DIR *opendir_parent(const char *path)
1382 path_copy = strdup(path);
1383 if (path_copy == NULL)
1386 parent_path = dirname(path_copy);
1387 parent = opendir(parent_path);
/* Fetch the LMV striping of directory d into param->fp_lmv_md with
 * LL_IOC_LMV_GETSTRIPE.  The request is primed with the buffer's current
 * stripe capacity and with LMV_USER_MAGIC when fp_get_default_lmv is set,
 * LMV_MAGIC_V1 otherwise.  When the ioctl fails with E2BIG, the stripe count
 * written back into the buffer is used to free and re-allocate fp_lmv_md
 * with the larger size. */
1393 static int cb_get_dirstripe(char *path, DIR *d, struct find_param *param)
1398 param->fp_lmv_md->lum_stripe_count = param->fp_lmv_stripe_count;
1399 if (param->fp_get_default_lmv)
1400 param->fp_lmv_md->lum_magic = LMV_USER_MAGIC;
1402 param->fp_lmv_md->lum_magic = LMV_MAGIC_V1;
1404 ret = ioctl(dirfd(d), LL_IOC_LMV_GETSTRIPE, param->fp_lmv_md);
1405 if (errno == E2BIG && ret != 0) {
1409 stripe_count = (__u32)param->fp_lmv_md->lum_stripe_count;
1410 if (stripe_count <= param->fp_lmv_stripe_count)
1413 free(param->fp_lmv_md);
1414 param->fp_lmv_stripe_count = stripe_count;
1415 lmv_size = lmv_user_md_size(stripe_count, LMV_MAGIC_V1);
1416 param->fp_lmv_md = malloc(lmv_size);
1417 if (param->fp_lmv_md == NULL) {
1418 llapi_error(LLAPI_MSG_ERROR, -ENOMEM,
1419 "error: allocation of %d bytes for ioctl",
1420 lmv_user_md_size(param->fp_lmv_stripe_count,
/* Fill lmd with the stat and layout information of path.
 * With an open dir the LL_IOC_MDC_GETINFO ioctl is issued on it; otherwise,
 * with an open parent, the last path component is copied into lmd and
 * IOC_MDC_GETFILEINFO is issued on the parent.  The errno handling that
 * follows covers ENOTTY (falls back to lstat_f()), ENOENT (warning) and
 * other values except EISDIR (error). */
1429 static int get_lmd_info(char *path, DIR *parent, DIR *dir,
1430 struct lov_user_mds_data *lmd, int lumlen)
1432 lstat_t *st = &lmd->lmd_st;
1435 if (parent == NULL && dir == NULL)
1439 ret = ioctl(dirfd(dir), LL_IOC_MDC_GETINFO, (void *)lmd);
1440 } else if (parent) {
1441 char *fname = strrchr(path, '/');
1443 /* To avoid opening, locking, and closing each file on the
1444 * client if that is not needed. The GETFILEINFO ioctl can
1445 * be done on the parent dir with a single open for all
1446 * files in that directory, and it also doesn't pollute the
1447 * client dcache with millions of dentries when traversing
1448 * a large filesystem. */
1449 fname = (fname == NULL ? path : fname + 1);
1450 /* retrieve needed file info */
/* the ioctl takes the file name in the same buffer it fills in */
1451 strlcpy((char *)lmd, fname, lumlen);
1452 ret = ioctl(dirfd(parent), IOC_MDC_GETFILEINFO, (void *)lmd);
1456 if (errno == ENOTTY) {
1457 /* ioctl is not supported, it is not a lustre fs.
1458 * Do the regular lstat(2) instead. */
1459 ret = lstat_f(path, st);
1462 llapi_error(LLAPI_MSG_ERROR, ret,
1463 "error: %s: lstat failed for %s",
1466 } else if (errno == ENOENT) {
1468 llapi_error(LLAPI_MSG_WARN, ret,
1469 "warning: %s: %s does not exist",
1471 } else if (errno != EISDIR) {
1473 llapi_error(LLAPI_MSG_ERROR, ret,
1474 "%s ioctl failed for %s.",
1475 dir ? "LL_IOC_MDC_GETINFO" :
1476 "IOC_MDC_GETFILEINFO", path);
1479 llapi_error(LLAPI_MSG_ERROR, ret,
1480 "error: %s: IOC_MDC_GETFILEINFO failed for %s",
/* Recursive directory walk that invokes sem_init and sem_fini around each
 * visited entry.  path is a caller-owned buffer of size bytes that is
 * extended in place with each entry name.  "." and ".." are skipped, as is
 * the entry named dot_lustre_name.  Entries of type DT_UNKNOWN are resolved
 * through get_lmd_info().  One switch case recurses into this function and
 * another calls sem_init (and sem_fini when sem_init returned 0) directly.
 * NOTE(review): "¶m" in the lstat_t initialiser looks like a mangled
 * "&param" - confirm against the upstream file. */
1487 static int llapi_semantic_traverse(char *path, int size, DIR *parent,
1488 semantic_func_t sem_init,
1489 semantic_func_t sem_fini, void *data,
1490 struct dirent64 *de)
1492 struct find_param *param = (struct find_param *)data;
1493 struct dirent64 *dent;
1501 if (!d && errno != ENOTDIR) {
1503 llapi_error(LLAPI_MSG_ERROR, ret, "%s: Failed to open '%s'",
1506 } else if (!d && !parent) {
1507 /* ENOTDIR. Open the parent dir. */
1508 p = opendir_parent(path);
1515 if (sem_init && (ret = sem_init(path, parent ?: p, &d, data, de)))
1521 while ((dent = readdir64(d)) != NULL) {
1524 if (!strcmp(dent->d_name, ".") || !strcmp(dent->d_name, ".."))
1527 /* Don't traverse .lustre directory */
1528 if (!(strcmp(dent->d_name, dot_lustre_name)))
/* NOTE(review): the space check uses d_reclen (the dirent record length)
 * rather than strlen(d_name); presumably a deliberate over-estimate. */
1532 if ((len + dent->d_reclen + 2) > size) {
1533 llapi_err_noerrno(LLAPI_MSG_ERROR,
1534 "error: %s: string buffer is too small",
1539 strcat(path, dent->d_name);
1541 if (dent->d_type == DT_UNKNOWN) {
1542 lstat_t *st = ¶m->fp_lmd->lmd_st;
1544 rc = get_lmd_info(path, d, NULL, param->fp_lmd,
1545 param->fp_lum_size);
1547 dent->d_type = IFTODT(st->st_mode);
1554 switch (dent->d_type) {
1556 llapi_err_noerrno(LLAPI_MSG_ERROR,
1557 "error: %s: '%s' is UNKNOWN type %d",
1558 __func__, dent->d_name, dent->d_type);
1561 rc = llapi_semantic_traverse(path, size, d, sem_init,
1562 sem_fini, data, dent);
/* only the first failure is kept in ret */
1563 if (rc != 0 && ret == 0)
1569 rc = sem_init(path, d, NULL, data, dent);
1570 if (rc < 0 && ret == 0)
1573 if (sem_fini && rc == 0)
1574 sem_fini(path, d, NULL, data, dent);
1582 sem_fini(path, parent, &d, data, de);
1591 static int param_callback(char *path, semantic_func_t sem_init,
1592 semantic_func_t sem_fini, struct find_param *param)
1594 int ret, len = strlen(path);
1597 if (len > PATH_MAX) {
1599 llapi_error(LLAPI_MSG_ERROR, ret,
1600 "Path name '%s' is too long", path);
1604 buf = (char *)malloc(PATH_MAX + 1);
1608 strlcpy(buf, path, PATH_MAX + 1);
1609 ret = common_param_init(param, buf);
1613 param->fp_depth = 0;
1615 ret = llapi_semantic_traverse(buf, PATH_MAX + 1, NULL, sem_init,
1616 sem_fini, param, NULL);
1618 find_param_fini(param);
1620 return ret < 0 ? ret : 0;
1623 int llapi_file_fget_lov_uuid(int fd, struct obd_uuid *lov_name)
1625 int rc = ioctl(fd, OBD_IOC_GETNAME, lov_name);
1628 llapi_error(LLAPI_MSG_ERROR, rc, "error: can't get lov name.");
1633 int llapi_file_fget_lmv_uuid(int fd, struct obd_uuid *lov_name)
1635 int rc = ioctl(fd, OBD_IOC_GETMDNAME, lov_name);
1638 llapi_error(LLAPI_MSG_ERROR, rc, "error: can't get lmv name.");
1643 int llapi_file_get_lov_uuid(const char *path, struct obd_uuid *lov_uuid)
1647 fd = open(path, O_RDONLY | O_NONBLOCK);
1650 llapi_error(LLAPI_MSG_ERROR, rc, "error opening %s", path);
1654 rc = llapi_file_fget_lov_uuid(fd, lov_uuid);
1660 int llapi_file_get_lmv_uuid(const char *path, struct obd_uuid *lov_uuid)
1664 fd = open(path, O_RDONLY | O_NONBLOCK);
1667 llapi_error(LLAPI_MSG_ERROR, rc, "error opening %s", path);
1671 rc = llapi_file_fget_lmv_uuid(fd, lov_uuid);
1683 * If uuidp is NULL, return the number of available obd uuids.
1684 * If uuidp is non-NULL, then it will return the uuids of the obds. If
1685 * there are more OSTs than allocated to uuidp, then an error is returned with
1686 * the ost_count set to number of available obd uuids.
1688 static int llapi_get_target_uuids(int fd, struct obd_uuid *uuidp,
1689 int *ost_count, enum tgt_type type)
1691 char buf[PATH_MAX], format[32];
1692 int rc = 0, index = 0;
1693 struct obd_uuid name;
1697 /* Get the lov name */
1698 if (type == LOV_TYPE)
1699 rc = llapi_file_fget_lov_uuid(fd, &name);
1701 rc = llapi_file_fget_lmv_uuid(fd, &name);
1705 /* Now get the ost uuids */
1706 rc = get_lustre_param_path(type == LOV_TYPE ? "lov" : "lmv", name.uuid,
1707 FILTER_BY_EXACT, "target_obd", ¶m);
1711 fp = fopen(param.gl_pathv[0], "r");
1714 llapi_error(LLAPI_MSG_ERROR, rc, "error: opening '%s'",
1719 snprintf(format, sizeof(format),
1720 "%%d: %%%zus", sizeof(uuidp[0].uuid) - 1);
1721 while (fgets(buf, sizeof(buf), fp) != NULL) {
1722 if (uuidp && (index < *ost_count)) {
1723 if (sscanf(buf, format, &index, uuidp[index].uuid) < 2)
1731 if (uuidp && (index > *ost_count))
1736 cfs_free_param_data(¶m);
1740 int llapi_lov_get_uuids(int fd, struct obd_uuid *uuidp, int *ost_count)
1742 return llapi_get_target_uuids(fd, uuidp, ost_count, LOV_TYPE);
1745 int llapi_get_obd_count(char *mnt, int *count, int is_mdt)
1750 root = open(mnt, O_RDONLY | O_DIRECTORY);
1753 llapi_error(LLAPI_MSG_ERROR, rc, "open %s failed", mnt);
1758 rc = ioctl(root, LL_IOC_GETOBDCOUNT, count);
/* Check if user specified value matches a real uuid.  Ignore _UUID,
 * -osc-4ba41334, other trailing gunk in comparison.
 * @param real_uuid ends in "_UUID"
 * @param search_uuid may or may not end in "_UUID"
 *
 * A trailing "_UUID" is stripped from either string only when the string
 * is longer than the suffix itself.
 *
 * @return 1 if the remaining prefixes are equal, 0 otherwise.
 */
int llapi_uuid_match(char *real_uuid, char *search_uuid)
{
	static const char suffix[] = "_UUID";
	const size_t suffix_len = sizeof(suffix) - 1;
	size_t cmplen = strlen(real_uuid);
	size_t searchlen = strlen(search_uuid);

	if (cmplen > suffix_len &&
	    strcmp(real_uuid + cmplen - suffix_len, suffix) == 0)
		cmplen -= suffix_len;
	if (searchlen > suffix_len &&
	    strcmp(search_uuid + searchlen - suffix_len, suffix) == 0)
		searchlen -= suffix_len;

	/* The UUIDs may legitimately be different lengths, if
	 * the system was upgraded from an older version. */
	if (cmplen != searchlen)
		return 0;

	return (strncmp(search_uuid, real_uuid, cmplen) == 0);
}
/*
 * Look up (or list) the targets of the lov/lmv behind @fd.
 *
 * Visible behaviour:
 *  - the lmv name is fetched when param->fp_get_lmv is set, the lov name
 *    otherwise; an error is logged unless the result is -ENOTTY;
 *  - the matching "target_obd" parameter file is located and opened;
 *  - when no fp_obd_uuid was requested (and output is not quiet and the
 *    list has not been printed yet) a "MDTS:" / "OBDS:" heading is printed;
 *  - every line is parsed as "<index>: <uuid>"; with fp_obd_uuid set, the
 *    uuid is compared through llapi_uuid_match() and the index of the
 *    match is stored in fp_obd_index, otherwise the raw line is printed;
 *  - fp_obds_printed is set afterwards, and an "unknown obduuid" error is
 *    reported when a requested uuid was not found.
 *
 * NOTE(review): this copy of the function is incomplete - local
 * declarations, braces, return statements and labels are missing and
 * "&param_data" shows up as a mis-encoded character.  @dname is not
 * referenced by any visible line.
 */
1789 /* Here, param->fp_obd_uuid points to a single obduuid, the index of which is
1790 * returned in param->fp_obd_index */
1791 static int setup_obd_uuid(int fd, char *dname, struct find_param *param)
1793 struct obd_uuid obd_uuid;
1800 if (param->fp_got_uuids)
1803 /* Get the lov/lmv name */
1804 if (param->fp_get_lmv)
1805 rc = llapi_file_fget_lmv_uuid(fd, &obd_uuid);
1807 rc = llapi_file_fget_lov_uuid(fd, &obd_uuid);
1809 if (rc != -ENOTTY) {
1810 llapi_error(LLAPI_MSG_ERROR, rc,
1811 "error: can't get %s name: %s",
1812 param->fp_get_lmv ? "lmv" : "lov",
1820 param->fp_got_uuids = 1;
1822 /* Now get the ost uuids */
1823 rc = get_lustre_param_path(param->fp_get_lmv ? "lmv" : "lov",
1824 obd_uuid.uuid, FILTER_BY_EXACT,
1825 "target_obd", ¶m_data);
1829 fp = fopen(param_data.gl_pathv[0], "r");
1832 llapi_error(LLAPI_MSG_ERROR, rc, "error: opening '%s'",
1833 param_data.gl_pathv[0]);
1837 if (!param->fp_obd_uuid && !param->fp_quiet && !param->fp_obds_printed)
1838 llapi_printf(LLAPI_MSG_NORMAL, "%s:\n",
1839 param->fp_get_lmv ? "MDTS" : "OBDS");
1841 snprintf(format, sizeof(format),
1842 "%%d: %%%zus", sizeof(obd_uuid.uuid) - 1);
1843 while (fgets(buf, sizeof(buf), fp) != NULL) {
1846 if (sscanf(buf, format, &index, obd_uuid.uuid) < 2)
1849 if (param->fp_obd_uuid) {
1850 if (llapi_uuid_match(obd_uuid.uuid,
1851 param->fp_obd_uuid->uuid)) {
1852 param->fp_obd_index = index;
1855 } else if (!param->fp_quiet && !param->fp_obds_printed) {
1856 /* Print everything */
1857 llapi_printf(LLAPI_MSG_NORMAL, "%s", buf);
1860 param->fp_obds_printed = 1;
1864 if (param->fp_obd_uuid && (param->fp_obd_index == OBD_NOT_FOUND)) {
1865 llapi_err_noerrno(LLAPI_MSG_ERROR,
1866 "error: %s: unknown obduuid: %s",
1867 __func__, param->fp_obd_uuid->uuid);
1871 cfs_free_param_data(¶m_data);
1875 /* In this case, param->fp_obd_uuid will be an array of obduuids and
1876 * obd index for all these obduuids will be returned in
1877 * param->fp_obd_indexes */
1878 static int setup_indexes(DIR *dir, char *path, struct obd_uuid *obduuids,
1879 int num_obds, int **obdindexes, int *obdindex,
1882 int ret, obdcount, obd_valid = 0, obdnum;
1884 struct obd_uuid *uuids = NULL;
1888 if (type == LOV_TYPE)
1889 ret = get_param_lov(path, "numobd", buf, sizeof(buf));
1891 ret = get_param_lmv(path, "numobd", buf, sizeof(buf));
1895 obdcount = atoi(buf);
1896 uuids = malloc(obdcount * sizeof(struct obd_uuid));
1901 ret = llapi_get_target_uuids(dirfd(dir), uuids, &obdcount, type);
1903 if (ret == -EOVERFLOW) {
1904 struct obd_uuid *uuids_temp;
1906 uuids_temp = realloc(uuids, obdcount *
1907 sizeof(struct obd_uuid));
1908 if (uuids_temp != NULL) {
1910 goto retry_get_uuids;
1915 llapi_error(LLAPI_MSG_ERROR, ret, "get ost uuid failed");
1919 indexes = malloc(num_obds * sizeof(*obdindex));
1920 if (indexes == NULL) {
1925 for (obdnum = 0; obdnum < num_obds; obdnum++) {
1928 /* The user may have specified a simple index */
1929 i = strtol(obduuids[obdnum].uuid, &end, 0);
1930 if (end && *end == '\0' && i < obdcount) {
1931 indexes[obdnum] = i;
1934 for (i = 0; i < obdcount; i++) {
1935 if (llapi_uuid_match(uuids[i].uuid,
1936 obduuids[obdnum].uuid)) {
1937 indexes[obdnum] = i;
1943 if (i >= obdcount) {
1944 indexes[obdnum] = OBD_NOT_FOUND;
1945 llapi_err_noerrno(LLAPI_MSG_ERROR,
1946 "error: %s: unknown obduuid: %s",
1947 __func__, obduuids[obdnum].uuid);
1953 *obdindex = OBD_NOT_FOUND;
1955 *obdindex = obd_valid;
1957 *obdindexes = indexes;
1965 static int setup_target_indexes(DIR *dir, char *path, struct find_param *param)
1969 if (param->fp_mdt_uuid) {
1970 ret = setup_indexes(dir, path, param->fp_mdt_uuid,
1972 ¶m->fp_mdt_indexes,
1973 ¶m->fp_mdt_index, LMV_TYPE);
1978 if (param->fp_obd_uuid) {
1979 ret = setup_indexes(dir, path, param->fp_obd_uuid,
1981 ¶m->fp_obd_indexes,
1982 ¶m->fp_obd_index, LOV_TYPE);
1987 param->fp_got_uuids = 1;
1992 int llapi_ostlist(char *path, struct find_param *param)
1997 fd = open(path, O_RDONLY | O_DIRECTORY);
2001 ret = setup_obd_uuid(fd, path, param);
2008 * Tries to determine the default stripe attributes for a given filesystem. The
2009 * filesystem to check should be specified by fsname, or will be determined
2012 static int sattr_get_defaults(const char *const fsname,
2013 unsigned int *scount,
2014 unsigned int *ssize,
2015 unsigned int *soffset)
2021 rc = get_lustre_param_value("lov", fsname, FILTER_BY_FS_NAME,
2022 "stripecount", val, sizeof(val));
2025 *scount = atoi(val);
2029 rc = get_lustre_param_value("lov", fsname, FILTER_BY_FS_NAME,
2030 "stripesize", val, sizeof(val));
2037 rc = get_lustre_param_value("lov", fsname, FILTER_BY_FS_NAME,
2038 "stripeoffset", val, sizeof(val));
2041 *soffset = atoi(val);
2048 * Tries to gather the default stripe attributes for a given filesystem. If
2049 * the attributes can be determined, they are cached for easy retreival the
2050 * next time they are needed. Only a single filesystem's attributes are
2053 static int sattr_cache_get_defaults(const char *const fsname,
2054 const char *const pathname,
2055 unsigned int *scount,
2056 unsigned int *ssize,
2057 unsigned int *soffset)
2060 char fsname[PATH_MAX + 1];
2061 unsigned int stripecount;
2062 unsigned int stripesize;
2063 unsigned int stripeoffset;
2069 char fsname_buf[PATH_MAX + 1];
2070 unsigned int tmp[3];
2072 if (fsname == NULL) {
2073 rc = llapi_search_fsname(pathname, fsname_buf);
2077 strlcpy(fsname_buf, fsname, sizeof(fsname_buf));
2080 if (strncmp(fsname_buf, cache.fsname, sizeof(fsname_buf) - 1) != 0) {
2082 * Ensure all 3 sattrs (count, size, and offset) are
2083 * successfully retrieved and stored in tmp before writing to
2086 rc = sattr_get_defaults(fsname_buf, &tmp[0], &tmp[1], &tmp[2]);
2090 cache.stripecount = tmp[0];
2091 cache.stripesize = tmp[1];
2092 cache.stripeoffset = tmp[2];
2093 strlcpy(cache.fsname, fsname_buf, sizeof(cache.fsname));
2097 *scount = cache.stripecount;
2099 *ssize = cache.stripesize;
2101 *soffset = cache.stripeoffset;
/*
 * Print the header fields of a lov layout, selected by the @verbose bitmask.
 *
 * Visible behaviour:
 *  - field labels are prefixed with "lmm_" for files and with nothing for
 *    directories;
 *  - for a directory whose lmm_oi sequence is FID_SEQ_LOV_DEFAULT the
 *    sequence in @lum is reset to 0 (the caller's buffer is modified) and
 *    "(Default) " is printed under VERBOSE_DETAIL;
 *  - @path is printed first when @depth and @path are set, unless this is a
 *    directory and @verbose is exactly VERBOSE_OBJID;
 *  - VERBOSE_DETAIL prints magic, sequence and object id (files only),
 *    VERBOSE_DETAIL | VERBOSE_DFID the fid (files only), then
 *    VERBOSE_COUNT, VERBOSE_SIZE, VERBOSE_LAYOUT, VERBOSE_GENERATION,
 *    VERBOSE_OFFSET and VERBOSE_POOL print their field; a label is only
 *    printed when other bits are set in @verbose as well;
 *  - with !@raw, a zero stripe count (and, for directories, a zero stripe
 *    size) is replaced by the file system default obtained from
 *    sattr_cache_get_defaults();
 *  - fields are separated by " " for directories and "\n" for files.
 *
 * NOTE(review): this copy of the function is incomplete - local
 * declarations, braces, else branches and several call arguments are
 * missing.  Restore it from the canonical source before building.
 */
2106 static void lov_dump_user_lmm_header(struct lov_user_md *lum, char *path,
2107 struct lov_user_ost_data_v1 *objects,
2108 int is_dir, int verbose, int depth,
2109 int raw, char *pool_name)
2111 char *prefix = is_dir ? "" : "lmm_";
2112 char *separator = "";
2115 if (is_dir && lmm_oi_seq(&lum->lmm_oi) == FID_SEQ_LOV_DEFAULT) {
2116 lmm_oi_set_seq(&lum->lmm_oi, 0);
2117 if (verbose & VERBOSE_DETAIL)
2118 llapi_printf(LLAPI_MSG_NORMAL, "(Default) ");
2121 if (depth && path && ((verbose != VERBOSE_OBJID) || !is_dir))
2122 llapi_printf(LLAPI_MSG_NORMAL, "%s\n", path);
2124 if ((verbose & VERBOSE_DETAIL) && !is_dir) {
2125 llapi_printf(LLAPI_MSG_NORMAL, "lmm_magic: 0x%08X\n",
2127 llapi_printf(LLAPI_MSG_NORMAL, "lmm_seq: %#jx\n",
2128 (uintmax_t)lmm_oi_seq(&lum->lmm_oi));
2129 llapi_printf(LLAPI_MSG_NORMAL, "lmm_object_id: %#jx\n",
2130 (uintmax_t)lmm_oi_id(&lum->lmm_oi));
2132 if ((verbose & (VERBOSE_DETAIL | VERBOSE_DFID)) && !is_dir) {
2133 if (verbose & ~VERBOSE_DFID)
2134 llapi_printf(LLAPI_MSG_NORMAL, "lmm_fid: ");
2135 /* This needs a bit of hand-holding since old 1.x lmm_oi
2136 * have { oi.oi_id = mds_inum, oi.oi_seq = 0 } and 2.x lmm_oi
2137 * have { oi.oi_id = mds_oid, oi.oi_seq = mds_seq } instead of
2138 * a real FID. Ideally the 2.x code would have stored this
2139 * like a FID with { oi_id = mds_seq, oi_seq = mds_oid } so the
2140 * ostid union lu_fid { f_seq = mds_seq, f_oid = mds_oid }
2141 * worked properly (especially since IGIF FIDs use mds_inum as
2142 * the FID SEQ), but unfortunately that didn't happen.
2144 * Print it to look like an IGIF FID, even though the fields
2145 * are reversed on disk, so that it makes sense to userspace.
2147 * Don't use ostid_id() and ostid_seq(), since they assume the
2148 * oi_fid fields are in the right order. This is why there are
2149 * separate lmm_oi_seq() and lmm_oi_id() routines for this.
2151 * For newer layout types hopefully this will be a real FID. */
2152 llapi_printf(LLAPI_MSG_NORMAL, DFID"\n",
2153 lmm_oi_seq(&lum->lmm_oi) == 0 ?
2154 lmm_oi_id(&lum->lmm_oi) :
2155 lmm_oi_seq(&lum->lmm_oi),
2156 lmm_oi_seq(&lum->lmm_oi) == 0 ?
2157 0 : (__u32)lmm_oi_id(&lum->lmm_oi),
2158 (__u32)(lmm_oi_id(&lum->lmm_oi) >> 32));
2161 if (verbose & VERBOSE_COUNT) {
2162 if (verbose & ~VERBOSE_COUNT)
2163 llapi_printf(LLAPI_MSG_NORMAL, "%sstripe_count: ",
2166 if (!raw && lum->lmm_stripe_count == 0) {
2167 unsigned int scount;
2168 rc = sattr_cache_get_defaults(NULL, path,
2172 llapi_printf(LLAPI_MSG_NORMAL, "%d",
2175 llapi_error(LLAPI_MSG_ERROR, rc,
2176 "Cannot determine default"
2179 llapi_printf(LLAPI_MSG_NORMAL, "%d",
2180 lum->lmm_stripe_count ==
2181 (typeof(lum->lmm_stripe_count))(-1)
2182 ? -1 : lum->lmm_stripe_count);
2185 llapi_printf(LLAPI_MSG_NORMAL, "%hd",
2186 (__s16)lum->lmm_stripe_count);
2188 separator = is_dir ? " " : "\n";
2191 if (verbose & VERBOSE_SIZE) {
2192 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2193 if (verbose & ~VERBOSE_SIZE)
2194 llapi_printf(LLAPI_MSG_NORMAL, "%sstripe_size: ",
2196 if (is_dir && !raw && lum->lmm_stripe_size == 0) {
2198 rc = sattr_cache_get_defaults(NULL, path, NULL, &ssize,
2201 llapi_printf(LLAPI_MSG_NORMAL, "%u", ssize);
2203 llapi_error(LLAPI_MSG_ERROR, rc,
2204 "Cannot determine default"
2207 llapi_printf(LLAPI_MSG_NORMAL, "%u",
2208 lum->lmm_stripe_size);
2210 separator = is_dir ? " " : "\n";
2213 if ((verbose & VERBOSE_LAYOUT) && !is_dir) {
2214 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2215 if (verbose & ~VERBOSE_LAYOUT)
2216 llapi_printf(LLAPI_MSG_NORMAL, "%spattern: ",
2218 llapi_printf(LLAPI_MSG_NORMAL, "%.x", lum->lmm_pattern);
2222 if ((verbose & VERBOSE_GENERATION) && !is_dir) {
2223 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2224 if (verbose & ~VERBOSE_GENERATION)
2225 llapi_printf(LLAPI_MSG_NORMAL, "%slayout_gen: ",
2227 llapi_printf(LLAPI_MSG_NORMAL, "%u",
2228 (int)lum->lmm_layout_gen);
2232 if (verbose & VERBOSE_OFFSET) {
2233 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2234 if (verbose & ~VERBOSE_OFFSET)
2235 llapi_printf(LLAPI_MSG_NORMAL, "%sstripe_offset: ",
2238 llapi_printf(LLAPI_MSG_NORMAL, "%d",
2239 lum->lmm_stripe_offset ==
2240 (typeof(lum->lmm_stripe_offset))(-1) ? -1 :
2241 lum->lmm_stripe_offset);
2243 llapi_printf(LLAPI_MSG_NORMAL, "%u",
2244 objects[0].l_ost_idx);
2245 separator = is_dir ? " " : "\n";
2248 if ((verbose & VERBOSE_POOL) && (pool_name != NULL)) {
2249 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2250 if (verbose & ~VERBOSE_POOL)
2251 llapi_printf(LLAPI_MSG_NORMAL, "%spool: ",
2253 llapi_printf(LLAPI_MSG_NORMAL, "%s", pool_name);
2256 if (!is_dir || (is_dir && (verbose != VERBOSE_OBJID)))
2257 llapi_printf(LLAPI_MSG_NORMAL, "\n");
2260 void lov_dump_user_lmm_v1v3(struct lov_user_md *lum, char *pool_name,
2261 struct lov_user_ost_data_v1 *objects,
2262 char *path, int is_dir, int obdindex,
2263 int depth, int header, int raw)
2265 int i, obdstripe = (obdindex != OBD_NOT_FOUND) ? 0 : 1;
2268 for (i = 0; !is_dir && i < lum->lmm_stripe_count; i++) {
2269 if (obdindex == objects[i].l_ost_idx) {
2277 lov_dump_user_lmm_header(lum, path, objects, is_dir, header,
2278 depth, raw, pool_name);
2280 if (!is_dir && (header & VERBOSE_OBJID) &&
2281 !(lum->lmm_pattern & LOV_PATTERN_F_RELEASED)) {
2283 llapi_printf(LLAPI_MSG_NORMAL,
2284 "\tobdidx\t\t objid\t\t objid\t\t group\n");
2286 for (i = 0; i < lum->lmm_stripe_count; i++) {
2287 int idx = objects[i].l_ost_idx;
2288 long long oid = ostid_id(&objects[i].l_ost_oi);
2289 long long gr = ostid_seq(&objects[i].l_ost_oi);
2290 if ((obdindex == OBD_NOT_FOUND) || (obdindex == idx)) {
2292 sprintf(fmt, "%s%s%s\n",
2293 "\t%6u\t%14llu\t%#13llx\t",
2294 (fid_seq_is_rsvd(gr) ||
2295 fid_seq_is_mdt0(gr)) ?
2296 "%14llu" : "%#14llx", "%s");
2297 llapi_printf(LLAPI_MSG_NORMAL, fmt, idx, oid,
2299 obdindex == idx ? " *" : "");
2303 llapi_printf(LLAPI_MSG_NORMAL, "\n");
/*
 * Print an lmv (directory striping) layout.
 *
 * Visible behaviour:
 *  - the path is prefixed with "(Default)" when lum_magic is
 *    LMV_USER_MAGIC;
 *  - with @obdindex other than OBD_NOT_FOUND the layout is matched against
 *    that MDT: lum_stripe_offset when the stripe count is 0, otherwise the
 *    lum_mds of each stripe;
 *  - the comment "show all information default" introduces the default
 *    @verbose selection: pool, count, offset and hash type for
 *    LMV_USER_MAGIC, VERBOSE_OBJID otherwise;
 *  - VERBOSE_COUNT, VERBOSE_OFFSET and VERBOSE_HASH_TYPE print
 *    lmv_stripe_count, lmv_stripe_offset and lmv_hash_type (by name from
 *    mdt_hash_name[] when the type is below LMV_HASH_TYPE_MAX, numerically
 *    otherwise);
 *  - VERBOSE_OBJID, for anything but LMV_USER_MAGIC, lists the MDT index
 *    and FID of each stripe, marking the one equal to @obdindex with " *";
 *  - VERBOSE_POOL prints a non-empty @pool_name.
 *
 * NOTE(review): this copy of the function is incomplete - braces, else
 * branches, separator assignments and several call arguments are missing.
 * Restore it from the canonical source before building.
 */
2307 void lmv_dump_user_lmm(struct lmv_user_md *lum, char *pool_name,
2308 char *path, int obdindex, int depth, int verbose)
2310 struct lmv_user_mds_data *objects = lum->lum_objects;
2311 char *prefix = lum->lum_magic == LMV_USER_MAGIC ? "(Default)" : "";
2312 int i, obdstripe = 0;
2313 char *separator = "";
2315 if (obdindex != OBD_NOT_FOUND) {
2316 if (lum->lum_stripe_count == 0) {
2317 if (obdindex == lum->lum_stripe_offset)
2320 for (i = 0; i < lum->lum_stripe_count; i++) {
2321 if (obdindex == objects[i].lum_mds) {
2322 llapi_printf(LLAPI_MSG_NORMAL,
2337 /* show all information default */
2339 if (lum->lum_magic == LMV_USER_MAGIC)
2340 verbose = VERBOSE_POOL | VERBOSE_COUNT |
2341 VERBOSE_OFFSET | VERBOSE_HASH_TYPE;
2343 verbose = VERBOSE_OBJID;
2346 if (depth && path && ((verbose != VERBOSE_OBJID)))
2347 llapi_printf(LLAPI_MSG_NORMAL, "%s%s\n", prefix, path);
2349 if (verbose & VERBOSE_COUNT) {
2350 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2351 if (verbose & ~VERBOSE_COUNT)
2352 llapi_printf(LLAPI_MSG_NORMAL, "lmv_stripe_count: ");
2353 llapi_printf(LLAPI_MSG_NORMAL, "%u",
2354 (int)lum->lum_stripe_count);
2355 if (verbose & VERBOSE_OFFSET)
2361 if (verbose & VERBOSE_OFFSET) {
2362 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2363 if (verbose & ~VERBOSE_OFFSET)
2364 llapi_printf(LLAPI_MSG_NORMAL, "lmv_stripe_offset: ");
2365 llapi_printf(LLAPI_MSG_NORMAL, "%d",
2366 (int)lum->lum_stripe_offset);
2367 if (verbose & VERBOSE_HASH_TYPE)
2373 if (verbose & VERBOSE_HASH_TYPE) {
2374 unsigned int type = lum->lum_hash_type;
2376 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2377 if (verbose & ~VERBOSE_HASH_TYPE)
2378 llapi_printf(LLAPI_MSG_NORMAL, "lmv_hash_type: ");
2379 if (type < LMV_HASH_TYPE_MAX)
2380 llapi_printf(LLAPI_MSG_NORMAL, "%s",
2381 mdt_hash_name[type]);
2383 llapi_printf(LLAPI_MSG_NORMAL, "%d",
2388 if (verbose & VERBOSE_OBJID && lum->lum_magic != LMV_USER_MAGIC) {
2389 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2390 if (obdstripe == 1 && lum->lum_stripe_count > 0)
2391 llapi_printf(LLAPI_MSG_NORMAL,
2392 "mdtidx\t\t FID[seq:oid:ver]\n");
2393 for (i = 0; i < lum->lum_stripe_count; i++) {
2394 int idx = objects[i].lum_mds;
2395 struct lu_fid *fid = &objects[i].lum_fid;
2396 if ((obdindex == OBD_NOT_FOUND) || (obdindex == idx))
2397 llapi_printf(LLAPI_MSG_NORMAL,
2398 "%6u\t\t "DFID"\t\t%s\n",
2400 obdindex == idx ? " *" : "");
2405 if ((verbose & VERBOSE_POOL) && pool_name != NULL &&
2406 pool_name[0] != '\0') {
2407 llapi_printf(LLAPI_MSG_NORMAL, "%s", separator);
2408 if (verbose & ~VERBOSE_POOL)
2409 llapi_printf(LLAPI_MSG_NORMAL, "%slmv_pool: ",
2411 llapi_printf(LLAPI_MSG_NORMAL, "%s%c ", pool_name, ' ');
2415 if (!(verbose & VERBOSE_OBJID) || lum->lum_magic == LMV_USER_MAGIC)
2416 llapi_printf(LLAPI_MSG_NORMAL, "\n");
2419 void llapi_lov_dump_user_lmm(struct find_param *param, char *path, int is_dir)
2423 if (param->fp_get_lmv || param->fp_get_default_lmv)
2424 magic = (__u32)param->fp_lmv_md->lum_magic;
2426 magic = *(__u32 *)¶m->fp_lmd->lmd_lmm; /* lum->lmm_magic */
2429 case LOV_USER_MAGIC_V1:
2430 lov_dump_user_lmm_v1v3(¶m->fp_lmd->lmd_lmm, NULL,
2431 param->fp_lmd->lmd_lmm.lmm_objects,
2433 param->fp_obd_index, param->fp_max_depth,
2434 param->fp_verbose, param->fp_raw);
2436 case LOV_USER_MAGIC_V3: {
2437 char pool_name[LOV_MAXPOOLNAME + 1];
2438 struct lov_user_ost_data_v1 *objects;
2439 struct lov_user_md_v3 *lmmv3 = (void *)¶m->fp_lmd->lmd_lmm;
2441 strlcpy(pool_name, lmmv3->lmm_pool_name, sizeof(pool_name));
2442 objects = lmmv3->lmm_objects;
2443 lov_dump_user_lmm_v1v3(¶m->fp_lmd->lmd_lmm,
2444 pool_name[0] == '\0' ? NULL : pool_name,
2445 objects, path, is_dir,
2446 param->fp_obd_index, param->fp_max_depth,
2447 param->fp_verbose, param->fp_raw);
2451 case LMV_USER_MAGIC: {
2452 char pool_name[LOV_MAXPOOLNAME + 1];
2453 struct lmv_user_md *lum;
2455 lum = (struct lmv_user_md *)param->fp_lmv_md;
2456 strlcpy(pool_name, lum->lum_pool_name, sizeof(pool_name));
2457 lmv_dump_user_lmm(lum,
2458 pool_name[0] == '\0' ? NULL : pool_name,
2459 path, param->fp_obd_index,
2460 param->fp_max_depth, param->fp_verbose);
2464 llapi_printf(LLAPI_MSG_NORMAL, "unknown lmm_magic: %#x "
2465 "(expecting one of %#x %#x %#x %#x)\n",
2466 *(__u32 *)¶m->fp_lmd->lmd_lmm,
2467 LOV_USER_MAGIC_V1, LOV_USER_MAGIC_V3,
2468 LMV_USER_MAGIC, LMV_MAGIC_V1);
2473 int llapi_file_get_stripe(const char *path, struct lov_user_md *lum)
2479 fname = strrchr(path, '/');
2481 /* It should be a file (or other non-directory) */
2482 if (fname == NULL) {
2483 dname = (char *)malloc(2);
2487 fname = (char *)path;
2489 dname = (char *)malloc(fname - path + 1);
2492 strncpy(dname, path, fname - path);
2493 dname[fname - path] = '\0';
2497 fd = open(dname, O_RDONLY | O_NONBLOCK);
2504 strcpy((char *)lum, fname);
2505 if (ioctl(fd, IOC_MDC_GETFILESTRIPE, (void *)lum) == -1)
2508 if (close(fd) == -1 && rc == 0)
2515 int llapi_file_lookup(int dirfd, const char *name)
2517 struct obd_ioctl_data data = { 0 };
2522 if (dirfd < 0 || name == NULL)
2525 data.ioc_version = OBD_IOCTL_VERSION;
2526 data.ioc_len = sizeof(data);
2527 data.ioc_inlbuf1 = (char *)name;
2528 data.ioc_inllen1 = strlen(name) + 1;
2530 rc = obd_ioctl_pack(&data, &buf, sizeof(rawbuf));
2532 llapi_error(LLAPI_MSG_ERROR, rc,
2533 "error: IOC_MDC_LOOKUP pack failed for '%s': rc %d",
2538 rc = ioctl(dirfd, IOC_MDC_LOOKUP, buf);
/* Check if the value matches 1 of the given criteria (e.g. --atime +/-N).
 * @mds indicates if this is MDS timestamps and there are attributes on OSTs.
 *
 * The result is -1 if it does not match, 0 if not yet clear, 1 if matches.
 * The table below gives the answers for the specified parameters (value and
 * sign), 1st column is the answer for the MDS value, the 2nd is for the OST:
 * --------------------------------------
 * 1 | file > limit; sign > 0 | -1 / -1 |
 * 2 | file = limit; sign > 0 | -1 / -1 |
 * 3 | file < limit; sign > 0 |  ? /  1 |
 * 4 | file > limit; sign = 0 | -1 / -1 |
 * 5 | file = limit; sign = 0 |  ? /  1 |  <- (see the Note below)
 * 6 | file < limit; sign = 0 |  ? / -1 |
 * 7 | file > limit; sign < 0 |  1 /  1 |
 * 8 | file = limit; sign < 0 |  ? / -1 |
 * 9 | file < limit; sign < 0 |  ? / -1 |
 * --------------------------------------
 * Note: 5th actually means that the value is within the interval
 * (limit - margin, limit].
 *
 * @negopt inverts the sign of the answer (0 stays 0). */
static int find_value_cmp(unsigned long long file, unsigned long long limit,
			  int sign, int negopt, unsigned long long margin,
			  int mds)
{
	int ret = -1;

	if (sign > 0) {
		/* Drop the fraction of margin (of days). */
		if (file + margin <= limit)
			ret = mds ? 0 : 1;
	} else if (sign == 0) {
		if (file <= limit && file + margin > limit)
			ret = mds ? 0 : 1;
		else if (file + margin <= limit)
			ret = mds ? 0 : -1;
	} else {
		if (file > limit)
			ret = 1;
		else if (mds)
			ret = 0;
	}

	return negopt ? -ret : ret;
}
2588 /* Check if the file time matches all the given criteria (e.g. --atime +/-N).
2589 * Return -1 or 1 if file timestamp does not or does match the given criteria
2590 * correspondingly. Return 0 if the MDS time is being checked and there are
2591 * attributes on OSTs and it is not yet clear if the timespamp matches.
2593 * If 0 is returned, we need to do another RPC to the OSTs to obtain the
2594 * updated timestamps. */
2595 static int find_time_check(lstat_t *st, struct find_param *param, int mds)
2600 /* Check if file is accepted. */
2601 if (param->fp_atime) {
2602 rc2 = find_value_cmp(st->st_atime, param->fp_atime,
2603 param->fp_asign, param->fp_exclude_atime,
2610 if (param->fp_mtime) {
2611 rc2 = find_value_cmp(st->st_mtime, param->fp_mtime,
2612 param->fp_msign, param->fp_exclude_mtime,
2617 /* If the previous check matches, but this one is not yet clear,
2618 * we should return 0 to do an RPC on OSTs. */
2623 if (param->fp_ctime) {
2624 rc2 = find_value_cmp(st->st_ctime, param->fp_ctime,
2625 param->fp_csign, param->fp_exclude_ctime,
2630 /* If the previous check matches, but this one is not yet clear,
2631 * we should return 0 to do an RPC on OSTs. */
2640 * Check whether the stripes matches the indexes user provided
2644 static int check_obd_match(struct find_param *param)
2646 lstat_t *st = ¶m->fp_lmd->lmd_st;
2647 struct lov_user_ost_data_v1 *lmm_objects;
2650 if (param->fp_obd_uuid && param->fp_obd_index == OBD_NOT_FOUND)
2653 if (!S_ISREG(st->st_mode))
2656 /* Only those files should be accepted, which have a
2657 * stripe on the specified OST. */
2658 if (!param->fp_lmd->lmd_lmm.lmm_stripe_count)
2661 if (param->fp_lmd->lmd_lmm.lmm_magic ==
2662 LOV_USER_MAGIC_V3) {
2663 struct lov_user_md_v3 *lmmv3 = (void *)¶m->fp_lmd->lmd_lmm;
2665 lmm_objects = lmmv3->lmm_objects;
2666 } else if (param->fp_lmd->lmd_lmm.lmm_magic == LOV_USER_MAGIC_V1) {
2667 lmm_objects = param->fp_lmd->lmd_lmm.lmm_objects;
2669 llapi_err_noerrno(LLAPI_MSG_ERROR, "%s:Unknown magic: 0x%08X\n",
2670 __func__, param->fp_lmd->lmd_lmm.lmm_magic);
2674 for (i = 0; i < param->fp_lmd->lmd_lmm.lmm_stripe_count; i++) {
2675 for (j = 0; j < param->fp_num_obds; j++) {
2676 if (param->fp_obd_indexes[j] ==
2677 lmm_objects[i].l_ost_idx) {
2678 if (param->fp_exclude_obd)
2685 if (param->fp_exclude_obd)
2691 static int check_mdt_match(struct find_param *param)
2695 if (param->fp_mdt_uuid && param->fp_mdt_index == OBD_NOT_FOUND)
2698 /* FIXME: For striped dir, we should get stripe information and check */
2699 for (i = 0; i < param->fp_num_mdts; i++) {
2700 if (param->fp_mdt_indexes[i] == param->fp_file_mdt_index)
2701 return !param->fp_exclude_mdt;
2704 if (param->fp_exclude_mdt)
2711 * Check whether the obd is active or not, if it is
2712 * not active, just print the object affected by this
2715 static int print_failed_tgt(struct find_param *param, char *path, int type)
2717 struct obd_statfs stat_buf;
2718 struct obd_uuid uuid_buf;
2721 if (type != LL_STATFS_LOV && type != LL_STATFS_LMV)
2724 memset(&stat_buf, 0, sizeof(struct obd_statfs));
2725 memset(&uuid_buf, 0, sizeof(struct obd_uuid));
2726 ret = llapi_obd_statfs(path, type,
2727 param->fp_obd_index, &stat_buf,
2730 llapi_printf(LLAPI_MSG_NORMAL,
2731 "obd_uuid: %s failed %s ",
2732 param->fp_obd_uuid->uuid,
/*
 * Traversal callback that decides whether @path satisfies the search
 * criteria held in the find_param passed as @data, and prints it if so.
 *
 * "decision" starts at 1 (accepted); -1 means rejected and 0 is used when
 * attributes have to be fetched before a decision is possible.  Stages that
 * are visible here, in order:
 *  - name filter: fnmatch() of the last path component against fp_pattern,
 *    honouring fp_exclude_pattern;
 *  - file type taken from the dirent when its d_type is known;
 *  - get_lmd_info() when any attribute test is requested; if it returns a
 *    layout with lmm_magic 0 and a layout test is pending, "use the
 *    default" values are filled in (pattern 0xFFFFFFFF, stripe size and
 *    count 0, stripe offset -1);
 *  - with fp_mdt_uuid set, the MDT index is obtained through
 *    llapi_file_fget_mdtidx() on the directory itself, on the opened
 *    regular file, or on the parent directory for special files;
 *  - file type test against st_mode when it was not done from the dirent;
 *  - target indexes are reset when st_dev differs from fp_dev (a mount
 *    point was crossed) and set up again via setup_target_indexes();
 *  - stripe size, stripe count, layout, OST/MDT, uid, gid and pool tests;
 *  - time tests against the MDS attributes, then a second stat
 *    (fstat_f/fstatat_f/lstat_f) followed by the time and size tests on
 *    the refreshed attributes;
 *  - the path is printed unless the decision is -1, followed by a '\0'
 *    when fp_zero_end is set (presumably by "\n" otherwise - the else is
 *    not visible);
 *  - a check of fp_depth against fp_max_depth.
 *
 * NOTE(review): this copy of the function is incomplete - local
 * declarations, braces, else branches, goto statements/labels and return
 * statements are missing, several comment terminators were lost, and
 * "&param" shows up as a mis-encoded character.  Restore it from the
 * canonical source before building.
 */
2739 static int cb_find_init(char *path, DIR *parent, DIR **dirp,
2740 void *data, struct dirent64 *de)
2742 struct find_param *param = (struct find_param *)data;
2743 DIR *dir = dirp == NULL ? NULL : *dirp;
2744 int decision = 1; /* 1 is accepted; -1 is rejected. */
2745 lstat_t *st = ¶m->fp_lmd->lmd_st;
2747 int checked_type = 0;
2750 if (parent == NULL && dir == NULL)
2753 param->fp_lmd->lmd_lmm.lmm_stripe_count = 0;
2755 /* If a regular expression is presented, make the initial decision */
2756 if (param->fp_pattern != NULL) {
2757 char *fname = strrchr(path, '/');
2758 fname = (fname == NULL ? path : fname + 1);
2759 ret = fnmatch(param->fp_pattern, fname, 0);
2760 if ((ret == FNM_NOMATCH && !param->fp_exclude_pattern) ||
2761 (ret == 0 && param->fp_exclude_pattern))
2765 /* See if we can check the file type from the dirent. */
2766 if (param->fp_type != 0 && de != NULL && de->d_type != DT_UNKNOWN) {
2769 if (DTTOIF(de->d_type) == param->fp_type) {
2770 if (param->fp_exclude_type)
2773 if (!param->fp_exclude_type)
2780 /* Request MDS for the stat info if some of these parameters need
2781 * to be compared. */
2782 if (param->fp_obd_uuid || param->fp_mdt_uuid ||
2783 param->fp_check_uid || param->fp_check_gid ||
2784 param->fp_atime || param->fp_mtime || param->fp_ctime ||
2785 param->fp_check_pool || param->fp_check_size ||
2786 param->fp_check_stripe_count || param->fp_check_stripe_size ||
2787 param->fp_check_layout)
2790 if (param->fp_type != 0 && checked_type == 0)
2793 if (decision == 0) {
2794 ret = get_lmd_info(path, parent, dir, param->fp_lmd,
2795 param->fp_lum_size);
2796 if (ret == 0 && param->fp_lmd->lmd_lmm.lmm_magic == 0 &&
2797 (param->fp_check_pool || param->fp_check_stripe_count ||
2798 param->fp_check_stripe_size || param->fp_check_layout)) {
2799 struct lov_user_md *lmm = ¶m->fp_lmd->lmd_lmm;
2801 /* We need to "fake" the "use the default" values
2802 * since the lmm struct is zeroed out at this point. */
2803 lmm->lmm_magic = LOV_USER_MAGIC_V1;
2804 lmm->lmm_pattern = 0xFFFFFFFF;
2806 ostid_set_seq(&lmm->lmm_oi,
2807 FID_SEQ_LOV_DEFAULT);
2808 lmm->lmm_stripe_size = 0;
2809 lmm->lmm_stripe_count = 0;
2810 lmm->lmm_stripe_offset = -1;
2812 if (ret == 0 && param->fp_mdt_uuid != NULL) {
2814 ret = llapi_file_fget_mdtidx(dirfd(dir),
2815 ¶m->fp_file_mdt_index);
2816 } else if (S_ISREG(st->st_mode)) {
2819 /* FIXME: we could get the MDT index from the
2820 * file's FID in lmd->lmd_lmm.lmm_oi without
2821 * opening the file, once we are sure that
2822 * LFSCK2 (2.6) has fixed up pre-2.0 LOV EAs.
2823 * That would still be an ioctl() to map the
2824 * FID to the MDT, but not an open RPC. */
2825 fd = open(path, O_RDONLY);
2827 ret = llapi_file_fget_mdtidx(fd,
2828 ¶m->fp_file_mdt_index);
2834 /* For a special file, we assume it resides on
2835 * the same MDT as the parent directory. */
2836 ret = llapi_file_fget_mdtidx(dirfd(parent),
2837 ¶m->fp_file_mdt_index);
2850 if (param->fp_type && !checked_type) {
2851 if ((st->st_mode & S_IFMT) == param->fp_type) {
2852 if (param->fp_exclude_type)
2855 if (!param->fp_exclude_type)
2861 if (param->fp_obd_uuid || param->fp_mdt_uuid) {
2862 if (lustre_fs && param->fp_got_uuids &&
2863 param->fp_dev != st->st_dev) {
2864 /* A lustre/lustre mount point is crossed. */
2865 param->fp_got_uuids = 0;
2866 param->fp_obds_printed = 0;
2867 param->fp_mdt_index = OBD_NOT_FOUND;
2868 param->fp_obd_index = OBD_NOT_FOUND;
2871 if (lustre_fs && !param->fp_got_uuids) {
2872 ret = setup_target_indexes(dir ? dir : parent, path,
2877 param->fp_dev = st->st_dev;
2878 } else if (!lustre_fs && param->fp_got_uuids) {
2879 /* A lustre/non-lustre mount point is crossed. */
2880 param->fp_got_uuids = 0;
2881 param->fp_mdt_index = OBD_NOT_FOUND;
2882 param->fp_obd_index = OBD_NOT_FOUND;
2886 if (param->fp_check_stripe_size) {
2887 decision = find_value_cmp(
2888 param->fp_lmd->lmd_lmm.lmm_stripe_size,
2889 param->fp_stripe_size,
2890 param->fp_stripe_size_sign,
2891 param->fp_exclude_stripe_size,
2892 param->fp_stripe_size_units, 0);
2897 if (param->fp_check_stripe_count) {
2898 decision = find_value_cmp(
2899 param->fp_lmd->lmd_lmm.lmm_stripe_count,
2900 param->fp_stripe_count,
2901 param->fp_stripe_count_sign,
2902 param->fp_exclude_stripe_count, 1, 0);
2907 if (param->fp_check_layout) {
2910 found = (param->fp_lmd->lmd_lmm.lmm_pattern & param->fp_layout);
2911 if ((param->fp_lmd->lmd_lmm.lmm_pattern == 0xFFFFFFFF) ||
2912 (found && param->fp_exclude_layout) ||
2913 (!found && !param->fp_exclude_layout)) {
2919 /* If an OBD UUID is specified but none matches, skip this file. */
2920 if ((param->fp_obd_uuid && param->fp_obd_index == OBD_NOT_FOUND) ||
2921 (param->fp_mdt_uuid && param->fp_mdt_index == OBD_NOT_FOUND))
2924 /* If an OST or MDT UUID is given, and some OST matches,
2926 if (param->fp_obd_index != OBD_NOT_FOUND ||
2927 param->fp_mdt_index != OBD_NOT_FOUND) {
2928 if (param->fp_obd_uuid) {
2929 if (check_obd_match(param)) {
2930 /* If no mdtuuid is given, we are done.
2931 * Otherwise, fall through to the mdtuuid
2933 if (!param->fp_mdt_uuid)
2940 if (param->fp_mdt_uuid) {
2941 if (check_mdt_match(param))
2948 if (param->fp_check_uid) {
2949 if (st->st_uid == param->fp_uid) {
2950 if (param->fp_exclude_uid)
2953 if (!param->fp_exclude_uid)
2958 if (param->fp_check_gid) {
2959 if (st->st_gid == param->fp_gid) {
2960 if (param->fp_exclude_gid)
2963 if (!param->fp_exclude_gid)
2968 if (param->fp_check_pool) {
2969 struct lov_user_md_v3 *lmmv3 = (void *)¶m->fp_lmd->lmd_lmm;
2971 /* empty requested pool is taken as no pool search => V1 */
2972 if (((param->fp_lmd->lmd_lmm.lmm_magic == LOV_USER_MAGIC_V1) &&
2973 (param->fp_poolname[0] == '\0')) ||
2974 ((param->fp_lmd->lmd_lmm.lmm_magic == LOV_USER_MAGIC_V3) &&
2975 (strncmp(lmmv3->lmm_pool_name,
2976 param->fp_poolname, LOV_MAXPOOLNAME) == 0)) ||
2977 ((param->fp_lmd->lmd_lmm.lmm_magic == LOV_USER_MAGIC_V3) &&
2978 (strcmp(param->fp_poolname, "*") == 0))) {
2979 if (param->fp_exclude_pool)
2982 if (!param->fp_exclude_pool)
2987 /* Check the time on mds. */
2989 if (param->fp_atime || param->fp_mtime || param->fp_ctime) {
2992 for_mds = lustre_fs ? (S_ISREG(st->st_mode) &&
2993 param->fp_lmd->lmd_lmm.lmm_stripe_count)
2995 decision = find_time_check(st, param, for_mds);
3000 /* If file still fits the request, ask ost for updated info.
3001 The regular stat is almost of the same speed as some new
3002 'glimpse-size-ioctl'. */
3004 if (param->fp_check_size && S_ISREG(st->st_mode) &&
3005 param->fp_lmd->lmd_lmm.lmm_stripe_count)
3008 if (param->fp_check_size && S_ISDIR(st->st_mode))
3012 /* For regular files with the stripe the decision may have not
3013 * been taken yet if *time or size is to be checked. */
3014 if (param->fp_obd_index != OBD_NOT_FOUND)
3015 print_failed_tgt(param, path, LL_STATFS_LOV);
3017 if (param->fp_mdt_index != OBD_NOT_FOUND)
3018 print_failed_tgt(param, path, LL_STATFS_LMV);
3021 ret = fstat_f(dirfd(dir), st);
3022 else if (de != NULL)
3023 ret = fstatat_f(dirfd(parent), de->d_name, st,
3024 AT_SYMLINK_NOFOLLOW);
3026 ret = lstat_f(path, st);
3029 if (errno == ENOENT) {
3030 llapi_error(LLAPI_MSG_ERROR, -ENOENT,
3031 "warning: %s: %s does not exist",
3036 llapi_error(LLAPI_MSG_ERROR, ret,
3037 "%s: IOC_LOV_GETINFO on %s failed",
3043 /* Check the time on osc. */
3044 decision = find_time_check(st, param, 0);
3049 if (param->fp_check_size)
3050 decision = find_value_cmp(st->st_size, param->fp_size,
3051 param->fp_size_sign,
3052 param->fp_exclude_size,
3053 param->fp_size_units, 0);
3055 if (decision != -1) {
3056 llapi_printf(LLAPI_MSG_NORMAL, "%s", path);
3057 if (param->fp_zero_end)
3058 llapi_printf(LLAPI_MSG_NORMAL, "%c", '\0');
3060 llapi_printf(LLAPI_MSG_NORMAL, "\n");
3064 /* Do not get down anymore? */
3065 if (param->fp_depth == param->fp_max_depth)
3073 static int cb_migrate_mdt_init(char *path, DIR *parent, DIR **dirp,
3074 void *param_data, struct dirent64 *de)
3076 struct find_param *param = (struct find_param *)param_data;
3077 DIR *tmp_parent = parent;
3078 char raw[OBD_MAX_IOCTL_BUFFER] = {'\0'};
3080 struct obd_ioctl_data data = { 0 };
3087 if (parent == NULL && dirp == NULL)
3093 if (parent == NULL) {
3094 tmp_parent = opendir_parent(path);
3095 if (tmp_parent == NULL) {
3098 llapi_error(LLAPI_MSG_ERROR, ret,
3099 "can not open %s", path);
3104 fd = dirfd(tmp_parent);
3106 path_copy = strdup(path);
3107 filename = basename(path_copy);
3108 data.ioc_inlbuf1 = (char *)filename;
3109 data.ioc_inllen1 = strlen(filename) + 1;
3110 data.ioc_inlbuf2 = (char *)¶m->fp_mdt_index;
3111 data.ioc_inllen2 = sizeof(param->fp_mdt_index);
3112 ret = obd_ioctl_pack(&data, &rawbuf, sizeof(raw));
3114 llapi_error(LLAPI_MSG_ERROR, ret,
3115 "llapi_obd_statfs: error packing ioctl data");
3120 ret = ioctl(fd, LL_IOC_MIGRATE, rawbuf);
3122 if (errno == EBUSY && !retry) {
3123 /* because migrate may not be able to lock all involved
3124 * objects in order, for some of them it try lock, while
3125 * there may be conflicting COS locks and cause migrate
3126 * fail with EBUSY, hope a sync() could cause
3127 * transaction commit and release these COS locks. */
3133 fprintf(stderr, "%s migrate failed: %s (%d)\n",
3134 path, strerror(-ret), ret);
3136 } else if (param->fp_verbose & VERBOSE_DETAIL) {
3137 fprintf(stdout, "migrate %s to MDT%d\n",
3138 path, param->fp_mdt_index);
3143 /* If the directory is being migration, we need
3144 * close the directory after migration,
3145 * so the old directory cache will be cleanup
3146 * on the client side, and re-open to get the
3147 * new directory handle */
3148 *dirp = opendir(path);
3149 if (*dirp == NULL) {
3151 llapi_error(LLAPI_MSG_ERROR, ret,
3152 "%s: Failed to open '%s'", __func__, path);
3157 closedir(tmp_parent);
3164 int llapi_migrate_mdt(char *path, struct find_param *param)
3166 return param_callback(path, cb_migrate_mdt_init, cb_common_fini, param);
3169 int llapi_mv(char *path, struct find_param *param)
3171 #if LUSTRE_VERSION_CODE > OBD_OCD_VERSION(2, 9, 53, 0)
3172 static bool printed;
3175 llapi_error(LLAPI_MSG_ERROR, -ESTALE,
3176 "llapi_mv() is deprecated, use llapi_migrate_mdt()\n");
3180 return llapi_migrate_mdt(path, param);
3183 int llapi_find(char *path, struct find_param *param)
3185 return param_callback(path, cb_find_init, cb_common_fini, param);
3189 * Get MDT number that the file/directory inode referenced
3190 * by the open fd resides on.
3191 * Return 0 and mdtidx on success, or -ve errno.
3193 int llapi_file_fget_mdtidx(int fd, int *mdtidx)
3195 if (ioctl(fd, LL_IOC_GET_MDTIDX, mdtidx) < 0)
3200 static int cb_get_mdt_index(char *path, DIR *parent, DIR **dirp, void *data,
3201 struct dirent64 *de)
3203 struct find_param *param = (struct find_param *)data;
3204 DIR *d = dirp == NULL ? NULL : *dirp;
3208 if (parent == NULL && d == NULL)
3212 ret = llapi_file_fget_mdtidx(dirfd(d), &mdtidx);
3213 } else /* if (parent) */ {
3216 fd = open(path, O_RDONLY | O_NOCTTY);
3218 ret = llapi_file_fget_mdtidx(fd, &mdtidx);
3226 if (ret == -ENODATA) {
3227 if (!param->fp_obd_uuid)
3228 llapi_printf(LLAPI_MSG_NORMAL,
3229 "'%s' has no stripe info\n", path);
3231 } else if (ret == -ENOENT) {
3232 llapi_error(LLAPI_MSG_WARN, ret,
3233 "warning: %s: '%s' does not exist",
3236 } else if (ret == -ENOTTY) {
3237 llapi_error(LLAPI_MSG_ERROR, ret,
3238 "%s: '%s' not on a Lustre fs",
3241 llapi_error(LLAPI_MSG_ERROR, ret,
3242 "error: %s: '%s' failed get_mdtidx",
3248 if (param->fp_quiet || !(param->fp_verbose & VERBOSE_DETAIL))
3249 llapi_printf(LLAPI_MSG_NORMAL, "%d\n", mdtidx);
3251 llapi_printf(LLAPI_MSG_NORMAL, "%s\nmdt_index:\t%d\n",
3255 /* Do not go down anymore? */
3256 if (param->fp_depth == param->fp_max_depth)
3264 static int cb_getstripe(char *path, DIR *parent, DIR **dirp, void *data,
3265 struct dirent64 *de)
3267 struct find_param *param = (struct find_param *)data;
3268 DIR *d = dirp == NULL ? NULL : *dirp;
3271 if (parent == NULL && d == NULL)
3274 if (param->fp_obd_uuid) {
3275 param->fp_quiet = 1;
3276 ret = setup_obd_uuid(d ? dirfd(d) : dirfd(parent), path, param);
3282 if (param->fp_get_lmv || param->fp_get_default_lmv) {
3283 ret = cb_get_dirstripe(path, d, param);
3285 ret = ioctl(dirfd(d), LL_IOC_LOV_GETSTRIPE,
3286 (void *)¶m->fp_lmd->lmd_lmm);
3289 } else if (parent && !param->fp_get_lmv && !param->fp_get_default_lmv) {
3290 char *fname = strrchr(path, '/');
3291 fname = (fname == NULL ? path : fname + 1);
3293 strlcpy((char *)¶m->fp_lmd->lmd_lmm, fname,
3294 param->fp_lum_size);
3296 ret = ioctl(dirfd(parent), IOC_MDC_GETFILESTRIPE,
3297 (void *)¶m->fp_lmd->lmd_lmm);
3303 if (errno == ENODATA && d != NULL) {
3304 /* We need to "fake" the "use the default" values
3305 * since the lmm struct is zeroed out at this point.
3306 * The magic needs to be set in order to satisfy
3307 * a check later on in the code path.
3308 * The object_seq needs to be set for the "(Default)"
3309 * prefix to be displayed. */
3310 if (param->fp_get_default_lmv) {
3311 struct lmv_user_md *lum = param->fp_lmv_md;
3313 lum->lum_magic = LMV_USER_MAGIC;
3314 lum->lum_stripe_count = 0;
3315 lum->lum_stripe_offset = -1;
3317 } else if (param->fp_get_lmv) {
3318 struct lmv_user_md *lum = param->fp_lmv_md;
3321 ret = llapi_file_fget_mdtidx(dirfd(d), &mdtidx);
3324 lum->lum_magic = LMV_MAGIC_V1;
3325 lum->lum_stripe_count = 0;
3326 lum->lum_stripe_offset = mdtidx;
3329 struct lov_user_md *lmm =
3330 ¶m->fp_lmd->lmd_lmm;
3332 lmm->lmm_magic = LOV_USER_MAGIC_V1;
3334 ostid_set_seq(&lmm->lmm_oi,
3335 FID_SEQ_LOV_DEFAULT);
3336 lmm->lmm_stripe_count = 0;
3337 lmm->lmm_stripe_size = 0;
3338 lmm->lmm_stripe_offset = -1;
3341 } else if (errno == ENODATA && parent != NULL) {
3342 if (!param->fp_obd_uuid && !param->fp_mdt_uuid)
3343 llapi_printf(LLAPI_MSG_NORMAL,
3344 "%s has no stripe info\n", path);
3346 } else if (errno == ENOENT) {
3347 llapi_error(LLAPI_MSG_WARN, -ENOENT,
3348 "warning: %s: %s does not exist",
3351 } else if (errno == ENOTTY) {
3353 llapi_error(LLAPI_MSG_ERROR, ret,
3354 "%s: '%s' not on a Lustre fs?",
3359 llapi_error(LLAPI_MSG_ERROR, ret,
3360 "error: %s: %s failed for %s",
3361 __func__, d ? "LL_IOC_LOV_GETSTRIPE" :
3362 "IOC_MDC_GETFILESTRIPE", path);
3369 if (!(param->fp_verbose & VERBOSE_MDTINDEX))
3370 llapi_lov_dump_user_lmm(param, path, d ? 1 : 0);
3373 /* Do not get down anymore? */
3374 if (param->fp_depth == param->fp_max_depth)
3382 int llapi_getstripe(char *path, struct find_param *param)
3384 return param_callback(path, (param->fp_verbose & VERBOSE_MDTINDEX) ?
3385 cb_get_mdt_index : cb_getstripe,
3386 cb_common_fini, param);
3389 int llapi_obd_fstatfs(int fd, __u32 type, __u32 index,
3390 struct obd_statfs *stat_buf, struct obd_uuid *uuid_buf)
3392 char raw[OBD_MAX_IOCTL_BUFFER] = {'\0'};
3394 struct obd_ioctl_data data = { 0 };
3397 data.ioc_inlbuf1 = (char *)&type;
3398 data.ioc_inllen1 = sizeof(__u32);
3399 data.ioc_inlbuf2 = (char *)&index;
3400 data.ioc_inllen2 = sizeof(__u32);
3401 data.ioc_pbuf1 = (char *)stat_buf;
3402 data.ioc_plen1 = sizeof(struct obd_statfs);
3403 data.ioc_pbuf2 = (char *)uuid_buf;
3404 data.ioc_plen2 = sizeof(struct obd_uuid);
3406 rc = obd_ioctl_pack(&data, &rawbuf, sizeof(raw));
3408 llapi_error(LLAPI_MSG_ERROR, rc,
3409 "llapi_obd_statfs: error packing ioctl data");
3413 rc = ioctl(fd, IOC_OBD_STATFS, (void *)rawbuf);
3415 return rc < 0 ? -errno : 0;
3418 int llapi_obd_statfs(char *path, __u32 type, __u32 index,
3419 struct obd_statfs *stat_buf, struct obd_uuid *uuid_buf)
3424 fd = open(path, O_RDONLY);
3427 llapi_error(LLAPI_MSG_ERROR, rc, "error: %s: opening '%s'",
3429 /* If we can't even open a file on the filesystem (e.g. with
3430 * -ESHUTDOWN), force caller to exit or it will loop forever. */
3434 rc = llapi_obd_fstatfs(fd, type, index, stat_buf, uuid_buf);
3441 #define MAX_STRING_SIZE 128
3443 int llapi_ping(char *obd_type, char *obd_name)
3449 rc = cfs_get_param_paths(&path, "%s/%s/ping",
3450 obd_type, obd_name);
3454 fd = open(path.gl_pathv[0], O_WRONLY);
3457 llapi_error(LLAPI_MSG_ERROR, rc, "error opening %s",
3462 /* The purpose is to send a byte as a ping, whatever this byte is. */
3463 /* coverity[uninit_use_in_call] */
3464 rc = write(fd, buf, 1);
3472 cfs_free_param_data(&path);
3476 int llapi_target_iterate(int type_num, char **obd_type,
3477 void *args, llapi_cb_t cb)
3479 char buf[MAX_STRING_SIZE];
3484 rc = cfs_get_param_paths(¶m, "devices");
3488 fp = fopen(param.gl_pathv[0], "r");
3491 llapi_error(LLAPI_MSG_ERROR, rc, "error: opening '%s'",
3496 while (fgets(buf, sizeof(buf), fp) != NULL) {
3497 char *obd_type_name = NULL;
3498 char *obd_name = NULL;
3499 char *obd_uuid = NULL;
3501 struct obd_statfs osfs_buffer;
3503 while(bufp[0] == ' ')
3506 for(i = 0; i < 3; i++) {
3507 obd_type_name = strsep(&bufp, " ");
3509 obd_name = strsep(&bufp, " ");
3510 obd_uuid = strsep(&bufp, " ");
3512 memset(&osfs_buffer, 0, sizeof (osfs_buffer));
3514 for (i = 0; i < type_num; i++) {
3515 if (strcmp(obd_type_name, obd_type[i]) != 0)
3518 cb(obd_type_name, obd_name, obd_uuid, args);
3523 cfs_free_param_data(¶m);
3527 static void do_target_check(char *obd_type_name, char *obd_name,
3528 char *obd_uuid, void *args)
3532 rc = llapi_ping(obd_type_name, obd_name);
3533 if (rc == ENOTCONN) {
3534 llapi_printf(LLAPI_MSG_NORMAL, "%s inactive.\n", obd_name);
3536 llapi_error(LLAPI_MSG_ERROR, rc, "error: check '%s'", obd_name);
3538 llapi_printf(LLAPI_MSG_NORMAL, "%s active.\n", obd_name);
3542 int llapi_target_check(int type_num, char **obd_type, char *dir)
3544 return llapi_target_iterate(type_num, obd_type, NULL, do_target_check);
3547 #undef MAX_STRING_SIZE
/**
 * Is this a lustre fs?
 *
 * \param[in] type  mount type string, must not be NULL
 *
 * \retval 1 if \a type is exactly "lustre" or "lustre_lite"
 * \retval 0 otherwise
 */
int llapi_is_lustre_mnttype(const char *type)
{
	return (strcmp(type, "lustre") == 0 ||
		strcmp(type, "lustre_lite") == 0);
}
/**
 * Is this a lustre client fs?
 *
 * \param[in] mnt  mount table entry to inspect
 *
 * \retval non-zero if the mount type is a Lustre type and the mounted
 *         device name contains ":/"
 * \retval 0 otherwise
 */
int llapi_is_lustre_mnt(struct mntent *mnt)
{
	return (llapi_is_lustre_mnttype(mnt->mnt_type) &&
		strstr(mnt->mnt_fsname, ":/") != NULL);
}
3562 int llapi_quotactl(char *mnt, struct if_quotactl *qctl)
3564 char fsname[PATH_MAX + 1];
3568 rc = llapi_search_fsname(mnt, fsname);
3570 llapi_err_noerrno(LLAPI_MSG_ERROR,
3571 "'%s' isn't on Lustre filesystem", mnt);
3575 root = open(mnt, O_RDONLY | O_DIRECTORY);
3578 llapi_error(LLAPI_MSG_ERROR, rc, "open %s failed", mnt);
3582 rc = ioctl(root, OBD_IOC_QUOTACTL, qctl);
3590 /* Print mdtname 'name' into 'buf' using 'format'. Add -MDT0000 if needed.
3591 * format must have %s%s, buf must be > 16
3592 * Eg: if name = "lustre-MDT0000", "lustre", or "lustre-MDT0000_UUID"
3593 * then buf = "lustre-MDT0000"
3595 static int get_mdtname(char *name, char *format, char *buf)
3597 char suffix[]="-MDT0000";
3598 int len = strlen(name);
3600 if ((len > 5) && (strncmp(name + len - 5, "_UUID", 5) == 0)) {
3601 name[len - 5] = '\0';
3606 if ((len <= 16) && strncmp(name + len - 8, "-MDT", 4) == 0) {
3609 /* Not enough room to add suffix */
3610 llapi_err_noerrno(LLAPI_MSG_ERROR,
3611 "MDT name too long |%s|", name);
3616 return sprintf(buf, format, name, suffix);
3619 /** ioctl on filsystem root, with mdtindex sent as data
3620 * \param mdtname path, fsname, or mdtname (lutre-MDT0004)
3621 * \param mdtidxp pointer to integer within data to be filled in with the
3622 * mdt index (0 if no mdt is specified). NULL won't be filled.
3624 int root_ioctl(const char *mdtname, int opc, void *data, int *mdtidxp,
3632 /* Take path, fsname, or MDTname. Assume MDT0000 in the former cases.
3633 Open root and parse mdt index. */
3634 if (mdtname[0] == '/') {
3636 rc = get_root_path(WANT_FD | want_error, NULL, &fd,
3637 (char *)mdtname, -1);
3639 if (get_mdtname((char *)mdtname, "%s%s", fsname) < 0)
3641 ptr = fsname + strlen(fsname) - 8;
3643 index = strtol(ptr + 4, NULL, 10);
3644 rc = get_root_path(WANT_FD | want_error, fsname, &fd, NULL, -1);
3648 llapi_err_noerrno(LLAPI_MSG_ERROR,
3649 "Can't open %s: %d\n", mdtname, rc);
3656 rc = ioctl(fd, opc, data);
3665 /****** Changelog API ********/
3667 static int changelog_ioctl(const char *mdtname, int opc, int id,
3668 long long recno, int flags)
3670 struct ioc_changelog data;
3674 data.icc_recno = recno;
3675 data.icc_flags = flags;
3676 idx = (int *)(&data.icc_mdtindex);
3678 return root_ioctl(mdtname, opc, &data, idx, WANT_ERROR);
3681 #define CHANGELOG_PRIV_MAGIC 0xCA8E1080
3682 struct changelog_private {
3684 enum changelog_send_flag flags;
3685 struct lustre_kernelcomm kuc;
3688 /** Start reading from a changelog
3689 * @param priv Opaque private control structure
3690 * @param flags Start flags (e.g. CHANGELOG_FLAG_BLOCK)
3691 * @param device Report changes recorded on this MDT
3692 * @param startrec Report changes beginning with this record number
3693 * (just call llapi_changelog_fini when done; don't need an endrec)
3695 int llapi_changelog_start(void **priv, enum changelog_send_flag flags,
3696 const char *device, long long startrec)
3698 struct changelog_private *cp;
3702 /* Set up the receiver control struct */
3703 cp = calloc(1, sizeof(*cp));
3707 cp->magic = CHANGELOG_PRIV_MAGIC;
3710 /* Set up the receiver */
3711 rc = libcfs_ukuc_start(&cp->kuc, 0 /* no group registration */, 0);
3717 /* CHANGELOG_FLAG_JOBID will eventually become mandatory. Display a
3718 * warning if it's missing. */
3719 if (!(flags & CHANGELOG_FLAG_JOBID) && !warned) {
3720 llapi_err_noerrno(LLAPI_MSG_WARN, "warning: %s() called "
3721 "w/o CHANGELOG_FLAG_JOBID", __func__);
3725 /* Tell the kernel to start sending */
3726 rc = changelog_ioctl(device, OBD_IOC_CHANGELOG_SEND, cp->kuc.lk_wfd,
3728 /* Only the kernel reference keeps the write side open */
3729 close(cp->kuc.lk_wfd);
3730 cp->kuc.lk_wfd = LK_NOFD;
3732 /* frees and clears priv */
3733 llapi_changelog_fini(priv);
3744 /** Finish reading from a changelog */
3745 int llapi_changelog_fini(void **priv)
3747 struct changelog_private *cp = (struct changelog_private *)*priv;
3749 if (!cp || (cp->magic != CHANGELOG_PRIV_MAGIC))
3752 libcfs_ukuc_stop(&cp->kuc);
/**
 * Convert all records to the same format according to the caller's wishes.
 * Default is CLF_VERSION | CLF_RENAME.
 * Add CLF_JOBID if explicitly requested.
 *
 * \param rec  The record to remap. It is expected to be big enough to
 *             properly handle the final format.
 * \return 1 if anything changed. 0 otherwise.
 */
3767 /** Read the next changelog entry
3768 * @param priv Opaque private control structure
3769 * @param rech Changelog record handle; record will be allocated here
3770 * @return 0 valid message received; rec is set
3774 #define DEFAULT_RECORD_FMT (CLF_VERSION | CLF_RENAME)
3775 int llapi_changelog_recv(void *priv, struct changelog_rec **rech)
3777 struct changelog_private *cp = (struct changelog_private *)priv;
3778 struct kuc_hdr *kuch;
3779 enum changelog_rec_flags rec_fmt = DEFAULT_RECORD_FMT;
3782 if (!cp || (cp->magic != CHANGELOG_PRIV_MAGIC))
3786 kuch = malloc(KUC_CHANGELOG_MSG_MAXSIZE);
3790 if (cp->flags & CHANGELOG_FLAG_JOBID)
3791 rec_fmt |= CLF_JOBID;
3794 rc = libcfs_ukuc_msg_get(&cp->kuc, (char *)kuch,
3795 KUC_CHANGELOG_MSG_MAXSIZE,
3796 KUC_TRANSPORT_CHANGELOG);
3800 if ((kuch->kuc_transport != KUC_TRANSPORT_CHANGELOG) ||
3801 ((kuch->kuc_msgtype != CL_RECORD) &&
3802 (kuch->kuc_msgtype != CL_EOF))) {
3803 llapi_err_noerrno(LLAPI_MSG_ERROR,
3804 "Unknown changelog message type %d:%d\n",
3805 kuch->kuc_transport, kuch->kuc_msgtype);
3810 if (kuch->kuc_msgtype == CL_EOF) {
3811 if (cp->flags & CHANGELOG_FLAG_FOLLOW) {
3820 /* Our message is a changelog_rec. Use pointer math to skip
3821 * kuch_hdr and point directly to the message payload. */
3822 *rech = (struct changelog_rec *)(kuch + 1);
3823 changelog_remap_rec(*rech, rec_fmt);
3833 /** Release the changelog record when done with it. */
3834 int llapi_changelog_free(struct changelog_rec **rech)
3837 /* We allocated memory starting at the kuc_hdr, but passed
3838 * the consumer a pointer to the payload.
3839 * Use pointer math to get back to the header.
3841 struct kuc_hdr *kuch = (struct kuc_hdr *)*rech - 1;
3848 int llapi_changelog_clear(const char *mdtname, const char *idstr,
3854 llapi_err_noerrno(LLAPI_MSG_ERROR,
3855 "can't purge negative records\n");
3859 id = strtol(idstr + strlen(CHANGELOG_USER_PREFIX), NULL, 10);
3860 if ((id == 0) || (strncmp(idstr, CHANGELOG_USER_PREFIX,
3861 strlen(CHANGELOG_USER_PREFIX)) != 0)) {
3862 llapi_err_noerrno(LLAPI_MSG_ERROR,
3863 "expecting id of the form '"
3864 CHANGELOG_USER_PREFIX
3865 "<num>'; got '%s'\n", idstr);
3869 return changelog_ioctl(mdtname, OBD_IOC_CHANGELOG_CLEAR, id, endrec, 0);
3872 int llapi_fid2path(const char *device, const char *fidstr, char *buf,
3873 int buflen, long long *recno, int *linkno)
3875 const char *fidstr_orig = fidstr;
3877 struct getinfo_fid2path *gf;
3880 while (*fidstr == '[')
3883 sscanf(fidstr, SFID, RFID(&fid));
3884 if (!fid_is_sane(&fid)) {
3885 llapi_err_noerrno(LLAPI_MSG_ERROR,
3886 "bad FID format '%s', should be [seq:oid:ver]"
3887 " (e.g. "DFID")\n", fidstr_orig,
3888 (unsigned long long)FID_SEQ_NORMAL, 2, 0);
3892 gf = malloc(sizeof(*gf) + buflen);
3897 gf->gf_recno = *recno;
3898 gf->gf_linkno = *linkno;
3899 gf->gf_pathlen = buflen;
3901 /* Take path or fsname */
3902 rc = root_ioctl(device, OBD_IOC_FID2PATH, gf, NULL, 0);
3906 memcpy(buf, gf->gf_u.gf_path, gf->gf_pathlen);
3907 if (buf[0] == '\0') { /* ROOT path */
3911 *recno = gf->gf_recno;
3912 *linkno = gf->gf_linkno;
3919 static int fid_from_lma(const char *path, const int fd, lustre_fid *fid)
3922 struct lustre_mdt_attrs *lma;
3926 rc = fgetxattr(fd, XATTR_NAME_LMA, buf, sizeof(buf));
3928 rc = lgetxattr(path, XATTR_NAME_LMA, buf, sizeof(buf));
3931 lma = (struct lustre_mdt_attrs *)buf;
3932 fid_le_to_cpu(fid, &lma->lma_self_fid);
3936 int llapi_get_mdt_index_by_fid(int fd, const lustre_fid *fid,
3941 rc = ioctl(fd, LL_IOC_FID2MDTIDX, fid);
3950 int llapi_fd2fid(const int fd, lustre_fid *fid)
3954 memset(fid, 0, sizeof(*fid));
3956 rc = ioctl(fd, LL_IOC_PATH2FID, fid) < 0 ? -errno : 0;
3957 if (rc == -EINVAL || rc == -ENOTTY)
3958 rc = fid_from_lma(NULL, fd, fid);
3963 int llapi_path2fid(const char *path, lustre_fid *fid)
3967 memset(fid, 0, sizeof(*fid));
3968 fd = open(path, O_RDONLY | O_NONBLOCK | O_NOFOLLOW);
3970 if (errno == ELOOP || errno == ENXIO)
3971 return fid_from_lma(path, -1, fid);
3975 rc = llapi_fd2fid(fd, fid);
3976 if (rc == -EINVAL || rc == -ENOTTY)
3977 rc = fid_from_lma(path, -1, fid);
3983 int llapi_fd2parent(int fd, unsigned int linkno, lustre_fid *parent_fid,
3984 char *name, size_t name_size)
3986 struct getparent *gp;
3989 gp = malloc(sizeof(*gp) + name_size);
3993 gp->gp_linkno = linkno;
3994 gp->gp_name_size = name_size;
3996 rc = ioctl(fd, LL_IOC_GETPARENT, gp);
4002 *parent_fid = gp->gp_fid;
4004 strncpy(name, gp->gp_name, name_size);
4005 name[name_size - 1] = '\0';
4012 int llapi_path2parent(const char *path, unsigned int linkno,
4013 lustre_fid *parent_fid, char *name, size_t name_size)
4018 fd = open(path, O_RDONLY | O_NONBLOCK | O_NOFOLLOW);
4022 rc = llapi_fd2parent(fd, linkno, parent_fid, name, name_size);
4027 int llapi_get_connect_flags(const char *mnt, __u64 *flags)
4032 root = open(mnt, O_RDONLY | O_DIRECTORY);
4035 llapi_error(LLAPI_MSG_ERROR, rc, "open %s failed", mnt);
4039 rc = ioctl(root, LL_IOC_GET_CONNECT_FLAGS, flags);
4042 llapi_error(LLAPI_MSG_ERROR, rc,
4043 "ioctl on %s for getting connect flags failed", mnt);
4050 * Get a 64-bit value representing the version of file data pointed by fd.
4052 * Each write or truncate, flushed on OST, will change this value. You can use
4053 * this value to verify if file data was modified. This only checks the file
4054 * data, not metadata.
4056 * \param flags 0: no flush pages, usually used it the process has already
4058 * LL_DV_RD_FLUSH: OSTs will take LCK_PR to flush dirty pages
4060 * LL_DV_WR_FLUSH: OSTs will take LCK_PW to flush all caching
4061 * pages from clients.
4063 * \retval 0 on success.
4064 * \retval -errno on error.
4066 int llapi_get_data_version(int fd, __u64 *data_version, __u64 flags)
4069 struct ioc_data_version idv;
4071 idv.idv_flags = flags;
4073 rc = ioctl(fd, LL_IOC_DATA_VERSION, &idv);
4077 *data_version = idv.idv_version;
4083 * Create a file without any name open it for read/write
4085 * - file is created as if it were a standard file in the given \a directory
4086 * - file does not appear in \a directory and mtime does not change because
4087 * the filename is handled specially by the Lustre MDS.
4088 * - file is removed at final close
4089 * - file modes are rw------- since it doesn't make sense to have a read-only
4090 * or write-only file that cannot be opened again.
4091 * - if user wants another mode it must use fchmod() on the open file, no
4092 * security problems arise because it cannot be opened by another process.
4094 * \param[in] directory directory from which to inherit layout/MDT idx
4095 * \param[in] idx MDT index on which the file is created,
4096 * \a idx == -1 means no specific MDT is requested
4097 * \param[in] open_flags standard open(2) flags
4099 * \retval 0 on success.
4100 * \retval -errno on error.
4102 int llapi_create_volatile_idx(char *directory, int idx, int open_flags)
4104 char file_path[PATH_MAX];
4105 char filename[PATH_MAX];
4106 int saved_errno = errno;
4114 snprintf(filename, sizeof(filename),
4115 LUSTRE_VOLATILE_HDR"::%.4X", rnumber);
4117 snprintf(filename, sizeof(filename),
4118 LUSTRE_VOLATILE_HDR":%.4X:%.4X", idx, rnumber);
4120 rc = snprintf(file_path, sizeof(file_path),
4121 "%s/%s", directory, filename);
4122 if (rc >= sizeof(file_path))
4125 fd = open(file_path,
4126 O_RDWR | O_CREAT | O_EXCL | O_NOFOLLOW | open_flags,
4128 } while (fd < 0 && errno == EEXIST);
4131 llapi_error(LLAPI_MSG_ERROR, errno,
4132 "Cannot create volatile file '%s' in '%s'",
4133 filename + LUSTRE_VOLATILE_HDR_LEN,
4138 /* Unlink file in case this wasn't a Lustre filesystem and the
4139 * magic volatile filename wasn't handled as intended. The
4140 * effect is the same. If volatile open was supported then we
4141 * expect unlink() to return -ENOENT. */
4142 (void)unlink(file_path);
4144 /* Since we are returning successfully we restore errno (and
4145 * mask out possible EEXIST from open() and ENOENT from
4147 errno = saved_errno;
4153 * Swap the layouts between 2 file descriptors
4154 * the 2 files must be open for writing
4155 * first fd received the ioctl, second fd is passed as arg
4156 * this is assymetric but avoid use of root path for ioctl
4158 int llapi_fswap_layouts_grouplock(int fd1, int fd2, __u64 dv1, __u64 dv2,
4159 int gid, __u64 flags)
4161 struct lustre_swap_layouts lsl;
4166 if (flags & (SWAP_LAYOUTS_KEEP_ATIME | SWAP_LAYOUTS_KEEP_MTIME)) {
4167 rc = fstat(fd1, &st1);
4171 rc = fstat(fd2, &st2);
4176 lsl.sl_flags = flags;
4180 rc = ioctl(fd1, LL_IOC_LOV_SWAP_LAYOUTS, &lsl);
4184 if (flags & (SWAP_LAYOUTS_KEEP_ATIME | SWAP_LAYOUTS_KEEP_MTIME)) {
4185 struct timeval tv1[2];
4186 struct timeval tv2[2];
4188 memset(tv1, 0, sizeof(tv1));
4189 memset(tv2, 0, sizeof(tv2));
4191 if (flags & SWAP_LAYOUTS_KEEP_ATIME) {
4192 tv1[0].tv_sec = st1.st_atime;
4193 tv2[0].tv_sec = st2.st_atime;
4195 tv1[0].tv_sec = st2.st_atime;
4196 tv2[0].tv_sec = st1.st_atime;
4199 if (flags & SWAP_LAYOUTS_KEEP_MTIME) {
4200 tv1[1].tv_sec = st1.st_mtime;
4201 tv2[1].tv_sec = st2.st_mtime;
4203 tv1[1].tv_sec = st2.st_mtime;
4204 tv2[1].tv_sec = st1.st_mtime;
4207 rc = futimes(fd1, tv1);
4211 rc = futimes(fd2, tv2);
4219 int llapi_fswap_layouts(int fd1, int fd2, __u64 dv1, __u64 dv2, __u64 flags)
4226 while (grp_id == 0);
4228 rc = llapi_fswap_layouts_grouplock(fd1, fd2, dv1, dv2, grp_id, flags);
4236 * Swap the layouts between 2 files
4237 * the 2 files are open in write
4239 int llapi_swap_layouts(const char *path1, const char *path2,
4240 __u64 dv1, __u64 dv2, __u64 flags)
4244 fd1 = open(path1, O_WRONLY | O_LOV_DELAY_CREATE);
4247 llapi_error(LLAPI_MSG_ERROR, rc,
4248 "error: cannot open '%s' for write", path1);
4252 fd2 = open(path2, O_WRONLY | O_LOV_DELAY_CREATE);
4255 llapi_error(LLAPI_MSG_ERROR, rc,
4256 "error: cannot open '%s' for write", path2);
4260 rc = llapi_fswap_layouts(fd1, fd2, dv1, dv2, flags);
4262 llapi_error(LLAPI_MSG_ERROR, rc,
4263 "error: cannot swap layout between '%s' and '%s'",
4274 * Attempt to open a file with Lustre file identifier \a fid
4275 * and return an open file descriptor.
4277 * \param[in] lustre_dir path within Lustre filesystem containing \a fid
4278 * \param[in] fid Lustre file identifier of file to open
4279 * \param[in] flags open() flags
4281 * \retval non-negative file descriptor on successful open
4282 * \retval -1 if an error occurred
4284 int llapi_open_by_fid(const char *lustre_dir, const lustre_fid *fid, int flags)
4286 char mntdir[PATH_MAX];
4287 char path[PATH_MAX];
4290 rc = llapi_search_mounts(lustre_dir, 0, mntdir, NULL);
4294 snprintf(path, sizeof(path), "%s/.lustre/fid/"DFID, mntdir, PFID(fid));
4295 return open(path, flags);
4301 * \param fd File to lock.
4302 * \param gid Group Identifier.
4304 * \retval 0 on success.
4305 * \retval -errno on failure.
4307 int llapi_group_lock(int fd, int gid)
4311 rc = ioctl(fd, LL_IOC_GROUP_LOCK, gid);
4314 llapi_error(LLAPI_MSG_ERROR, rc, "cannot get group lock");
4322 * \param fd File to unlock.
4323 * \param gid Group Identifier.
4325 * \retval 0 on success.
4326 * \retval -errno on failure.
4328 int llapi_group_unlock(int fd, int gid)
4332 rc = ioctl(fd, LL_IOC_GROUP_UNLOCK, gid);
4335 llapi_error(LLAPI_MSG_ERROR, rc, "cannot put group lock");