X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Futils%2Flfs.c;h=86900f7de553a6edebb03b563575fc424838f29e;hp=00ac0b1af12dcaa8550e7a12a77b87882035a064;hb=83f299175e79c37beaa5cc3580dcf52eb9a3385e;hpb=6744eb8eeb9e0a7a745a9a42e5fe09b376e16a82 diff --git a/lustre/utils/lfs.c b/lustre/utils/lfs.c index 00ac0b1..86900f7 100644 --- a/lustre/utils/lfs.c +++ b/lustre/utils/lfs.c @@ -23,7 +23,7 @@ * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved. * Use is subject to license terms. * - * Copyright (c) 2011, 2016, Intel Corporation. + * Copyright (c) 2011, 2017, Intel Corporation. */ /* * This file is part of Lustre, http://www.lustre.org/ @@ -43,6 +43,7 @@ #include #include +#include #include #include #include @@ -56,10 +57,14 @@ #include #include #include +#include #include #include #include #include +#include +#include +#include "lfs_project.h" #include #include @@ -67,13 +72,14 @@ #include #include #include +#include +#include #ifndef ARRAY_SIZE # define ARRAY_SIZE(a) ((sizeof(a)) / (sizeof((a)[0]))) #endif /* !ARRAY_SIZE */ /* all functions */ -static int lfs_setstripe(int argc, char **argv); static int lfs_find(int argc, char **argv); static int lfs_getstripe(int argc, char **argv); static int lfs_getdirstripe(int argc, char **argv); @@ -87,6 +93,7 @@ static int lfs_check(int argc, char **argv); #ifdef HAVE_SYS_QUOTA_H static int lfs_setquota(int argc, char **argv); static int lfs_quota(int argc, char **argv); +static int lfs_project(int argc, char **argv); #endif static int lfs_flushctx(int argc, char **argv); static int lfs_cp(int argc, char **argv); @@ -109,52 +116,127 @@ static int lfs_hsm_cancel(int argc, char **argv); static int lfs_swap_layouts(int argc, char **argv); static int lfs_mv(int argc, char **argv); static int lfs_ladvise(int argc, char **argv); +static int lfs_mirror(int argc, char **argv); +static int lfs_mirror_list_commands(int argc, char **argv); static int lfs_list_commands(int argc, char **argv); +static inline int lfs_mirror_resync(int argc, char **argv); +static inline int lfs_mirror_verify(int argc, char **argv); + +enum setstripe_origin { + SO_SETSTRIPE, + SO_MIGRATE, + SO_MIRROR_CREATE, + SO_MIRROR_EXTEND, + SO_MIRROR_SPLIT, +}; +static int lfs_setstripe_internal(int argc, char **argv, + enum setstripe_origin opc); + +static inline int lfs_setstripe(int argc, char **argv) +{ + return lfs_setstripe_internal(argc, argv, SO_SETSTRIPE); +} +static inline int lfs_setstripe_migrate(int argc, char **argv) +{ + return lfs_setstripe_internal(argc, argv, SO_MIGRATE); +} +static inline int lfs_mirror_create(int argc, char **argv) +{ + return lfs_setstripe_internal(argc, argv, SO_MIRROR_CREATE); +} +static inline int lfs_mirror_extend(int argc, char **argv) +{ + return lfs_setstripe_internal(argc, argv, SO_MIRROR_EXTEND); +} +static inline int lfs_mirror_split(int argc, char **argv) +{ + return lfs_setstripe_internal(argc, argv, SO_MIRROR_SPLIT); +} /* Setstripe and migrate share mostly the same parameters */ #define SSM_CMD_COMMON(cmd) \ - "usage: "cmd" [--stripe-count|-c ]\n" \ + "usage: "cmd" [--component-end|-E ]\n" \ + " [--stripe-count|-c ]\n" \ " [--stripe-index|-i ]\n" \ " [--stripe-size|-S ]\n" \ - " [--layout|-L ]\n" \ + " [--layout|-L ]\n" \ " [--pool|-p ]\n" \ " [--ost|-o ]\n" \ - " [--component-end|-E ]\n" + " [--yaml|-y ]\n" \ + " [--copy=]\n" #define SSM_HELP_COMMON \ - "\tstripe_size: Number of bytes on each OST (0 filesystem default)\n" \ - "\t Can be specified with k, m or g (in KB, MB and GB\n" \ + "\tstripe_count: Number of OSTs to stripe over (0=fs default, -1 all)\n" \ + "\tstart_ost_idx: OST index of first stripe (-1=default round robin)\n"\ + "\tstripe_size: Number of bytes on each OST (0=fs default)\n" \ + "\t Can be specified with K, M or G (for KB, MB, GB\n" \ "\t respectively)\n" \ - "\tstart_ost_idx: OST index of first stripe (-1 default)\n" \ - "\tstripe_count: Number of OSTs to stripe over (0 default, -1 all)\n" \ - "\tlayout: stripe pattern type: raid0, mdt (default raid0)\n"\ "\tpool_name: Name of OST pool to use (default none)\n" \ + "\tlayout: stripe pattern type: raid0, mdt (default raid0)\n"\ "\tost_indices: List of OST indices, can be repeated multiple times\n"\ "\t Indices be specified in a format of:\n" \ "\t -o ,-,\n" \ "\t Or:\n" \ "\t -o -o - -o \n" \ "\t If --pool is set with --ost, then the OSTs\n" \ - "\t must be the members of the pool." \ - "\tcomp_end: Extent end of the component\n" \ - "\t Can be specified with k, m or g (in KB, MB and GB\n" \ - "\t respectively, -1 for EOF), it must be aligned with\n"\ - "\t the stripe_size\n" - -#define SETSTRIPE_USAGE \ - SSM_CMD_COMMON("setstripe") \ - " \n" \ - SSM_HELP_COMMON \ + "\t must be the members of the pool.\n" \ + "\tcomp_end: Extent end of component, start after previous end.\n"\ + "\t Can be specified with K, M or G (for KB, MB, GB\n" \ + "\t respectively, -1 for EOF). Must be a multiple of\n"\ + "\t stripe_size.\n" \ + "\tyaml_template_file:\n" \ + "\t YAML layout template file, can't be used with -c,\n" \ + "\t -i, -S, -p, -o, or -E arguments.\n" \ + "\tlustre_src: Lustre file/dir whose layout info is used to set\n" \ + "\t another lustre file or directory, can't used with\n" \ + "\t -c, -i, -S, -p, -o, or -E arguments.\n" + +#define MIRROR_CREATE_HELP \ + "\tmirror_count: Number of mirrors to be created with the upcoming\n" \ + "\t setstripe layout options\n" \ + "\t It defaults to 1 if not specified; if specified,\n" \ + "\t it must follow the option without a space.\n" \ + "\t The option can also be repeated multiple times to\n" \ + "\t separate mirrors that have different layouts.\n" \ + "\tsetstripe options: Mirror layout\n" \ + "\t It can be a plain layout or a composite layout.\n" \ + "\t If not specified, the stripe options inherited\n" \ + "\t from the previous component will be used.\n" \ + "\tflags: set flags to the component of the current mirror.\n" \ + "\t Only \"prefer\" flag is supported so far.\n" + +#define MIRROR_EXTEND_HELP \ + MIRROR_CREATE_HELP \ + "\tvictim_file: The layout of victim_file will be split and used\n" \ + "\t as a mirror added to the mirrored file.\n" \ + "\tno-verify: This option indicates not to verify the mirror(s)\n" \ + "\t from victim file(s) in case the victim file(s)\n" \ + "\t contains the same data as the original mirrored\n" \ + "\t file.\n" + +#define MIRROR_EXTEND_USAGE \ + " <--mirror-count|-N[mirror_count]>\n" \ + " [setstripe options|-f ]\n" \ + " [--no-verify]\n" + +#define SETSTRIPE_USAGE \ + SSM_CMD_COMMON("setstripe") \ + MIRROR_EXTEND_USAGE \ + " \n" \ + SSM_HELP_COMMON \ + MIRROR_EXTEND_HELP #define MIGRATE_USAGE \ SSM_CMD_COMMON("migrate ") \ " [--block|-b]\n" \ " [--non-block|-n]\n" \ + " [--non-direct|-D]\n" \ " \n" \ SSM_HELP_COMMON \ "\n" \ "\tblock: Block file access during data migration (default)\n" \ "\tnon-block: Abort migrations if concurrent access is detected\n" \ + "\tnon-direct: Do not use direct I/O to copy file contents\n" \ #define SETDIRSTRIPE_USAGE \ " [--mdt-count|-c stripe_count>\n" \ @@ -169,42 +251,83 @@ static int lfs_list_commands(int argc, char **argv); "\tdefault_stripe: set default dirstripe of the directory\n" \ "\tmode: the mode of the directory\n" -static const char *progname; -static bool file_lease_supported = true; +/** + * command_t mirror_cmdlist - lfs mirror commands. + */ +command_t mirror_cmdlist[] = { + { .pc_name = "create", .pc_func = lfs_mirror_create, + .pc_help = "Create a mirrored file.\n" + "usage: lfs mirror create " + "<--mirror-count|-N[mirror_count]> " + "[setstripe options] ... \n" + MIRROR_CREATE_HELP }, + { .pc_name = "extend", .pc_func = lfs_mirror_extend, + .pc_help = "Extend a mirrored file.\n" + "usage: lfs mirror extend " + "<--mirror-count|-N[mirror_count]> [--no-verify] " + "[setstripe options|-f ] ... \n" + MIRROR_EXTEND_HELP }, + { .pc_name = "split", .pc_func = lfs_mirror_split, + .pc_help = "Split a mirrored file.\n" + "usage: lfs mirror split <--mirror-id > [--destroy|-d] " + "[-f ] \n" + "\tmirror_id: The numerical unique identifier for a mirror. It\n" + "\t can be fetched by lfs getstripe command.\n" + "\tnew_file: This option indicates the layout of the split\n" + "\t mirror will be stored into. If not specified,\n" + "\t a new file named .mirror~\n" + "\t will be used.\n" }, + { .pc_name = "resync", .pc_func = lfs_mirror_resync, + .pc_help = "Resynchronizes out-of-sync mirrored file(s).\n" + "usage: lfs mirror resync [--only ] " + " [...]\n"}, + { .pc_name = "verify", .pc_func = lfs_mirror_verify, + .pc_help = "Verify mirrored file(s).\n" + "usage: lfs mirror verify " + "[--only ] " + "[--verbose|-v] [ ...]\n"}, + { .pc_name = "--list-commands", .pc_func = lfs_mirror_list_commands, + .pc_help = "list commands supported by lfs mirror"}, + { .pc_name = "help", .pc_func = Parser_help, .pc_help = "help" }, + { .pc_name = "exit", .pc_func = Parser_quit, .pc_help = "quit" }, + { .pc_name = "quit", .pc_func = Parser_quit, .pc_help = "quit" }, + { .pc_help = NULL } +}; /* all available commands */ command_t cmdlist[] = { {"setstripe", lfs_setstripe, 0, - "Create a new file with a specific striping pattern or\n" - "set the default striping pattern on an existing directory or\n" - "delete the default striping pattern from an existing directory or\n" - "add layout component(s) to an existing composite file or\n" - "delete specified component(s) from an existing composite file\n\n" - "To delete default striping from an existing directory:\n" + "To create a file with specified striping/composite layout, or\n" + "create/replace the default layout on an existing directory:\n" + SSM_CMD_COMMON("setstripe") + " \n" + " or\n" + "To add component(s) to an existing composite file:\n" + SSM_CMD_COMMON("setstripe --component-add") + SSM_HELP_COMMON + "To totally delete the default striping from an existing directory:\n" "usage: setstripe -d \n" " or\n" - "To delete component(s) from an existing composite file:\n" + "To create a mirrored file or set s default mirror layout on a directory:\n" + "usage: setstripe -N[mirror_count] [STRIPE_OPTIONS] \n" + " or\n" + "To delete the last component(s) from an existing composite file\n" + "(note that this will also delete any data in those components):\n" "usage: setstripe --component-del [--component-id|-I ]\n" " [--component-flags|-F ]\n" " \n" - "\tcomp_id: Unique component ID\n" + "\tcomp_id: Unique component ID to delete\n" "\tcomp_flags: 'init' indicating all instantiated components\n" - "\t '^init' indicating all uninstantiated components\n" - "\t-I and -F can't be specified at the same time\n" - " or\n" - "To add component(s) to an existing composite file:\n" - SSM_CMD_COMMON("setstripe --component-add") - " or\n" - "To create a file with specified striping/composite layout:\n" - SETSTRIPE_USAGE}, + "\t '^init' indicating all uninstantiated components\n" + "\t-I and -F cannot be specified at the same time\n"}, {"getstripe", lfs_getstripe, 0, - "To list the striping info for a given file or files in a\n" + "To list the layout pattern for a given file or files in a\n" "directory or recursively for all files in a directory tree.\n" "usage: getstripe [--ost|-O ] [--quiet|-q] [--verbose|-v]\n" - " [--stripe-count|-c] [--stripe-index|-i]\n" + " [--stripe-count|-c] [--stripe-index|-i] [--fid|-F]\n" " [--pool|-p] [--stripe-size|-S] [--directory|-d]\n" - " [--mdt|-m] [--recursive|-r] [--raw|-R] [--yaml|-y]\n" - " [--layout|-L] [--fid|-F] [--generation|-g]\n" + " [--mdt-index|-m] [--recursive|-r] [--raw|-R]\n" + " [--layout|-L] [--generation|-g] [--yaml|-y]\n" " [--component-id[=comp_id]|-I[comp_id]]\n" " [--component-flags[=comp_flags]]\n" " [--component-count]\n" @@ -217,10 +340,10 @@ command_t cmdlist[] = { "usage: setdirstripe [OPTION] \n" SETDIRSTRIPE_USAGE}, {"getdirstripe", lfs_getdirstripe, 0, - "To list the striping info for a given directory\n" + "To list the layout pattern info for a given directory\n" "or recursively for all directories in a directory tree.\n" - "usage: getdirstripe [--obd|-O ] [--mdt-count|-c]\n" - " [--mdt-index|-i] [--mdt-hash|-t]\n" + "usage: getdirstripe [--mdt-count|-c] [--mdt-index|-m|-i]\n" + " [--mdt-hash|-H] [--obd|-O ]\n" " [--recursive|-r] [--yaml|-y]\n" " [--default|-D] ..."}, {"mkdir", lfs_setdirstripe, 0, @@ -234,34 +357,36 @@ command_t cmdlist[] = { "will become inaccessable after this command. This can only be done\n" "by the administrator\n" "usage: rm_entry \n"}, - {"pool_list", lfs_poollist, 0, - "List pools or pool OSTs\n" - "usage: pool_list [.] | \n"}, - {"find", lfs_find, 0, - "find files matching given attributes recursively in directory tree.\n" - "usage: find ...\n" - " [[!] --atime|-A [+-]N] [[!] --ctime|-C [+-]N]\n" - " [[!] --mtime|-M [+-]N] [[!] --mdt|-m ]\n" - " [--maxdepth|-D N] [[!] --name|-n ]\n" - " [[!] --ost|-O ] [--print|-p] [--print0|-P]\n" - " [[!] --size|-s [+-]N[bkMGTPE]]\n" - " [[!] --stripe-count|-c [+-]]\n" - " [[!] --stripe-index|-i ]\n" - " [[!] --stripe-size|-S [+-]N[kMGT]] [[!] --type|-t ]\n" - " [[!] --gid|-g|--group|-G |]\n" - " [[!] --uid|-u|--user|-U |] [[!] --pool ]\n" + {"pool_list", lfs_poollist, 0, + "List pools or pool OSTs\n" + "usage: pool_list [.] | \n"}, + {"find", lfs_find, 0, + "find files matching given attributes recursively in directory tree.\n" + "usage: find ...\n" + " [[!] --atime|-A [+-]N] [[!] --ctime|-C [+-]N]\n" + " [[!] --mtime|-M [+-]N] [--maxdepth|-D N] [[!] --blocks|-b N]\n" + " [[!] --mdt-index|--mdt|-m ]\n" + " [[!] --name|-n ] [[!] --ost|-O ]\n" + " [--print|-P] [--print0|-0] [[!] --size|-s [+-]N[bkMGTPE]]\n" + " [[!] --stripe-count|-c [+-]]\n" + " [[!] --stripe-index|-i ]\n" + " [[!] --stripe-size|-S [+-]N[kMGT]] [[!] --type|-t ]\n" + " [[!] --gid|-g|--group|-G |]\n" + " [[!] --uid|-u|--user|-U |] [[!] --pool ]\n" " [[!] --projid ]\n" " [[!] --layout|-L released,raid0,mdt]\n" " [[!] --component-count [+-]]\n" " [[!] --component-start [+-]N[kMGTPE]]\n" " [[!] --component-end|-E [+-]N[kMGTPE]]\n" " [[!] --component-flags ]\n" + " [[!] --mirror-count|-N [+-]]\n" + " [[!] --mirror-state <[^]state>]\n" " [[!] --mdt-count|-T [+-]]\n" " [[!] --mdt-hash|-H \n" "\t !: used before an option indicates 'NOT' requested attribute\n" "\t -: used before a value indicates less than requested value\n" "\t +: used before a value indicates more than requested value\n" - "\tmdt-hash: hash type of the striped directory.\n" + "\thashtype: hash type of the striped directory.\n" "\t fnv_1a_64 FNV-1a hash algorithm\n" "\t all_char sum of characters % MDT_COUNT\n"}, {"check", lfs_check, 0, @@ -292,13 +417,25 @@ command_t cmdlist[] = { " setquota [-t] <-u|--user|-g|--group|-p|--projid>\n" " [--block-grace ]\n" " [--inode-grace ] \n" + " setquota <-U|-G|-P>\n" + " -b -B \n" + " -i -I \n" + " setquota <-U|--default-usr|-G|--default-grp|-P|--default-prj>\n" + " [--block-softlimit ]\n" + " [--block-hardlimit ]\n" + " [--inode-softlimit ]\n" + " [--inode-hardlimit ] \n" + " setquota <-u|-g|-p> ||||\n" + " <-d|--default>\n" " -b can be used instead of --block-softlimit/--block-grace\n" " -B can be used instead of --block-hardlimit\n" " -i can be used instead of --inode-softlimit/--inode-grace\n" - " -I can be used instead of --inode-hardlimit\n\n" + " -I can be used instead of --inode-hardlimit\n" + " -d can be used instead of --default\n\n" "Note: The total quota space will be split into many qunits and\n" " balanced over all server targets, the minimal qunit size is\n" " 1M bytes for block space and 1K inodes for inode space.\n\n" + " The maximum quota grace time is 2^48 - 1 seconds.\n\n" " Quota space rebalancing process will stop when this mininum\n" " value is reached. As a result, quota exceeded can be returned\n" " while many targets still have 1MB or 1K inodes of spare\n" @@ -307,7 +444,19 @@ command_t cmdlist[] = { "usage: quota [-q] [-v] [-h] [-o |-i |-I " "]\n" " [<-u|-g|-p> ||||] \n" - " quota [-o |-i |-I ] -t <-u|-g|-p> "}, + " quota [-o |-i |-I ] -t <-u|-g|-p> \n" + " quota [-q] [-v] [h] <-U|-G|-P> "}, + {"project", lfs_project, 0, + "Change or list project attribute for specified file or directory.\n" + "usage: project [-d|-r] \n" + " list project ID and flags on file(s) or directories\n" + " project [-p id] [-s] [-r] \n" + " set project ID and/or inherit flag for specified file(s) or directories\n" + " project -c [-d|-r [-p id] [-0]] \n" + " check project ID and flags on file(s) or directories, print outliers\n" + " project -C [-r] [-k] \n" + " clear the project inherit flag and ID on the file or directory\n" + }, #endif {"flushctx", lfs_flushctx, 0, "Flush security context for current user.\n" "usage: flushctx [-k] [mountpoint...]"}, @@ -339,7 +488,7 @@ command_t cmdlist[] = { "undergoing actions) for given files.\n usage: hsm_state ..."}, {"hsm_set", lfs_hsm_set, 0, "Set HSM user flag on specified files.\n" "usage: hsm_set [--norelease] [--noarchive] [--dirty] [--exists] " - "[--archived] [--lost] ..."}, + "[--archived] [--lost] [--archive-id NUM] ..."}, {"hsm_clear", lfs_hsm_clear, 0, "Clear HSM user flag on specified " "files.\n" "usage: hsm_clear [--norelease] [--noarchive] [--dirty] [--exists] " @@ -358,19 +507,21 @@ command_t cmdlist[] = { "usage: hsm_release [--filelist FILELIST] [--data DATA] ..."}, {"hsm_remove", lfs_hsm_remove, 0, "Remove file copy from external storage.\n" - "usage: hsm_remove [--filelist FILELIST] [--data DATA]\n" - " [--mntpath MOUNTPATH] [--archive NUM] ...\n" + "usage: hsm_remove [--filelist FILELIST] [--data DATA] " + "[--archive NUM]\n" + " (FILE [FILE ...] | " + "--mntpath MOUNTPATH FID [FID ...])\n" "\n" - "Note: To remove files from the archive that have been deleted on\n" - "Lustre, set mntpath and optionally archive. In that case, all the\n" - "positional arguments and entries in the file list must be FIDs." + "Note: To remove an archived copy of a file already deleted from a " + "Lustre FS, the\n" + "--mntpath option and a list of FIDs must be specified" }, {"hsm_cancel", lfs_hsm_cancel, 0, "Cancel requests related to specified files.\n" "usage: hsm_cancel [--filelist FILELIST] [--data DATA] ..."}, {"swap_layouts", lfs_swap_layouts, 0, "Swap layouts between 2 files.\n" "usage: swap_layouts "}, - {"migrate", lfs_setstripe, 0, + {"migrate", lfs_setstripe_migrate, 0, "migrate a directory between MDTs.\n" "usage: migrate --mdt-index [--verbose|-v] " "\n" @@ -383,9 +534,10 @@ command_t cmdlist[] = { " [--stripe-index|-i] \n" " [--stripe-size|-S] \n" " [--pool|-p] \n" - " [--ost-list|-o] \n" + " [--ost|-o] \n" " [--block|-b]\n" " [--non-block|-n]\n" + " [--non-direct|-D]\n" " \n" "\tstripe_count: number of OSTs to stripe a file over\n" "\tstripe_ost_index: index of the first OST to stripe a file over\n" @@ -393,11 +545,12 @@ command_t cmdlist[] = { "\tpool_name: name of the predefined pool of OSTs\n" "\tost_indices: OSTs to stripe over, in order\n" "\tblock: wait for the operation to return before continuing\n" - "\tnon-block: do not wait for the operation to return.\n"}, + "\tnon-block: do not wait for the operation to return\n" + "\tnon-direct: do not use direct I/O to copy file contents.\n"}, {"mv", lfs_mv, 0, "To move directories between MDTs. This command is deprecated, " "use \"migrate\" instead.\n" - "usage: mv [--mdt-index|-M] " + "usage: mv [--mdt-index|-m] " "[--verbose|-v]\n"}, {"ladvise", lfs_ladvise, 0, "Provide servers with advice about access patterns for a file.\n" @@ -406,6 +559,13 @@ command_t cmdlist[] = { " {[--end|-e END[kMGT]] | [--length|-l LENGTH[kMGT]]}\n" " {[--mode|-m [READ,WRITE]}\n" " ...\n"}, + {"mirror", lfs_mirror, mirror_cmdlist, + "lfs commands used to manage files with mirrored components:\n" + "lfs mirror create - create a mirrored file or directory\n" + "lfs mirror extend - add mirror(s) to an existing file\n" + "lfs mirror split - split a mirror from an existing mirrored file\n" + "lfs mirror resync - resynchronize out-of-sync mirrored file(s)\n" + "lfs mirror verify - verify mirrored file(s)\n"}, {"help", Parser_help, 0, "help"}, {"exit", Parser_quit, 0, "quit"}, {"quit", Parser_quit, 0, "quit"}, @@ -417,8 +577,6 @@ command_t cmdlist[] = { }; -#define MIGRATION_NONBLOCK 1 - static int check_hashtype(const char *hashtype) { int i; @@ -430,47 +588,154 @@ static int check_hashtype(const char *hashtype) return 0; } -/** - * Internal helper for migrate_copy_data(). Check lease and report error if - * need be. - * - * \param[in] fd File descriptor on which to check the lease. - * \param[out] lease_broken Set to true if the lease was broken. - * \param[in] group_locked Whether a group lock was taken or not. - * \param[in] path Name of the file being processed, for error - * reporting - * - * \retval 0 Migration can keep on going. - * \retval -errno Error occurred, abort migration. - */ -static int check_lease(int fd, bool *lease_broken, bool group_locked, - const char *path) + +static const char *error_loc = "syserror"; + +enum { + MIGRATION_NONBLOCK = 1 << 0, + MIGRATION_MIRROR = 1 << 1, + MIGRATION_NONDIRECT = 1 << 2, +}; + +static int lfs_component_create(char *fname, int open_flags, mode_t open_mode, + struct llapi_layout *layout); + +static int +migrate_open_files(const char *name, __u64 migration_flags, + const struct llapi_stripe_param *param, + struct llapi_layout *layout, int *fd_src, int *fd_tgt) { - int rc; + int fd = -1; + int fdv = -1; + int rflags; + int mdt_index; + int random_value; + char parent[PATH_MAX]; + char volatile_file[PATH_MAX]; + char *ptr; + int rc; + struct stat st; + struct stat stv; - if (!file_lease_supported) - return 0; + if (param == NULL && layout == NULL) { + error_loc = "layout information"; + return -EINVAL; + } - rc = llapi_lease_check(fd); - if (rc > 0) - return 0; /* llapi_check_lease returns > 0 on success. */ + /* search for file directory pathname */ + if (strlen(name) > sizeof(parent) - 1) { + error_loc = "source file name"; + return -ERANGE; + } - if (!group_locked) { - fprintf(stderr, "%s: cannot migrate '%s': file busy\n", - progname, path); - rc = rc ? rc : -EAGAIN; + strncpy(parent, name, sizeof(parent)); + ptr = strrchr(parent, '/'); + if (ptr == NULL) { + if (getcwd(parent, sizeof(parent)) == NULL) { + error_loc = "getcwd"; + return -errno; + } } else { - fprintf(stderr, "%s: external attempt to access file '%s' " - "blocked until migration ends.\n", progname, path); - rc = 0; + if (ptr == parent) /* leading '/' */ + ptr = parent + 1; + *ptr = '\0'; + } + + /* open file, direct io */ + /* even if the file is only read, WR mode is nedeed to allow + * layout swap on fd */ + rflags = O_RDWR; + if (!(migration_flags & MIGRATION_NONDIRECT)) + rflags |= O_DIRECT; + fd = open(name, rflags); + if (fd < 0) { + rc = -errno; + error_loc = "cannot open source file"; + return rc; + } + + rc = llapi_file_fget_mdtidx(fd, &mdt_index); + if (rc < 0) { + error_loc = "cannot get MDT index"; + goto out; + } + + do { + int open_flags = O_WRONLY | O_CREAT | O_EXCL | O_NOFOLLOW; + mode_t open_mode = S_IRUSR | S_IWUSR; + + random_value = random(); + rc = snprintf(volatile_file, sizeof(volatile_file), + "%s/%s:%.4X:%.4X", parent, LUSTRE_VOLATILE_HDR, + mdt_index, random_value); + if (rc >= sizeof(volatile_file)) { + rc = -ENAMETOOLONG; + break; + } + + /* create, open a volatile file, use caching (ie no directio) */ + if (param != NULL) + fdv = llapi_file_open_param(volatile_file, open_flags, + open_mode, param); + else + fdv = lfs_component_create(volatile_file, open_flags, + open_mode, layout); + } while (fdv < 0 && (rc = fdv) == -EEXIST); + + if (rc < 0) { + error_loc = "cannot create volatile file"; + goto out; + } + + /* In case the MDT does not support creation of volatile files + * we should try to unlink it. */ + (void)unlink(volatile_file); + + /* Not-owner (root?) special case. + * Need to set owner/group of volatile file like original. + * This will allow to pass related check during layout_swap. + */ + rc = fstat(fd, &st); + if (rc != 0) { + rc = -errno; + error_loc = "cannot stat source file"; + goto out; + } + + rc = fstat(fdv, &stv); + if (rc != 0) { + rc = -errno; + error_loc = "cannot stat volatile"; + goto out; + } + + if (st.st_uid != stv.st_uid || st.st_gid != stv.st_gid) { + rc = fchown(fdv, st.st_uid, st.st_gid); + if (rc != 0) { + rc = -errno; + error_loc = "cannot change ownwership of volatile"; + goto out; + } + } + +out: + if (rc < 0) { + if (fd > 0) + close(fd); + if (fdv > 0) + close(fdv); + } else { + *fd_src = fd; + *fd_tgt = fdv; + error_loc = NULL; } - *lease_broken = true; return rc; } -static int migrate_copy_data(int fd_src, int fd_dst, size_t buf_size, - bool group_locked, const char *fname) +static int migrate_copy_data(int fd_src, int fd_dst, int (*check_file)(int)) { + struct llapi_layout *layout; + size_t buf_size = 4 * 1024 * 1024; void *buf = NULL; ssize_t rsize = -1; ssize_t wsize = 0; @@ -478,7 +743,17 @@ static int migrate_copy_data(int fd_src, int fd_dst, size_t buf_size, size_t wpos = 0; off_t bufoff = 0; int rc; - bool lease_broken = false; + + layout = llapi_layout_get_by_fd(fd_src, 0); + if (layout != NULL) { + uint64_t stripe_size; + + rc = llapi_layout_stripe_size_get(layout, &stripe_size); + if (rc == 0) + buf_size = stripe_size; + + llapi_layout_free(layout); + } /* Use a page-aligned buffer for direct I/O */ rc = posix_memalign(&buf, getpagesize(), buf_size); @@ -489,18 +764,16 @@ static int migrate_copy_data(int fd_src, int fd_dst, size_t buf_size, /* read new data only if we have written all * previously read data */ if (wpos == rpos) { - if (!lease_broken) { - rc = check_lease(fd_src, &lease_broken, - group_locked, fname); + if (check_file) { + rc = check_file(fd_src); if (rc < 0) - goto out; + break; } + rsize = read(fd_src, buf, buf_size); if (rsize < 0) { rc = -errno; - fprintf(stderr, "%s: %s: read failed: %s\n", - progname, fname, strerror(-rc)); - goto out; + break; } rpos += rsize; bufoff = 0; @@ -512,39 +785,39 @@ static int migrate_copy_data(int fd_src, int fd_dst, size_t buf_size, wsize = write(fd_dst, buf + bufoff, rpos - wpos); if (wsize < 0) { rc = -errno; - fprintf(stderr, - "%s: %s: write failed on volatile: %s\n", - progname, fname, strerror(-rc)); - goto out; + break; } wpos += wsize; bufoff += wsize; } - rc = fsync(fd_dst); - if (rc < 0) { - rc = -errno; - fprintf(stderr, "%s: %s: fsync failed: %s\n", - progname, fname, strerror(-rc)); + if (rc == 0) { + rc = fsync(fd_dst); + if (rc < 0) + rc = -errno; } -out: free(buf); return rc; } -static int migrate_copy_timestamps(int fdv, const struct stat *st) +static int migrate_copy_timestamps(int fd, int fdv) { - struct timeval tv[2] = { - {.tv_sec = st->st_atime}, - {.tv_sec = st->st_mtime} - }; + struct stat st; + + if (fstat(fd, &st) == 0) { + struct timeval tv[2] = { + {.tv_sec = st.st_atime}, + {.tv_sec = st.st_mtime} + }; + + return futimes(fdv, tv); + } - return futimes(fdv, tv); + return -errno; } -static int migrate_block(int fd, int fdv, const struct stat *st, - size_t buf_size, const char *name) +static int migrate_block(int fd, int fdv) { __u64 dv1; int gid; @@ -553,8 +826,7 @@ static int migrate_block(int fd, int fdv, const struct stat *st, rc = llapi_get_data_version(fd, &dv1, LL_DV_RD_FLUSH); if (rc < 0) { - fprintf(stderr, "%s: %s: cannot get dataversion: %s\n", - progname, name, strerror(-rc)); + error_loc = "cannot get dataversion"; return rc; } @@ -567,22 +839,20 @@ static int migrate_block(int fd, int fdv, const struct stat *st, * block it too. */ rc = llapi_group_lock(fd, gid); if (rc < 0) { - fprintf(stderr, "%s: %s: cannot get group lock: %s\n", - progname, name, strerror(-rc)); + error_loc = "cannot get group lock"; return rc; } - rc = migrate_copy_data(fd, fdv, buf_size, true, name); + rc = migrate_copy_data(fd, fdv, NULL); if (rc < 0) { - fprintf(stderr, "%s: %s: data copy failed\n", progname, name); + error_loc = "data copy failed"; goto out_unlock; } /* Make sure we keep original atime/mtime values */ - rc = migrate_copy_timestamps(fdv, st); + rc = migrate_copy_timestamps(fd, fdv); if (rc < 0) { - fprintf(stderr, "%s: %s: timestamp copy failed\n", - progname, name); + error_loc = "timestamp copy failed"; goto out_unlock; } @@ -594,28 +864,44 @@ static int migrate_block(int fd, int fdv, const struct stat *st, rc = llapi_fswap_layouts_grouplock(fd, fdv, dv1, 0, 0, SWAP_LAYOUTS_CHECK_DV1); if (rc == -EAGAIN) { - fprintf(stderr, "%s: %s: dataversion changed during copy, " - "migration aborted\n", progname, name); + error_loc = "file changed"; goto out_unlock; } else if (rc < 0) { - fprintf(stderr, "%s: %s: cannot swap layouts: %s\n", progname, - name, strerror(-rc)); + error_loc = "cannot swap layout"; goto out_unlock; } out_unlock: rc2 = llapi_group_unlock(fd, gid); if (rc2 < 0 && rc == 0) { - fprintf(stderr, "%s: %s: putting group lock failed: %s\n", - progname, name, strerror(-rc2)); + error_loc = "unlock group lock"; rc = rc2; } return rc; } -static int migrate_nonblock(int fd, int fdv, const struct stat *st, - size_t buf_size, const char *name) +/** + * Internal helper for migrate_copy_data(). Check lease and report error if + * need be. + * + * \param[in] fd File descriptor on which to check the lease. + * + * \retval 0 Migration can keep on going. + * \retval -errno Error occurred, abort migration. + */ +static int check_lease(int fd) +{ + int rc; + + rc = llapi_lease_check(fd); + if (rc > 0) + return 0; /* llapi_check_lease returns > 0 on success. */ + + return -EBUSY; +} + +static int migrate_nonblock(int fd, int fdv) { __u64 dv1; __u64 dv2; @@ -623,80 +909,100 @@ static int migrate_nonblock(int fd, int fdv, const struct stat *st, rc = llapi_get_data_version(fd, &dv1, LL_DV_RD_FLUSH); if (rc < 0) { - fprintf(stderr, "%s: %s: cannot get data version: %s\n", - progname, name, strerror(-rc)); + error_loc = "cannot get data version"; return rc; } - rc = migrate_copy_data(fd, fdv, buf_size, false, name); + rc = migrate_copy_data(fd, fdv, check_lease); if (rc < 0) { - fprintf(stderr, "%s: %s: data copy failed\n", progname, name); + error_loc = "data copy failed"; return rc; } rc = llapi_get_data_version(fd, &dv2, LL_DV_RD_FLUSH); if (rc != 0) { - fprintf(stderr, "%s: %s: cannot get data version: %s\n", - progname, name, strerror(-rc)); + error_loc = "cannot get data version"; return rc; } if (dv1 != dv2) { rc = -EAGAIN; - fprintf(stderr, "%s: %s: data version changed during " - "migration\n", - progname, name); + error_loc = "source file changed"; return rc; } /* Make sure we keep original atime/mtime values */ - rc = migrate_copy_timestamps(fdv, st); - if (rc < 0) { - fprintf(stderr, "%s: %s: timestamp copy failed\n", - progname, name); - return rc; - } - - /* Atomically put lease, swap layouts and close. - * for a migration we need to check data version on file did - * not change. */ - rc = llapi_fswap_layouts(fd, fdv, 0, 0, SWAP_LAYOUTS_CLOSE); + rc = migrate_copy_timestamps(fd, fdv); if (rc < 0) { - fprintf(stderr, "%s: %s: cannot swap layouts: %s\n", - progname, name, strerror(-rc)); + error_loc = "timestamp copy failed"; return rc; } return 0; } -static int lfs_component_set(char *fname, int comp_id, __u32 flags) +static int lfs_component_set(char *fname, int comp_id, + __u32 flags, __u32 neg_flags) { - return -ENOTSUP; + __u32 ids[2]; + __u32 flags_array[2]; + size_t count = 0; + int rc; + + if (flags) { + ids[count] = comp_id; + flags_array[count] = flags; + ++count; + } + + if (neg_flags) { + ids[count] = comp_id; + flags_array[count] = neg_flags | LCME_FL_NEG; + ++count; + } + + rc = llapi_layout_file_comp_set(fname, ids, flags_array, count); + if (rc) + fprintf(stderr, + "%s: cannot change the flags of component '%#x' of file '%s': %x / ^(%x)\n", + progname, comp_id, fname, flags, neg_flags); + + return rc; } -static int lfs_component_del(char *fname, __u32 comp_id, __u32 flags) +static int lfs_component_del(char *fname, __u32 comp_id, + __u32 flags, __u32 neg_flags) { int rc = 0; - if (flags != 0 && comp_id != 0) + if (flags && neg_flags) + return -EINVAL; + + if (!flags && neg_flags) + flags = neg_flags | LCME_FL_NEG; + + if ((flags && comp_id) || (!flags && !comp_id)) return -EINVAL; /* LCME_FL_INIT is the only supported flag in PFL */ - if (flags != 0) { + if (flags) { if (flags & ~LCME_KNOWN_FLAGS) { - fprintf(stderr, "Invalid component flags %#x\n", flags); + fprintf(stderr, + "%s setstripe: unknown flags %#x\n", + progname, flags); return -EINVAL; } } else if (comp_id > LCME_ID_MAX) { - fprintf(stderr, "Invalid component id %u\n", comp_id); + fprintf(stderr, "%s setstripe: invalid component id %u\n", + progname, comp_id); return -EINVAL; } rc = llapi_layout_file_comp_del(fname, comp_id, flags); if (rc) - fprintf(stderr, "Delete component %#x from %s failed. %s\n", - comp_id, fname, strerror(errno)); + fprintf(stderr, + "%s setstripe: cannot delete component %#x from '%s': %s\n", + progname, comp_id, fname, strerror(errno)); return rc; } @@ -729,10 +1035,10 @@ static int lfs_component_create(char *fname, int open_flags, mode_t open_mode, fd = llapi_layout_file_open(fname, open_flags, open_mode, layout); if (fd < 0) - fprintf(stderr, "%s %s failed. %s\n", + fprintf(stderr, "%s: cannot %s '%s': %s\n", progname, S_ISDIR(st.st_mode) ? - "Set default composite layout to " : - "Create composite file", + "set default composite layout for" : + "create composite file", fname, strerror(errno)); return fd; } @@ -741,4789 +1047,7710 @@ static int lfs_migrate(char *name, __u64 migration_flags, struct llapi_stripe_param *param, struct llapi_layout *layout) { - int fd = -1; - int fdv = -1; - char parent[PATH_MAX]; - int mdt_index; - int random_value; - char volatile_file[sizeof(parent) + - LUSTRE_VOLATILE_HDR_LEN + - 2 * sizeof(mdt_index) + - 2 * sizeof(random_value) + 4]; - char *ptr; - int rc; - struct lov_user_md *lum = NULL; - int lum_size; - int buf_size = 1024 * 1024 * 4; - bool have_lease_rdlck = false; - struct stat st; - struct stat stv; + int fd = -1; + int fdv = -1; + int rc; - /* find the right size for the IO and allocate the buffer */ - lum_size = lov_user_md_size(LOV_MAX_STRIPE_COUNT, LOV_USER_MAGIC_V3); - lum = malloc(lum_size); - if (lum == NULL) { - rc = -ENOMEM; - goto free; - } + rc = migrate_open_files(name, migration_flags, param, layout, + &fd, &fdv); + if (rc < 0) + goto out; - rc = llapi_file_get_stripe(name, lum); - /* failure can happen for many reasons and some may be not real errors - * (eg: no stripe) - * in case of a real error, a later call will fail with better - * error management */ - if (rc == 0) { - if ((lum->lmm_magic == LOV_USER_MAGIC_V1 || - lum->lmm_magic == LOV_USER_MAGIC_V3) && - lum->lmm_stripe_size != 0) - buf_size = lum->lmm_stripe_size; + if (!(migration_flags & MIGRATION_NONBLOCK)) { + /* Blocking mode (forced if servers do not support file lease). + * It is also the default mode, since we cannot distinguish + * between a broken lease and a server that does not support + * atomic swap/close (LU-6785) */ + rc = migrate_block(fd, fdv); + goto out; } - /* open file, direct io */ - /* even if the file is only read, WR mode is nedeed to allow - * layout swap on fd */ - fd = open(name, O_RDWR | O_DIRECT); - if (fd == -1) { - rc = -errno; - fprintf(stderr, "%s: %s: cannot open: %s\n", progname, name, - strerror(-rc)); - goto free; - } - - if (file_lease_supported) { - rc = llapi_lease_get(fd, LL_LEASE_RDLCK); - if (rc == -EOPNOTSUPP) { - /* Older servers do not support file lease. - * Disable related checks. This opens race conditions - * as explained in LU-4840 */ - file_lease_supported = false; - } else if (rc < 0) { - fprintf(stderr, "%s: %s: cannot get open lease: %s\n", - progname, name, strerror(-rc)); - goto error; - } else { - have_lease_rdlck = true; - } + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); + if (rc < 0) { + error_loc = "cannot get lease"; + goto out; } - /* search for file directory pathname */ - if (strlen(name) > sizeof(parent)-1) { - rc = -E2BIG; - goto error; - } - strncpy(parent, name, sizeof(parent)); - ptr = strrchr(parent, '/'); - if (ptr == NULL) { - if (getcwd(parent, sizeof(parent)) == NULL) { - rc = -errno; - goto error; - } - } else { - if (ptr == parent) - strcpy(parent, "/"); - else - *ptr = '\0'; + rc = migrate_nonblock(fd, fdv); + if (rc < 0) { + llapi_lease_release(fd); + goto out; } - rc = llapi_file_fget_mdtidx(fd, &mdt_index); + /* Atomically put lease, swap layouts and close. + * for a migration we need to check data version on file did + * not change. */ + rc = llapi_fswap_layouts(fd, fdv, 0, 0, SWAP_LAYOUTS_CLOSE); if (rc < 0) { - fprintf(stderr, "%s: %s: cannot get MDT index: %s\n", - progname, name, strerror(-rc)); - goto error; + error_loc = "cannot swap layout"; + goto out; } - do { - int open_flags = O_WRONLY | O_CREAT | O_EXCL | O_NOFOLLOW; - mode_t open_mode = S_IRUSR | S_IWUSR; +out: + if (fd >= 0) + close(fd); - random_value = random(); - rc = snprintf(volatile_file, sizeof(volatile_file), - "%s/%s:%.4X:%.4X", parent, LUSTRE_VOLATILE_HDR, - mdt_index, random_value); - if (rc >= sizeof(volatile_file)) { - rc = -E2BIG; - goto error; - } + if (fdv >= 0) + close(fdv); - /* create, open a volatile file, use caching (ie no directio) */ - if (param != NULL) - fdv = llapi_file_open_param(volatile_file, open_flags, - open_mode, param); - else if (layout != NULL) - fdv = lfs_component_create(volatile_file, open_flags, - open_mode, layout); - else - fdv = -EINVAL; - } while (fdv == -EEXIST); + if (rc < 0) + fprintf(stderr, "error: %s: %s: %s: %s\n", + progname, name, error_loc, strerror(-rc)); + return rc; +} - if (fdv < 0) { - rc = fdv; - fprintf(stderr, "%s: %s: cannot create volatile file in" - " directory: %s\n", - progname, parent, strerror(-rc)); - goto error; - } +static int comp_str2flags(char *string, __u32 *flags, __u32 *neg_flags) +{ + char *name; - /* In case the MDT does not support creation of volatile files - * we should try to unlink it. */ - (void)unlink(volatile_file); + if (string == NULL) + return -EINVAL; - /* Not-owner (root?) special case. - * Need to set owner/group of volatile file like original. - * This will allow to pass related check during layout_swap. - */ - rc = fstat(fd, &st); - if (rc != 0) { - rc = -errno; - fprintf(stderr, "%s: %s: cannot stat: %s\n", progname, name, - strerror(errno)); - goto error; - } - rc = fstat(fdv, &stv); - if (rc != 0) { - rc = -errno; - fprintf(stderr, "%s: %s: cannot stat: %s\n", progname, - volatile_file, strerror(errno)); - goto error; - } - if (st.st_uid != stv.st_uid || st.st_gid != stv.st_gid) { - rc = fchown(fdv, st.st_uid, st.st_gid); - if (rc != 0) { - rc = -errno; - fprintf(stderr, "%s: %s: cannot chown: %s\n", progname, - name, strerror(errno)); - goto error; - } - } + *flags = 0; + *neg_flags = 0; + for (name = strtok(string, ","); name; name = strtok(NULL, ",")) { + bool found = false; + int i; + + for (i = 0; i < ARRAY_SIZE(comp_flags_table); i++) { + __u32 comp_flag = comp_flags_table[i].cfn_flag; + const char *comp_name = comp_flags_table[i].cfn_name; - if (migration_flags & MIGRATION_NONBLOCK && file_lease_supported) { - rc = migrate_nonblock(fd, fdv, &st, buf_size, name); - if (rc == 0) { - have_lease_rdlck = false; - fdv = -1; /* The volatile file is closed as we put the - * lease in non-blocking mode. */ + if (strcmp(name, comp_name) == 0) { + *flags |= comp_flag; + found = true; + } else if (strncmp(name, "^", 1) == 0 && + strcmp(name + 1, comp_name) == 0) { + *neg_flags |= comp_flag; + found = true; + } + } + if (!found) { + llapi_printf(LLAPI_MSG_ERROR, + "%s: component flag '%s' not supported\n", + progname, name); + return -EINVAL; } - } else { - /* Blocking mode (forced if servers do not support file lease). - * It is also the default mode, since we cannot distinguish - * between a broken lease and a server that does not support - * atomic swap/close (LU-6785) */ - rc = migrate_block(fd, fdv, &st, buf_size, name); } -error: - if (have_lease_rdlck) - llapi_lease_put(fd); + if (!*flags && !*neg_flags) + return -EINVAL; - if (fd >= 0) - close(fd); + /* don't allow to set and exclude the same flag */ + if (*flags & *neg_flags) + return -EINVAL; - if (fdv >= 0) - close(fdv); + return 0; +} -free: - if (lum) - free(lum); +static int mirror_str2state(char *string, __u16 *state, __u16 *neg_state) +{ + if (string == NULL) + return -EINVAL; - return rc; + *state = 0; + *neg_state = 0; + + if (strncmp(string, "^", 1) == 0) { + *neg_state = llapi_layout_string_flags(string + 1); + if (*neg_state != 0) + return 0; + } else { + *state = llapi_layout_string_flags(string); + if (*state != 0) + return 0; + } + + llapi_printf(LLAPI_MSG_ERROR, + "%s: mirrored file state '%s' not supported\n", + progname, string); + return -EINVAL; } /** - * Parse a string containing an OST index list into an array of integers. - * - * The input string contains a comma delimited list of individual - * indices and ranges, for example "1,2-4,7". Add the indices into the - * \a osts array and remove duplicates. + * struct mirror_args - Command-line arguments for mirror(s). + * @m_count: Number of mirrors to be created with this layout. + * @m_flags: Mirror level flags, only 'prefer' is supported. + * @m_layout: Mirror layout. + * @m_file: A victim file. Its layout will be split and used as a mirror. + * @m_next: Point to the next node of the list. * - * \param[out] osts array to store indices in - * \param[in] size size of \a osts array - * \param[in] offset starting index in \a osts - * \param[in] arg string containing OST index list - * - * \retval positive number of indices in \a osts - * \retval -EINVAL unable to parse \a arg + * Command-line arguments for mirror(s) will be parsed and stored in + * a linked list that consists of this structure. */ -static int parse_targets(__u32 *osts, int size, int offset, char *arg) +struct mirror_args { + __u32 m_count; + __u32 m_flags; + struct llapi_layout *m_layout; + const char *m_file; + struct mirror_args *m_next; +}; + +static int mirror_sanity_check_flags(struct llapi_layout *layout, void *unused) { + uint32_t flags; int rc; - int nr = offset; - int slots = size - offset; - char *ptr = NULL; - bool end_of_loop; - if (arg == NULL) + rc = llapi_layout_comp_flags_get(layout, &flags); + if (rc) + return -errno; + + if (flags & LCME_FL_NEG) { + fprintf(stderr, "error: %s: negative flags are not supported\n", + progname); return -EINVAL; + } - end_of_loop = false; - while (!end_of_loop) { - int start_index; - int end_index; - int i; - char *endptr = NULL; + if (flags & LCME_FL_STALE) { + fprintf(stderr, "error: %s: setting '%s' is not supported\n", + progname, comp_flags_table[LCME_FL_STALE].cfn_name); + return -EINVAL; + } - rc = -EINVAL; + return LLAPI_LAYOUT_ITER_CONT; +} - ptr = strchrnul(arg, ','); +static inline int mirror_sanity_check_one(struct llapi_layout *layout) +{ + uint64_t start, end; + uint64_t pattern; + int rc; - end_of_loop = *ptr == '\0'; - *ptr = '\0'; + /* LU-10112: do not support dom+flr in phase 1 */ + rc = llapi_layout_comp_use(layout, LLAPI_LAYOUT_COMP_USE_FIRST); + if (rc) + return -errno; - start_index = strtol(arg, &endptr, 0); - if (endptr == arg) /* no data at all */ - break; - if (*endptr != '-' && *endptr != '\0') /* has invalid data */ - break; - if (start_index < 0) - break; + rc = llapi_layout_pattern_get(layout, &pattern); + if (rc) + return -errno; - end_index = start_index; - if (*endptr == '-') { - end_index = strtol(endptr + 1, &endptr, 0); - if (*endptr != '\0') - break; - if (end_index < start_index) - break; - } + if (pattern == LOV_PATTERN_MDT || pattern == LLAPI_LAYOUT_MDT) { + fprintf(stderr, "error: %s: doesn't support dom+flr for now\n", + progname); + return -ENOTSUP; + } - for (i = start_index; i <= end_index && slots > 0; i++) { - int j; + rc = llapi_layout_comp_use(layout, LLAPI_LAYOUT_COMP_USE_LAST); + if (rc) + return -errno; - /* remove duplicate */ - for (j = 0; j < offset; j++) { - if (osts[j] == i) - break; - } - if (j == offset) { /* no duplicate */ - osts[nr++] = i; - --slots; - } - } - if (slots == 0 && i < end_index) - break; + rc = llapi_layout_comp_extent_get(layout, &start, &end); + if (rc) + return -errno; - *ptr = ','; - arg = ++ptr; - offset = nr; - rc = 0; + if (end != LUSTRE_EOF) { + fprintf(stderr, "error: %s: mirror layout doesn't reach eof\n", + progname); + return -EINVAL; } - if (!end_of_loop && ptr != NULL) - *ptr = ','; - return rc < 0 ? rc : nr; + rc = llapi_layout_comp_iterate(layout, mirror_sanity_check_flags, NULL); + return rc; } -struct lfs_setstripe_args { - unsigned long long lsa_comp_end; - unsigned long long lsa_stripe_size; - int lsa_stripe_count; - int lsa_stripe_off; - __u32 lsa_comp_flags; - int lsa_nr_osts; - int lsa_pattern; - __u32 *lsa_osts; - char *lsa_pool_name; +/** + * enum mirror_flags - Flags for extending a mirrored file. + * @MF_NO_VERIFY: Indicates not to verify the mirror(s) from victim file(s) + * in case the victim file(s) contains the same data as the + * original mirrored file. + * @MF_DESTROY: Indicates to delete the mirror from the mirrored file. + * + * Flags for extending a mirrored file. + */ +enum mirror_flags { + MF_NO_VERIFY = 0x1, + MF_DESTROY = 0x2, }; -static inline void setstripe_args_init(struct lfs_setstripe_args *lsa) +/** + * mirror_create_sanity_check() - Check mirror list. + * @list: A linked list that stores the mirror arguments. + * + * This function does a sanity check on @list for creating + * a mirrored file. + * + * Return: 0 on success or a negative error code on failure. + */ +static int mirror_create_sanity_check(const char *fname, + struct mirror_args *list) { - memset(lsa, 0, sizeof(*lsa)); - lsa->lsa_stripe_off = -1; -} + int rc = 0; + bool has_m_file = false; + bool has_m_layout = false; -static inline bool setstripe_args_specified(struct lfs_setstripe_args *lsa) -{ - return (lsa->lsa_stripe_size != 0 || lsa->lsa_stripe_count != 0 || - lsa->lsa_stripe_off != -1 || lsa->lsa_pool_name != NULL || - lsa->lsa_comp_end != 0 || lsa->lsa_pattern != 0); -} + if (list == NULL) + return -EINVAL; -static int comp_args_to_layout(struct llapi_layout **composite, - struct lfs_setstripe_args *lsa) -{ - struct llapi_layout *layout = *composite; - uint64_t prev_end = 0; - int i = 0, rc; + if (fname) { + struct llapi_layout *layout; - if (layout == NULL) { - layout = llapi_layout_alloc(); - if (layout == NULL) { - fprintf(stderr, "Alloc llapi_layout failed. %s\n", - strerror(errno)); - return -ENOMEM; + layout = llapi_layout_get_by_path(fname, 0); + if (!layout) { + fprintf(stderr, + "error: %s: file '%s' couldn't get layout\n", + progname, fname); + return -ENODATA; } - *composite = layout; - } else { - uint64_t start; - /* Get current component extent, current component - * must be the tail component. */ - rc = llapi_layout_comp_extent_get(layout, &start, &prev_end); - if (rc) { - fprintf(stderr, "Get comp extent failed. %s\n", - strerror(errno)); + rc = mirror_sanity_check_one(layout); + llapi_layout_free(layout); + + if (rc) return rc; + } + + while (list != NULL) { + if (list->m_file != NULL) { + has_m_file = true; + llapi_layout_free(list->m_layout); + + list->m_layout = + llapi_layout_get_by_path(list->m_file, 0); + if (list->m_layout == NULL) { + fprintf(stderr, + "error: %s: file '%s' has no layout\n", + progname, list->m_file); + return -ENODATA; + } + } else { + has_m_layout = true; + if (list->m_layout == NULL) { + fprintf(stderr, "error: %s: no mirror layout\n", + progname); + return -EINVAL; + } } - rc = llapi_layout_comp_add(layout); - if (rc) { - fprintf(stderr, "Add component failed. %s\n", - strerror(errno)); + rc = mirror_sanity_check_one(list->m_layout); + if (rc) return rc; - } + + list = list->m_next; } - rc = llapi_layout_comp_extent_set(layout, prev_end, lsa->lsa_comp_end); - if (rc) { - fprintf(stderr, "Set extent [%lu, %llu) failed. %s\n", - prev_end, lsa->lsa_comp_end, strerror(errno)); + if (has_m_file && has_m_layout) { + fprintf(stderr, + "error: %s: -f option should not be specified with setstripe options\n", + progname); + return -EINVAL; + } + + return 0; +} + +static int mirror_set_flags(struct llapi_layout *layout, void *cbdata) +{ + __u32 mirror_flags = *(__u32 *)cbdata; + uint32_t flags; + int rc; + + rc = llapi_layout_comp_flags_get(layout, &flags); + if (rc < 0) return rc; + + if (!flags) { + rc = llapi_layout_comp_flags_set(layout, mirror_flags); + if (rc) + return rc; } - /* Data-on-MDT component setting */ - if (lsa->lsa_pattern == LLAPI_LAYOUT_MDT) { - /* In case of Data-on-MDT patterns the only extra option - * applicable is stripe size option. */ - if (lsa->lsa_stripe_count) { - fprintf(stderr, "Option 'stripe-count' can't be " - "specified with Data-on-MDT component: %i\n", - lsa->lsa_stripe_count); - return -EINVAL; - } - if (lsa->lsa_stripe_size) { - fprintf(stderr, "Option 'stripe-size' can't be " - "specified with Data-on-MDT component: %llu\n", - lsa->lsa_stripe_size); - return -EINVAL; - } - if (lsa->lsa_nr_osts != 0) { - fprintf(stderr, "Option 'ost-list' can't be specified " - "with Data-on-MDT component: '%i'\n", - lsa->lsa_nr_osts); - return -EINVAL; - } - if (lsa->lsa_stripe_off != -1) { - fprintf(stderr, "Option 'stripe-offset' can't be " - "specified with Data-on-MDT component: %i\n", - lsa->lsa_stripe_off); - return -EINVAL; - } - if (lsa->lsa_pool_name != 0) { - fprintf(stderr, "Option 'pool' can't be specified " - "with Data-on-MDT component: '%s'\n", - lsa->lsa_pool_name); - return -EINVAL; - } + return LLAPI_LAYOUT_ITER_CONT; +} - rc = llapi_layout_pattern_set(layout, lsa->lsa_pattern); +/** + * mirror_create() - Create a mirrored file. + * @fname: The file to be created. + * @mirror_list: A linked list that stores the mirror arguments. + * + * This function creates a mirrored file @fname with the mirror(s) + * from @mirror_list. + * + * Return: 0 on success or a negative error code on failure. + */ +static int mirror_create(char *fname, struct mirror_args *mirror_list) +{ + struct llapi_layout *layout = NULL; + struct mirror_args *cur_mirror = NULL; + uint16_t mirror_count = 0; + int i = 0; + int rc = 0; + + rc = mirror_create_sanity_check(NULL, mirror_list); + if (rc) + return rc; + + cur_mirror = mirror_list; + while (cur_mirror != NULL) { + rc = llapi_layout_comp_iterate(cur_mirror->m_layout, + mirror_set_flags, + &cur_mirror->m_flags); if (rc) { - fprintf(stderr, "Set stripe pattern %#x failed. %s\n", - lsa->lsa_pattern, strerror(errno)); - return rc; + rc = -errno; + fprintf(stderr, "%s: failed to set mirror flags\n", + progname); + goto error; } - /* Data-on-MDT component has always single stripe up to end */ - lsa->lsa_stripe_size = lsa->lsa_comp_end; - } - if (lsa->lsa_stripe_size != 0) { - rc = llapi_layout_stripe_size_set(layout, - lsa->lsa_stripe_size); - if (rc) { - fprintf(stderr, "Set stripe size %llu failed. %s\n", - lsa->lsa_stripe_size, strerror(errno)); - return rc; + for (i = 0; i < cur_mirror->m_count; i++) { + rc = llapi_layout_merge(&layout, cur_mirror->m_layout); + if (rc) { + rc = -errno; + fprintf(stderr, "error: %s: " + "merge layout failed: %s\n", + progname, strerror(errno)); + goto error; + } } + mirror_count += cur_mirror->m_count; + cur_mirror = cur_mirror->m_next; } - if (lsa->lsa_stripe_count != 0) { - rc = llapi_layout_stripe_count_set(layout, - lsa->lsa_stripe_count == -1 ? - LLAPI_LAYOUT_WIDE : - lsa->lsa_stripe_count); - if (rc) { - fprintf(stderr, "Set stripe count %d failed. %s\n", - lsa->lsa_stripe_count, strerror(errno)); - return rc; - } + if (layout == NULL) { + fprintf(stderr, "error: %s: layout is NULL\n", progname); + return -EINVAL; } - if (lsa->lsa_pool_name != NULL) { - rc = llapi_layout_pool_name_set(layout, lsa->lsa_pool_name); - if (rc) { - fprintf(stderr, "Set pool name: %s failed. %s\n", - lsa->lsa_pool_name, strerror(errno)); - return rc; - } + rc = llapi_layout_mirror_count_set(layout, mirror_count); + if (rc) { + rc = -errno; + fprintf(stderr, "error: %s: set mirror count failed: %s\n", + progname, strerror(errno)); + goto error; } - if (lsa->lsa_nr_osts > 0) { - if (lsa->lsa_stripe_count > 0 && - lsa->lsa_nr_osts != lsa->lsa_stripe_count) { - fprintf(stderr, "stripe_count(%d) != nr_osts(%d)\n", - lsa->lsa_stripe_count, lsa->lsa_nr_osts); - return -EINVAL; - } - for (i = 0; i < lsa->lsa_nr_osts; i++) { - rc = llapi_layout_ost_index_set(layout, i, - lsa->lsa_osts[i]); - if (rc) - break; - } - } else if (lsa->lsa_stripe_off != -1) { - rc = llapi_layout_ost_index_set(layout, 0, lsa->lsa_stripe_off); + rc = lfs_component_create(fname, O_CREAT | O_WRONLY, 0666, + layout); + if (rc >= 0) { + close(rc); + rc = 0; } - if (rc) { - fprintf(stderr, "Set ost index %d failed. %s\n", - i, strerror(errno)); - return rc; + +error: + llapi_layout_free(layout); + return rc; +} + +/** + * Compare files and check lease on @fd. + * + * \retval bytes number of bytes are the same + */ +static ssize_t mirror_file_compare(int fd, int fdv) +{ + const size_t buflen = 4 * 1024 * 1024; /* 4M */ + void *buf; + ssize_t bytes_done = 0; + ssize_t bytes_read = 0; + + buf = malloc(buflen * 2); + if (!buf) + return -ENOMEM; + + while (1) { + if (!llapi_lease_check(fd)) { + bytes_done = -EBUSY; + break; + } + + bytes_read = read(fd, buf, buflen); + if (bytes_read <= 0) + break; + + if (bytes_read != read(fdv, buf + buflen, buflen)) + break; + + /* XXX: should compute the checksum on each buffer and then + * compare checksum to avoid cache collision */ + if (memcmp(buf, buf + buflen, bytes_read)) + break; + + bytes_done += bytes_read; } - return 0; + free(buf); + + return bytes_done; } -/* In 'lfs setstripe --component-add' mode, we need to fetch the extent - * end of the last component in the existing file, and adjust the - * first extent start of the components to be added accordingly. */ -static int adjust_first_extent(char *fname, struct llapi_layout *layout) +static int mirror_extend_file(const char *fname, const char *victim_file, + enum mirror_flags mirror_flags) { - struct llapi_layout *head; - uint64_t start, end, stripe_size, prev_end = 0; + int fd = -1; + int fdv = -1; + struct stat stbuf; + struct stat stbuf_v; + struct ll_ioc_lease *data = NULL; int rc; - if (layout == NULL) - return -EINVAL; + fd = open(fname, O_RDWR); + if (fd < 0) { + error_loc = "open source file"; + rc = -errno; + goto out; + } - errno = 0; - head = llapi_layout_get_by_path(fname, 0); - if (head == NULL) { - fprintf(stderr, "Read layout from %s failed. %s\n", - fname, strerror(errno)); - return -EINVAL; - } else if (errno == ENODATA) { - /* file without LOVEA, this component-add will be turned - * into a component-create. */ - llapi_layout_free(head); - return -ENODATA; - } else if (!llapi_layout_is_composite(head)) { - fprintf(stderr, "'%s' isn't a composite file.\n", - fname); - llapi_layout_free(head); - return -EINVAL; + fdv = open(victim_file, O_RDWR); + if (fdv < 0) { + error_loc = "open target file"; + rc = -errno; + goto out; } - rc = llapi_layout_comp_extent_get(head, &start, &prev_end); - if (rc) { - fprintf(stderr, "Get prev extent failed. %s\n", - strerror(errno)); - llapi_layout_free(head); - return rc; + if (fstat(fd, &stbuf) || fstat(fdv, &stbuf_v)) { + error_loc = "stat source or target file"; + rc = -errno; + goto out; } - llapi_layout_free(head); + if (stbuf.st_dev != stbuf_v.st_dev) { + error_loc = "stat source and target file"; + rc = -EXDEV; + goto out; + } - /* Make sure we use the first component of the layout to be added. */ - rc = llapi_layout_comp_use(layout, LLAPI_LAYOUT_COMP_USE_FIRST); + /* mirrors should be of the same size */ + if (stbuf.st_size != stbuf_v.st_size) { + error_loc = "file sizes don't match"; + rc = -EINVAL; + goto out; + } + + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); if (rc < 0) { - fprintf(stderr, "Move component cursor failed. %s\n", - strerror(errno)); - return rc; + error_loc = "cannot get lease"; + goto out; } - rc = llapi_layout_comp_extent_get(layout, &start, &end); - if (rc) { - fprintf(stderr, "Get extent failed. %s\n", strerror(errno)); - return rc; + if (!(mirror_flags & MF_NO_VERIFY)) { + ssize_t ret; + /* mirrors should have the same contents */ + ret = mirror_file_compare(fd, fdv); + if (ret != stbuf.st_size) { + error_loc = "file busy or contents don't match"; + rc = ret < 0 ? ret : -EINVAL; + goto out; + } } - if (start > prev_end || end <= prev_end) { - fprintf(stderr, "First extent to be set [%lu, %lu) isn't " - "adjacent with the existing file extent end: %lu\n", - start, end, prev_end); - return -EINVAL; + /* Get rid of caching pages from clients */ + rc = llapi_file_flush(fd); + if (rc < 0) { + error_loc = "cannot get data version"; + goto out; } - rc = llapi_layout_stripe_size_get(layout, &stripe_size); - if (rc) { - fprintf(stderr, "Get stripe size failed. %s\n", - strerror(errno)); - return rc; + rc = llapi_file_flush(fdv); + if (rc < 0) { + error_loc = "cannot get data version"; + goto out; + } - if (stripe_size != LLAPI_LAYOUT_DEFAULT && - (prev_end & (stripe_size - 1))) { - fprintf(stderr, "Stripe size %lu not aligned with %lu\n", - stripe_size, prev_end); - return -EINVAL; + /* Make sure we keep original atime/mtime values */ + rc = migrate_copy_timestamps(fd, fdv); + if (rc < 0) { + error_loc = "cannot copy timestamp"; + goto out; } - rc = llapi_layout_comp_extent_set(layout, prev_end, end); - if (rc) { - fprintf(stderr, "Set component extent [%lu, %lu) failed. %s\n", - prev_end, end, strerror(errno)); - return rc; + /* Atomically put lease, merge layouts and close. */ + data = calloc(1, offsetof(typeof(*data), lil_ids[1])); + if (!data) { + error_loc = "memory allocation"; + goto out; + } + data->lil_mode = LL_LEASE_UNLCK; + data->lil_flags = LL_LEASE_LAYOUT_MERGE; + data->lil_count = 1; + data->lil_ids[0] = fdv; + rc = llapi_lease_set(fd, data); + if (rc < 0) { + error_loc = "cannot merge layout"; + goto out; + } else if (rc == 0) { + rc = -EBUSY; + error_loc = "lost lease lock"; + goto out; } + rc = 0; - return 0; +out: + if (data) + free(data); + if (fd >= 0) + close(fd); + if (fdv >= 0) + close(fdv); + if (!rc) + (void) unlink(victim_file); + if (rc < 0) + fprintf(stderr, "error: %s: %s: %s: %s\n", + progname, fname, error_loc, strerror(-rc)); + return rc; } -static inline bool comp_flags_is_neg(__u32 flags) +static int mirror_extend_layout(char *name, struct llapi_layout *layout) { - return flags & LCME_FL_NEG; -} + struct ll_ioc_lease *data = NULL; + int fd = -1; + int fdv = -1; + int rc; -static inline void comp_flags_set_neg(__u32 *flags) -{ - *flags |= LCME_FL_NEG; -} + rc = migrate_open_files(name, 0, NULL, layout, &fd, &fdv); + if (rc < 0) + goto out; -static inline void comp_flags_clear_neg(__u32 *flags) -{ - *flags &= ~LCME_FL_NEG; + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); + if (rc < 0) { + error_loc = "cannot get lease"; + goto out; + } + + rc = migrate_nonblock(fd, fdv); + if (rc < 0) { + llapi_lease_release(fd); + goto out; + } + + /* Atomically put lease, merge layouts and close. */ + data = calloc(1, offsetof(typeof(*data), lil_ids[1])); + if (!data) { + error_loc = "memory allocation"; + goto out; + } + data->lil_mode = LL_LEASE_UNLCK; + data->lil_flags = LL_LEASE_LAYOUT_MERGE; + data->lil_count = 1; + data->lil_ids[0] = fdv; + rc = llapi_lease_set(fd, data); + if (rc < 0) { + error_loc = "cannot merge layout"; + goto out; + } else if (rc == 0) { + rc = -EBUSY; + error_loc = "lost lease lock"; + goto out; + } + rc = 0; + +out: + if (data) + free(data); + if (fd >= 0) + close(fd); + if (fdv >= 0) + close(fdv); + if (rc < 0) + fprintf(stderr, "error: %s: %s: %s: %s\n", + progname, name, error_loc, strerror(-rc)); + return rc; } -static int comp_str2flags(__u32 *flags, char *string) +static int mirror_extend(char *fname, struct mirror_args *mirror_list, + enum mirror_flags mirror_flags) { - char *name; - __u32 neg_flags = 0; + int rc; - if (string == NULL) - return -EINVAL; + rc = mirror_create_sanity_check(fname, mirror_list); + if (rc) + return rc; - *flags = 0; - for (name = strtok(string, ","); name; name = strtok(NULL, ",")) { - bool found = false; - int i; + while (mirror_list) { + if (mirror_list->m_file != NULL) { + rc = mirror_extend_file(fname, mirror_list->m_file, + mirror_flags); + } else { + __u32 mirror_count = mirror_list->m_count; - for (i = 0; i < ARRAY_SIZE(comp_flags_table); i++) { - __u32 comp_flag = comp_flags_table[i].cfn_flag; - const char *comp_name = comp_flags_table[i].cfn_name; + while (mirror_count > 0) { + rc = mirror_extend_layout(fname, + mirror_list->m_layout); + if (rc) + break; - if (strcmp(name, comp_name) == 0) { - *flags |= comp_flag; - found = true; - } else if (strncmp(name, "^", 1) == 0 && - strcmp(name + 1, comp_name) == 0) { - neg_flags |= comp_flag; - found = true; + --mirror_count; } } - if (!found) { - llapi_printf(LLAPI_MSG_ERROR, "Component flag " - "'%s' is not supported.\n", name); - return -EINVAL; - } - } - - if (*flags == 0 && neg_flags == 0) - return -EINVAL; - /* don't support mixed flags for now */ - if (*flags && neg_flags) - return -EINVAL; + if (rc) + break; - if (neg_flags) { - *flags = neg_flags; - comp_flags_set_neg(flags); + mirror_list = mirror_list->m_next; } - return 0; + return rc; } -static inline bool arg_is_eof(char *arg) +static int verify_id(struct llapi_layout *layout, void *cbdata) { - return !strncmp(arg, "-1", strlen("-1")) || - !strncmp(arg, "EOF", strlen("EOF")) || - !strncmp(arg, "eof", strlen("eof")); -} + uint32_t id; + int rc; -enum { - LFS_POOL_OPT = 3, - LFS_COMP_COUNT_OPT, - LFS_COMP_START_OPT, - LFS_COMP_FLAGS_OPT, - LFS_COMP_DEL_OPT, - LFS_COMP_SET_OPT, - LFS_COMP_ADD_OPT, - LFS_PROJID_OPT, -}; + rc = llapi_layout_mirror_id_get(layout, &id); + if (rc < 0) + return rc; -/* functions */ -static int lfs_setstripe(int argc, char **argv) + if ((__u16)id == *(__u16 *)cbdata) + return LLAPI_LAYOUT_ITER_STOP; + + return LLAPI_LAYOUT_ITER_CONT; +} + +static int mirror_split(const char *fname, __u16 mirror_id, + enum mirror_flags mflags, const char *victim_file) { - struct lfs_setstripe_args lsa; - struct llapi_stripe_param *param = NULL; - struct find_param migrate_mdt_param = { - .fp_max_depth = -1, - .fp_mdt_index = -1, - }; - char *fname; - int result; - int result2 = 0; - char *end; - int c; - int delete = 0; - char *mdt_idx_arg = NULL; - unsigned long long size_units = 1; - bool migrate_mode = false; - bool migration_block = false; - __u64 migration_flags = 0; - __u32 osts[LOV_MAX_STRIPE_COUNT] = { 0 }; - int comp_del = 0, comp_set = 0; - int comp_add = 0; - __u32 comp_id = 0; - struct llapi_layout *layout = NULL; - - struct option long_opts[] = { - /* --block is only valid in migrate mode */ - { .val = 'b', .name = "block", .has_arg = no_argument}, - { .val = LFS_COMP_ADD_OPT, - .name = "comp-add", .has_arg = no_argument}, - { .val = LFS_COMP_ADD_OPT, - .name = "component-add", - .has_arg = no_argument}, - { .val = LFS_COMP_DEL_OPT, - .name = "comp-del", .has_arg = no_argument}, - { .val = LFS_COMP_DEL_OPT, - .name = "component-del", - .has_arg = no_argument}, - { .val = LFS_COMP_FLAGS_OPT, - .name = "comp-flags", .has_arg = required_argument}, - { .val = LFS_COMP_FLAGS_OPT, - .name = "component-flags", - .has_arg = required_argument}, - { .val = LFS_COMP_SET_OPT, - .name = "comp-set", .has_arg = no_argument}, - { .val = LFS_COMP_SET_OPT, - .name = "component-set", - .has_arg = no_argument}, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "stripe-count", but was explicitly - * made "stripe-count" for consistency with other options, - * and to separate it from "mdt-count" when DNE arrives. */ - { .val = 'c', .name = "count", .has_arg = required_argument }, -#endif - { .val = 'c', .name = "stripe-count", .has_arg = required_argument}, - { .val = 'c', .name = "stripe_count", .has_arg = required_argument}, - { .val = 'd', .name = "delete", .has_arg = no_argument}, - { .val = 'E', .name = "comp-end", .has_arg = required_argument}, - { .val = 'E', .name = "component-end", - .has_arg = required_argument}, - /* dirstripe {"mdt-hash", required_argument, 0, 'H'}, */ -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "stripe-index", but was explicitly - * made "stripe-index" for consistency with other options, - * and to separate it from "mdt-index" when DNE arrives. */ - { .val = 'i', .name = "index", .has_arg = required_argument }, -#endif - { .val = 'i', .name = "stripe-index", .has_arg = required_argument}, - { .val = 'i', .name = "stripe_index", .has_arg = required_argument}, - { .val = 'I', .name = "comp-id", .has_arg = required_argument}, - { .val = 'I', .name = "component-id", .has_arg = required_argument}, - { .val = 'm', .name = "mdt", .has_arg = required_argument}, - { .val = 'm', .name = "mdt-index", .has_arg = required_argument}, - { .val = 'm', .name = "mdt_index", .has_arg = required_argument}, - /* --non-block is only valid in migrate mode */ - { .val = 'n', .name = "non-block", .has_arg = no_argument}, - { .val = 'o', .name = "ost", .has_arg = required_argument}, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 'o', .name = "ost-list", .has_arg = required_argument }, - { .val = 'o', .name = "ost_list", .has_arg = required_argument }, -#endif - { .val = 'p', .name = "pool", .has_arg = required_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "--stripe-size", but was confusing - * with "lfs find --size|-s", which means "file size", so use - * the consistent "--stripe-size|-S" for all commands. */ - { .val = 's', .name = "size", .has_arg = required_argument }, -#endif - { .val = 'L', .name = "layout", .has_arg = required_argument }, - { .val = 'S', .name = "stripe-size", .has_arg = required_argument }, - { .val = 'S', .name = "stripe_size", .has_arg = required_argument }, - /* dirstripe {"mdt-count", required_argument, 0, 'T'}, */ - /* --verbose is only valid in migrate mode */ - { .val = 'v', .name = "verbose", .has_arg = no_argument }, - { .val = LFS_COMP_ADD_OPT, - .name = "component-add", - .has_arg = no_argument }, - { .val = LFS_COMP_DEL_OPT, - .name = "component-del", - .has_arg = no_argument }, - { .val = LFS_COMP_FLAGS_OPT, - .name = "component-flags", - .has_arg = required_argument }, - { .val = LFS_COMP_SET_OPT, - .name = "component-set", - .has_arg = no_argument }, - { .name = NULL } }; + struct llapi_layout *layout; + char parent[PATH_MAX]; + char victim[PATH_MAX]; + int flags = O_CREAT | O_EXCL | O_LOV_DELAY_CREATE | O_NOFOLLOW; + char *ptr; + struct ll_ioc_lease *data; + uint16_t mirror_count; + int mdt_index; + int fd, fdv; + int rc; - setstripe_args_init(&lsa); + /* check fname contains mirror with mirror_id */ + layout = llapi_layout_get_by_path(fname, 0); + if (!layout) { + fprintf(stderr, + "error %s: file '%s' couldn't get layout\n", + progname, fname); + return -EINVAL; + } - if (strcmp(argv[0], "migrate") == 0) - migrate_mode = true; + rc = mirror_sanity_check_one(layout); + if (rc) + goto free_layout; - while ((c = getopt_long(argc, argv, "bc:dE:i:I:m:no:p:L:s:S:v", - long_opts, NULL)) >= 0) { - switch (c) { - case 0: - /* Long options. */ - break; - case LFS_COMP_ADD_OPT: - comp_add = 1; - break; - case LFS_COMP_DEL_OPT: - comp_del = 1; - break; - case LFS_COMP_FLAGS_OPT: - result = comp_str2flags(&lsa.lsa_comp_flags, optarg); - if (result != 0) { - fprintf(stderr, "error: %s: bad comp flags " - "'%s'\n", argv[0], optarg); - goto error; - } - break; - case LFS_COMP_SET_OPT: - comp_set = 1; - break; - case 'b': - if (!migrate_mode) { - fprintf(stderr, "--block is valid only for" - " migrate mode\n"); - goto error; - } - migration_block = true; - break; - case 'c': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 6, 53, 0) - if (strcmp(argv[optind - 1], "--count") == 0) - fprintf(stderr, "warning: '--count' deprecated" - ", use '--stripe-count' instead\n"); -#endif - lsa.lsa_stripe_count = strtoul(optarg, &end, 0); - if (*end != '\0') { - fprintf(stderr, "error: %s: bad stripe count " - "'%s'\n", argv[0], optarg); - goto error; - } - break; - case 'd': - /* delete the default striping pattern */ - delete = 1; - break; - case 'E': - if (lsa.lsa_comp_end != 0) { - result = comp_args_to_layout(&layout, &lsa); - if (result) - goto error; + rc = llapi_layout_mirror_count_get(layout, &mirror_count); + if (rc) { + fprintf(stderr, + "error %s: file '%s' couldn't get mirror count\n", + progname, fname); + goto free_layout; + } + if (mirror_count < 2) { + fprintf(stderr, + "error %s: file '%s' has %d component, cannot split\n", + progname, fname, mirror_count); + goto free_layout; + } - setstripe_args_init(&lsa); - } + rc = llapi_layout_comp_iterate(layout, verify_id, &mirror_id); + if (rc < 0) { + fprintf(stderr, "error %s: failed to iterate layout of '%s'\n", + progname, fname); + goto free_layout; + } else if (rc == LLAPI_LAYOUT_ITER_CONT) { + fprintf(stderr, + "error %s: file '%s' does not contain mirror with id %u\n", + progname, fname, mirror_id); + goto free_layout; + } - if (arg_is_eof(optarg)) { - lsa.lsa_comp_end = LUSTRE_EOF; - } else { - result = llapi_parse_size(optarg, - &lsa.lsa_comp_end, - &size_units, 0); - if (result) { - fprintf(stderr, "error: %s: " - "bad component end '%s'\n", - argv[0], optarg); - goto error; - } - } - break; - case 'L': - if (strcmp(argv[optind - 1], "mdt") == 0) { - /* Can be only the first component */ - if (layout != NULL) { - fprintf(stderr, "error: 'mdt' layout " - "can be only the first one\n"); - goto error; - } - if (lsa.lsa_comp_end > (1ULL << 30)) { /* 1Gb */ - fprintf(stderr, "error: 'mdt' layout " - "size is too big\n"); - goto error; - } - lsa.lsa_pattern = LLAPI_LAYOUT_MDT; - } else if (strcmp(argv[optind - 1], "raid0") != 0) { - fprintf(stderr, "error: layout '%s' is " - "unknown, supported layouts are: " - "'mdt', 'raid0'\n", argv[optind]); - goto error; - } - break; - case 'i': - if (strcmp(argv[optind - 1], "--index") == 0) - fprintf(stderr, "warning: '--index' deprecated" - ", use '--stripe-index' instead\n"); - lsa.lsa_stripe_off = strtol(optarg, &end, 0); - if (*end != '\0') { - fprintf(stderr, "error: %s: bad stripe offset " - "'%s'\n", argv[0], optarg); - goto error; - } - break; - case 'I': - comp_id = strtoul(optarg, &end, 0); - if (*end != '\0' || comp_id == 0 || - comp_id > LCME_ID_MAX) { - fprintf(stderr, "error: %s: bad comp ID " - "'%s'\n", argv[0], optarg); - goto error; - } - break; - case 'm': - if (!migrate_mode) { - fprintf(stderr, "--mdt-index is valid only for" - " migrate mode\n"); - goto error; - } - mdt_idx_arg = optarg; - break; - case 'n': - if (!migrate_mode) { - fprintf(stderr, "--non-block is valid only for" - " migrate mode\n"); - goto error; - } - migration_flags |= MIGRATION_NONBLOCK; - break; - case 'o': - lsa.lsa_nr_osts = parse_targets(osts, - sizeof(osts) / sizeof(__u32), - lsa.lsa_nr_osts, optarg); - if (lsa.lsa_nr_osts < 0) { - fprintf(stderr, - "error: %s: bad OST indices '%s'\n", - argv[0], optarg); - goto error; - } + fd = open(fname, O_RDWR); + if (fd < 0) { + fprintf(stderr, + "error %s: open file '%s' failed: %s\n", + progname, fname, strerror(errno)); + goto free_layout; + } - lsa.lsa_osts = osts; - if (lsa.lsa_stripe_off == -1) - lsa.lsa_stripe_off = osts[0]; - break; - case 'p': - if (optarg == NULL) - goto error; - lsa.lsa_pool_name = optarg; - break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - case 's': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 6, 53, 0) - fprintf(stderr, "warning: '--size|-s' deprecated, " - "use '--stripe-size|-S' instead\n"); -#endif -#endif /* LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) */ - case 'S': - result = llapi_parse_size(optarg, &lsa.lsa_stripe_size, - &size_units, 0); - if (result) { - fprintf(stderr, "error: %s: bad stripe size " - "'%s'\n", argv[0], optarg); - goto error; - } - break; - case 'v': - if (!migrate_mode) { - fprintf(stderr, "--verbose is valid only for" - " migrate mode\n"); - goto error; - } - migrate_mdt_param.fp_verbose = VERBOSE_DETAIL; - break; - default: - goto error; + /* get victim file directory pathname */ + if (strlen(fname) > sizeof(parent) - 1) { + fprintf(stderr, "error %s: file name of '%s' too long\n", + progname, fname); + rc = -ERANGE; + goto close_fd; + } + strncpy(parent, fname, sizeof(parent)); + ptr = strrchr(parent, '/'); + if (ptr == NULL) { + if (getcwd(parent, sizeof(parent)) == NULL) { + fprintf(stderr, "error %s: getcwd failed: %s\n", + progname, strerror(errno)); + rc = -errno; + goto close_fd; } + } else { + if (ptr == parent) + ptr = parent + 1; + *ptr = '\0'; } - fname = argv[optind]; + rc = llapi_file_fget_mdtidx(fd, &mdt_index); + if (rc < 0) { + fprintf(stderr, "%s: cannot get MDT index of '%s'\n", + progname, fname); + goto close_fd; + } - if (lsa.lsa_comp_end != 0) { - result = comp_args_to_layout(&layout, &lsa); - if (result) - goto error; + if (victim_file == NULL) { + /* use a temp file to store the splitted layout */ + if (mflags & MF_DESTROY) { + fdv = llapi_create_volatile_idx(parent, mdt_index, + O_LOV_DELAY_CREATE); + } else { + snprintf(victim, sizeof(victim), "%s.mirror~%u", + fname, mirror_id); + fdv = open(victim, flags, S_IRUSR | S_IWUSR); + } + } else { + /* user specified victim file */ + fdv = open(victim_file, flags, S_IRUSR | S_IWUSR); } - if (optind == argc) { - fprintf(stderr, "error: %s: missing filename|dirname\n", - argv[0]); - goto error; + if (fdv < 0) { + fprintf(stderr, + "error %s: create victim file failed: %s\n", + progname, strerror(errno)); + goto close_fd; } - /* Only LCME_FL_INIT flags is used in PFL, and it shouldn't be - * altered by user space tool, so we don't need to support the - * --component-set for this moment. */ - if (comp_set != 0) { - fprintf(stderr, "error: %s: --component-set isn't supported.\n", - argv[0]); - goto error; + /* get lease lock of fname */ + rc = llapi_lease_acquire(fd, LL_LEASE_WRLCK); + if (rc < 0) { + fprintf(stderr, + "error %s: cannot get lease of file '%s': %d\n", + progname, fname, rc); + goto close_victim; } - if ((delete + comp_set + comp_del + comp_add) > 1) { - fprintf(stderr, "error: %s: can't specify --component-set, " - "--component-del, --component-add or -d together\n", - argv[0]); - goto error; + /* Atomatically put lease, split layouts and close. */ + data = malloc(offsetof(typeof(*data), lil_ids[2])); + if (!data) { + rc = -ENOMEM; + goto close_victim; } - if (delete && (setstripe_args_specified(&lsa) || comp_id != 0 || - lsa.lsa_comp_flags != 0 || layout != NULL)) { - fprintf(stderr, "error: %s: can't specify -d with " - "-s, -c, -o, -p, -I, -F or -E options\n", - argv[0]); - goto error; + data->lil_mode = LL_LEASE_UNLCK; + data->lil_flags = LL_LEASE_LAYOUT_SPLIT; + data->lil_count = 2; + data->lil_ids[0] = fdv; + data->lil_ids[1] = mirror_id; + rc = llapi_lease_set(fd, data); + if (rc <= 0) { + if (rc == 0) /* lost lease lock */ + rc = -EBUSY; + fprintf(stderr, + "error %s: cannot split '%s': %s\n", + progname, fname, strerror(-rc)); + } else { + rc = 0; } + free(data); - if ((comp_set || comp_del) && - (setstripe_args_specified(&lsa) || layout != NULL)) { - fprintf(stderr, "error: %s: can't specify --component-del or " - "--component-set with -s, -c, -o, -p or -E options.\n", - argv[0]); - goto error; - } +close_victim: + close(fdv); +close_fd: + close(fd); +free_layout: + llapi_layout_free(layout); + return rc; +} - if (comp_del && comp_id != 0 && lsa.lsa_comp_flags != 0) { - fprintf(stderr, "error: %s: can't specify both -I and -F for " - "--component-del option.\n", argv[0]); - goto error; - } +/** + * Parse a string containing an target index list into an array of integers. + * + * The input string contains a comma delimited list of individual + * indices and ranges, for example "1,2-4,7". Add the indices into the + * \a tgts array and remove duplicates. + * + * \param[out] tgts array to store indices in + * \param[in] size size of \a tgts array + * \param[in] offset starting index in \a tgts + * \param[in] arg string containing OST index list + * + * \retval positive number of indices in \a tgts + * \retval -EINVAL unable to parse \a arg + */ +static int parse_targets(__u32 *tgts, int size, int offset, char *arg) +{ + int rc; + int nr = offset; + int slots = size - offset; + char *ptr = NULL; + bool end_of_loop; - if (comp_add || comp_del) { - struct stat st; + if (arg == NULL) + return -EINVAL; - result = lstat(fname, &st); - if (result == 0 && S_ISDIR(st.st_mode)) { - fprintf(stderr, "error: %s: can't use --component-add " - "or --component-del for directory.\n", - argv[0]); - goto error; - } - } + end_of_loop = false; + while (!end_of_loop) { + int start_index; + int end_index; + int i; + char *endptr = NULL; - if (comp_add) { - if (layout == NULL) { - fprintf(stderr, "error: %s: -E option must be present" - "in --component-add mode.\n", argv[0]); - goto error; - } - result = adjust_first_extent(fname, layout); - if (result == -ENODATA) - comp_add = 0; - else if (result != 0) - goto error; - } + rc = -EINVAL; - if (mdt_idx_arg != NULL && optind > 3) { - fprintf(stderr, "error: %s: cannot specify -m with other " - "options\n", argv[0]); - goto error; - } + ptr = strchrnul(arg, ','); - if ((migration_flags & MIGRATION_NONBLOCK) && migration_block) { - fprintf(stderr, - "error: %s: cannot specify --non-block and --block\n", - argv[0]); - goto error; - } + end_of_loop = *ptr == '\0'; + *ptr = '\0'; - if (!comp_del && !comp_set && comp_id != 0) { - fprintf(stderr, "error: %s: -I can only be used with " - "--component-del.\n", argv[0]); - goto error; - } + start_index = strtol(arg, &endptr, 0); + if (endptr == arg) /* no data at all */ + break; + if (*endptr != '-' && *endptr != '\0') /* has invalid data */ + break; - if (mdt_idx_arg != NULL) { - /* initialize migrate mdt parameters */ - migrate_mdt_param.fp_mdt_index = strtoul(mdt_idx_arg, &end, 0); - if (*end != '\0') { - fprintf(stderr, "error: %s: bad MDT index '%s'\n", - argv[0], mdt_idx_arg); - goto error; - } - migrate_mdt_param.fp_migrate = 1; - } else if (layout == NULL) { - /* initialize stripe parameters */ - param = calloc(1, offsetof(typeof(*param), - lsp_osts[lsa.lsa_nr_osts])); - if (param == NULL) { - fprintf(stderr, "error: %s: %s\n", argv[0], - strerror(ENOMEM)); - goto error; + end_index = start_index; + if (*endptr == '-') { + end_index = strtol(endptr + 1, &endptr, 0); + if (*endptr != '\0') + break; + if (end_index < start_index) + break; } - param->lsp_stripe_size = lsa.lsa_stripe_size; - param->lsp_stripe_offset = lsa.lsa_stripe_off; - param->lsp_stripe_count = lsa.lsa_stripe_count; - param->lsp_pool = lsa.lsa_pool_name; - param->lsp_is_specific = false; - if (lsa.lsa_nr_osts > 0) { - if (lsa.lsa_stripe_count > 0 && - lsa.lsa_nr_osts != lsa.lsa_stripe_count) { - fprintf(stderr, "error: %s: stripe count '%d' " - "doesn't match the number of OSTs: %d\n" - , argv[0], lsa.lsa_stripe_count, - lsa.lsa_nr_osts); - free(param); - goto error; - } - - param->lsp_is_specific = true; - param->lsp_stripe_count = lsa.lsa_nr_osts; - memcpy(param->lsp_osts, osts, - sizeof(*osts) * lsa.lsa_nr_osts); - } - } + for (i = start_index; i <= end_index && slots > 0; i++) { + int j; - for (fname = argv[optind]; fname != NULL; fname = argv[++optind]) { - char *op; - if (mdt_idx_arg != NULL) { - result = llapi_migrate_mdt(fname, &migrate_mdt_param); - op = "migrate mdt objects of"; - } else if (migrate_mode) { - result = lfs_migrate(fname, migration_flags, param, - layout); - op = "migrate ost objects of"; - } else if (comp_set != 0) { - result = lfs_component_set(fname, comp_id, - lsa.lsa_comp_flags); - op = "modify component flags of"; - } else if (comp_del != 0) { - result = lfs_component_del(fname, comp_id, - lsa.lsa_comp_flags); - op = "delete component of"; - } else if (comp_add != 0) { - result = lfs_component_add(fname, layout); - op = "add component to"; - } else if (layout != NULL) { - result = lfs_component_create(fname, O_CREAT | O_WRONLY, - 0644, layout); - if (result >= 0) { - close(result); - result = 0; + /* remove duplicate */ + for (j = 0; j < offset; j++) { + if (tgts[j] == i) + break; } - op = "create composite"; - } else { - result = llapi_file_open_param(fname, - O_CREAT | O_WRONLY, - 0644, param); - if (result >= 0) { - close(result); - result = 0; + if (j == offset) { /* no duplicate */ + tgts[nr++] = i; + --slots; } - op = "create striped"; - } - if (result) { - /* Save the first error encountered. */ - if (result2 == 0) - result2 = result; - fprintf(stderr, "error: %s: %s file '%s' failed: %s\n", - argv[0], op, fname, - lsa.lsa_pool_name != NULL && result == EINVAL ? - "OST not in pool?" : strerror(errno)); - continue; } + if (slots == 0 && i < end_index) + break; + + *ptr = ','; + arg = ++ptr; + offset = nr; + rc = 0; } + if (!end_of_loop && ptr != NULL) + *ptr = ','; - free(param); - llapi_layout_free(layout); - return result2; -error: - llapi_layout_free(layout); - return CMD_HELP; + return rc < 0 ? rc : nr; } -static int lfs_poollist(int argc, char **argv) -{ - if (argc != 2) - return CMD_HELP; - - return llapi_poollist(argv[1]); -} +struct lfs_setstripe_args { + unsigned long long lsa_comp_end; + unsigned long long lsa_stripe_size; + long long lsa_stripe_count; + long long lsa_stripe_off; + __u32 lsa_comp_flags; + __u32 lsa_comp_neg_flags; + unsigned long long lsa_pattern; + unsigned int lsa_mirror_count; + int lsa_nr_tgts; + bool lsa_first_comp; + __u32 *lsa_tgts; + char *lsa_pool_name; +}; -static int set_time(time_t *time, time_t *set, char *str) +static inline void setstripe_args_init(struct lfs_setstripe_args *lsa) { - time_t t; - int res = 0; - - if (str[0] == '+') - res = 1; - else if (str[0] == '-') - res = -1; - - if (res) - str++; - - t = strtol(str, NULL, 0); - if (*time < t * 24 * 60 * 60) { - if (res) - str--; - fprintf(stderr, "Wrong time '%s' is specified.\n", str); - return INT_MAX; - } + unsigned int mirror_count = lsa->lsa_mirror_count; + bool first_comp = lsa->lsa_first_comp; - *set = *time - t * 24 * 60 * 60; - return res; -} -static int name2uid(unsigned int *id, const char *name) -{ - struct passwd *passwd; + memset(lsa, 0, sizeof(*lsa)); - passwd = getpwnam(name); - if (passwd == NULL) - return -ENOENT; - *id = passwd->pw_uid; + lsa->lsa_stripe_size = LLAPI_LAYOUT_DEFAULT; + lsa->lsa_stripe_count = LLAPI_LAYOUT_DEFAULT; + lsa->lsa_stripe_off = LLAPI_LAYOUT_DEFAULT; + lsa->lsa_pattern = LLAPI_LAYOUT_RAID0; + lsa->lsa_pool_name = NULL; - return 0; + lsa->lsa_mirror_count = mirror_count; + lsa->lsa_first_comp = first_comp; } -static int name2gid(unsigned int *id, const char *name) +/** + * setstripe_args_init_inherit() - Initialize and inherit stripe options. + * @lsa: Stripe options to be initialized and inherited. + * + * This function initializes stripe options in @lsa and inherit + * stripe_size, stripe_count and OST pool_name options. + * + * Return: void. + */ +static inline void setstripe_args_init_inherit(struct lfs_setstripe_args *lsa) { - struct group *group; + unsigned long long stripe_size; + long long stripe_count; + char *pool_name = NULL; - group = getgrnam(name); - if (group == NULL) - return -ENOENT; - *id = group->gr_gid; + stripe_size = lsa->lsa_stripe_size; + stripe_count = lsa->lsa_stripe_count; + pool_name = lsa->lsa_pool_name; - return 0; -} + setstripe_args_init(lsa); -static inline int name2projid(unsigned int *id, const char *name) -{ - return -ENOTSUP; + lsa->lsa_stripe_size = stripe_size; + lsa->lsa_stripe_count = stripe_count; + lsa->lsa_pool_name = pool_name; } -static int uid2name(char **name, unsigned int id) +static inline bool setstripe_args_specified(struct lfs_setstripe_args *lsa) { - struct passwd *passwd; - - passwd = getpwuid(id); - if (passwd == NULL) - return -ENOENT; - *name = passwd->pw_name; - - return 0; + return (lsa->lsa_stripe_size != LLAPI_LAYOUT_DEFAULT || + lsa->lsa_stripe_count != LLAPI_LAYOUT_DEFAULT || + lsa->lsa_stripe_off != LLAPI_LAYOUT_DEFAULT || + lsa->lsa_pattern != LLAPI_LAYOUT_RAID0 || + lsa->lsa_pool_name != NULL || + lsa->lsa_comp_end != 0); } -static inline int gid2name(char **name, unsigned int id) +/** + * comp_args_to_layout() - Create or extend a composite layout. + * @composite: Pointer to the composite layout. + * @lsa: Stripe options for the new component. + * + * This function creates or extends a composite layout by adding a new + * component with stripe options from @lsa. + * + * Return: 0 on success or an error code on failure. + */ +static int comp_args_to_layout(struct llapi_layout **composite, + struct lfs_setstripe_args *lsa, + bool set_extent) { - struct group *group; + struct llapi_layout *layout = *composite; + uint64_t prev_end = 0; + int i = 0, rc; - group = getgrgid(id); - if (group == NULL) - return -ENOENT; - *name = group->gr_name; + if (layout == NULL) { + layout = llapi_layout_alloc(); + if (layout == NULL) { + fprintf(stderr, "Alloc llapi_layout failed. %s\n", + strerror(errno)); + return -ENOMEM; + } + *composite = layout; + } else { + uint64_t start; - return 0; -} + /* Get current component extent, current component + * must be the tail component. */ + rc = llapi_layout_comp_extent_get(layout, &start, &prev_end); + if (rc) { + fprintf(stderr, "Get comp extent failed. %s\n", + strerror(errno)); + return rc; + } -static int name2layout(__u32 *layout, char *name) -{ - char *ptr, *layout_name; + if (lsa->lsa_first_comp) + prev_end = 0; - *layout = 0; - for (ptr = name; ; ptr = NULL) { - layout_name = strtok(ptr, ","); - if (layout_name == NULL) - break; - if (strcmp(layout_name, "released") == 0) - *layout |= LOV_PATTERN_F_RELEASED; - else if (strcmp(layout_name, "raid0") == 0) - *layout |= LOV_PATTERN_RAID0; - else if (strcmp(layout_name, "mdt") == 0) - *layout |= LOV_PATTERN_MDT; + if (lsa->lsa_first_comp) + rc = llapi_layout_add_first_comp(layout); else - return -1; + rc = llapi_layout_comp_add(layout); + if (rc) { + fprintf(stderr, "Add component failed. %s\n", + strerror(errno)); + return rc; + } + } + /* reset lsa_first_comp */ + lsa->lsa_first_comp = false; + + if (set_extent) { + rc = llapi_layout_comp_extent_set(layout, prev_end, + lsa->lsa_comp_end); + if (rc) { + fprintf(stderr, "Set extent [%lu, %llu) failed. %s\n", + prev_end, lsa->lsa_comp_end, strerror(errno)); + return rc; + } + } + + /* Data-on-MDT component setting */ + if (lsa->lsa_pattern == LLAPI_LAYOUT_MDT) { + /* In case of Data-on-MDT patterns the only extra option + * applicable is stripe size option. */ + if (lsa->lsa_stripe_count != LLAPI_LAYOUT_DEFAULT) { + fprintf(stderr, "Option 'stripe-count' can't be " + "specified with Data-on-MDT component: %lld\n", + lsa->lsa_stripe_count); + return -EINVAL; + } + if (lsa->lsa_stripe_size != LLAPI_LAYOUT_DEFAULT) { + fprintf(stderr, "Option 'stripe-size' can't be " + "specified with Data-on-MDT component: %llu\n", + lsa->lsa_stripe_size); + return -EINVAL; + } + if (lsa->lsa_nr_tgts != 0) { + fprintf(stderr, "Option 'ost-list' can't be specified " + "with Data-on-MDT component: '%i'\n", + lsa->lsa_nr_tgts); + return -EINVAL; + } + if (lsa->lsa_stripe_off != LLAPI_LAYOUT_DEFAULT) { + fprintf(stderr, "Option 'stripe-offset' can't be " + "specified with Data-on-MDT component: %lld\n", + lsa->lsa_stripe_off); + return -EINVAL; + } + if (lsa->lsa_pool_name != 0) { + fprintf(stderr, "Option 'pool' can't be specified " + "with Data-on-MDT component: '%s'\n", + lsa->lsa_pool_name); + return -EINVAL; + } + + rc = llapi_layout_pattern_set(layout, lsa->lsa_pattern); + if (rc) { + fprintf(stderr, "Set stripe pattern %#llx failed. %s\n", + lsa->lsa_pattern, strerror(errno)); + return rc; + } + /* Data-on-MDT component has always single stripe up to end */ + lsa->lsa_stripe_size = lsa->lsa_comp_end; + } + + rc = llapi_layout_stripe_size_set(layout, lsa->lsa_stripe_size); + if (rc) { + fprintf(stderr, "Set stripe size %llu failed: %s\n", + lsa->lsa_stripe_size, strerror(errno)); + return rc; + } + + rc = llapi_layout_stripe_count_set(layout, lsa->lsa_stripe_count); + if (rc) { + fprintf(stderr, "Set stripe count %lld failed: %s\n", + lsa->lsa_stripe_count, strerror(errno)); + return rc; + } + + rc = llapi_layout_comp_flags_set(layout, lsa->lsa_comp_flags); + if (rc) { + fprintf(stderr, "Set flags 0x%x failed: %s\n", + lsa->lsa_comp_flags, strerror(errno)); + return rc; + } + + if (lsa->lsa_pool_name != NULL) { + rc = llapi_layout_pool_name_set(layout, lsa->lsa_pool_name); + if (rc) { + fprintf(stderr, "Set pool name: %s failed. %s\n", + lsa->lsa_pool_name, strerror(errno)); + return rc; + } + } else { + rc = llapi_layout_pool_name_set(layout, ""); + if (rc) { + fprintf(stderr, "Clear pool name failed: %s\n", + strerror(errno)); + return rc; + } + } + + if (lsa->lsa_nr_tgts > 0) { + if (lsa->lsa_stripe_count > 0 && + lsa->lsa_stripe_count != LLAPI_LAYOUT_DEFAULT && + lsa->lsa_stripe_count != LLAPI_LAYOUT_WIDE && + lsa->lsa_nr_tgts != lsa->lsa_stripe_count) { + fprintf(stderr, "stripe_count(%lld) != nr_tgts(%d)\n", + lsa->lsa_stripe_count, lsa->lsa_nr_tgts); + return -EINVAL; + } + for (i = 0; i < lsa->lsa_nr_tgts; i++) { + rc = llapi_layout_ost_index_set(layout, i, + lsa->lsa_tgts[i]); + if (rc) + break; + } + } else if (lsa->lsa_stripe_off != LLAPI_LAYOUT_DEFAULT && + lsa->lsa_stripe_off != -1) { + rc = llapi_layout_ost_index_set(layout, 0, lsa->lsa_stripe_off); + } + if (rc) { + fprintf(stderr, "Set ost index %d failed. %s\n", + i, strerror(errno)); + return rc; } + return 0; } -static int lfs_find(int argc, char **argv) +static int build_component(struct llapi_layout **layout, + struct lfs_setstripe_args *lsa, bool set_extent) { - int c, rc; - int ret = 0; - time_t t; - struct find_param param = { - .fp_max_depth = -1, - .fp_quiet = 1, - }; - struct option long_opts[] = { - { .val = 'A', .name = "atime", .has_arg = required_argument }, - { .val = LFS_COMP_COUNT_OPT, - .name = "comp-count", .has_arg = required_argument }, - { .val = LFS_COMP_COUNT_OPT, - .name = "component-count", - .has_arg = required_argument }, - { .val = LFS_COMP_FLAGS_OPT, - .name = "comp-flags", .has_arg = required_argument }, - { .val = LFS_COMP_FLAGS_OPT, - .name = "component-flags", - .has_arg = required_argument }, - { .val = LFS_COMP_START_OPT, - .name = "comp-start", .has_arg = required_argument }, - { .val = LFS_COMP_START_OPT, - .name = "component-start", - .has_arg = required_argument }, - { .val = 'c', .name = "stripe-count", .has_arg = required_argument }, - { .val = 'c', .name = "stripe_count", .has_arg = required_argument }, - { .val = 'C', .name = "ctime", .has_arg = required_argument }, - { .val = 'D', .name = "maxdepth", .has_arg = required_argument }, - { .val = 'E', .name = "comp-end", .has_arg = required_argument }, - { .val = 'E', .name = "component-end", - .has_arg = required_argument }, - { .val = 'g', .name = "gid", .has_arg = required_argument }, - { .val = 'G', .name = "group", .has_arg = required_argument }, - { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }, - { .val = 'i', .name = "stripe-index", .has_arg = required_argument }, - { .val = 'i', .name = "stripe_index", .has_arg = required_argument }, - /*{"component-id", required_argument, 0, 'I'},*/ - { .val = 'L', .name = "layout", .has_arg = required_argument }, - { .val = 'm', .name = "mdt", .has_arg = required_argument }, - { .val = 'm', .name = "mdt-index", .has_arg = required_argument }, - { .val = 'm', .name = "mdt_index", .has_arg = required_argument }, - { .val = 'M', .name = "mtime", .has_arg = required_argument }, - { .val = 'n', .name = "name", .has_arg = required_argument }, - /* reserve {"or", no_argument, , 0, 'o'}, to match find(1) */ - { .val = 'O', .name = "obd", .has_arg = required_argument }, - { .val = 'O', .name = "ost", .has_arg = required_argument }, - /* no short option for pool, p/P already used */ - { .val = LFS_POOL_OPT, - .name = "pool", .has_arg = required_argument }, - { .val = 'p', .name = "print0", .has_arg = no_argument }, - { .val = 'P', .name = "print", .has_arg = no_argument }, - { .val = LFS_PROJID_OPT, - .name = "projid", .has_arg = required_argument }, - { .val = 's', .name = "size", .has_arg = required_argument }, - { .val = 'S', .name = "stripe-size", .has_arg = required_argument }, - { .val = 'S', .name = "stripe_size", .has_arg = required_argument }, - { .val = 't', .name = "type", .has_arg = required_argument }, - { .val = 'T', .name = "mdt-count", .has_arg = required_argument }, - { .val = 'u', .name = "uid", .has_arg = required_argument }, - { .val = 'U', .name = "user", .has_arg = required_argument }, - { .name = NULL } }; - int pathstart = -1; - int pathend = -1; - int neg_opt = 0; - time_t *xtime; - int *xsign; - int isoption; - char *endptr; + int rc; - time(&t); + rc = comp_args_to_layout(layout, lsa, set_extent); + if (rc) + return rc; - /* when getopt_long_only() hits '!' it returns 1, puts "!" in optarg */ - while ((c = getopt_long_only(argc, argv, - "-A:c:C:D:E:g:G:H:i:L:m:M:n:O:Ppqrs:S:t:T:u:U:v", - long_opts, NULL)) >= 0) { - xtime = NULL; - xsign = NULL; - if (neg_opt) - --neg_opt; - /* '!' is part of option */ - /* when getopt_long_only() finds a string which is not - * an option nor a known option argument it returns 1 - * in that case if we already have found pathstart and pathend - * (i.e. we have the list of pathnames), - * the only supported value is "!" - */ - isoption = (c != 1) || (strcmp(optarg, "!") == 0); - if (!isoption && pathend != -1) { - fprintf(stderr, "err: %s: filename|dirname must either " - "precede options or follow options\n", - argv[0]); - ret = CMD_HELP; - goto err; - } - if (!isoption && pathstart == -1) - pathstart = optind - 1; - if (isoption && pathstart != -1 && pathend == -1) - pathend = optind - 2; - switch (c) { - case 0: - /* Long options. */ - break; - case 1: - /* unknown; opt is "!" or path component, - * checking done above. - */ - if (strcmp(optarg, "!") == 0) - neg_opt = 2; - break; - case 'A': - xtime = ¶m.fp_atime; - xsign = ¶m.fp_asign; - param.fp_exclude_atime = !!neg_opt; - /* no break, this falls through to 'C' for ctime */ - case 'C': - if (c == 'C') { - xtime = ¶m.fp_ctime; - xsign = ¶m.fp_csign; - param.fp_exclude_ctime = !!neg_opt; - } - /* no break, this falls through to 'M' for mtime */ - case 'M': - if (c == 'M') { - xtime = ¶m.fp_mtime; - xsign = ¶m.fp_msign; - param.fp_exclude_mtime = !!neg_opt; + if (lsa->lsa_mirror_count > 0) { + rc = llapi_layout_mirror_count_set(*layout, + lsa->lsa_mirror_count); + if (rc) + return rc; + + rc = llapi_layout_flags_set(*layout, LCM_FL_RDONLY); + if (rc) + return rc; + lsa->lsa_mirror_count = 0; + } + + return rc; +} + +static int build_layout_from_yaml_node(struct cYAML *node, + struct llapi_layout **layout, + struct lfs_setstripe_args *lsa, + __u32 *osts) +{ + char *string; + int rc = 0; + + while (node) { + string = node->cy_string; + /* skip leading lmm_ if present, to simplify parsing */ + if (string != NULL && strncmp(string, "lmm_", 4) == 0) + string += 4; + + if (node->cy_type == CYAML_TYPE_STRING) { + if (!strcmp(string, "lcme_extent.e_end")) { + if (!strcmp(node->cy_valuestring, "EOF") || + !strcmp(node->cy_valuestring, "eof")) + lsa->lsa_comp_end = LUSTRE_EOF; + } else if (!strcmp(string, "pool")) { + lsa->lsa_pool_name = node->cy_valuestring; + } else if (!strcmp(string, "pattern")) { + if (!strcmp(node->cy_valuestring, "mdt")) + lsa->lsa_pattern = LLAPI_LAYOUT_MDT; } - rc = set_time(&t, xtime, optarg); - if (rc == INT_MAX) { - ret = -1; - goto err; + } else if (node->cy_type == CYAML_TYPE_NUMBER) { + if (!strcmp(string, "lcm_mirror_count")) { + lsa->lsa_mirror_count = node->cy_valueint; + } else if (!strcmp(string, "lcme_extent.e_start")) { + if (node->cy_valueint != 0 || *layout != NULL) { + rc = build_component(layout, lsa, true); + if (rc) + return rc; + } + + if (node->cy_valueint == 0) + lsa->lsa_first_comp = true; + + /* initialize lsa */ + setstripe_args_init(lsa); + lsa->lsa_tgts = osts; + } else if (!strcmp(string, "lcme_extent.e_end")) { + if (node->cy_valueint == -1) + lsa->lsa_comp_end = LUSTRE_EOF; + else + lsa->lsa_comp_end = node->cy_valueint; + } else if (!strcmp(string, "stripe_count")) { + lsa->lsa_stripe_count = node->cy_valueint; + } else if (!strcmp(string, "stripe_size")) { + lsa->lsa_stripe_size = node->cy_valueint; + } else if (!strcmp(string, "stripe_offset")) { + lsa->lsa_stripe_off = node->cy_valueint; + } else if (!strcmp(string, "l_ost_idx")) { + osts[lsa->lsa_nr_tgts] = node->cy_valueint; + lsa->lsa_nr_tgts++; } + } else if (node->cy_type == CYAML_TYPE_OBJECT) { + /* go deep to sub blocks */ + rc = build_layout_from_yaml_node(node->cy_child, layout, + lsa, osts); if (rc) - *xsign = rc; - break; - case LFS_COMP_COUNT_OPT: - if (optarg[0] == '+') { - param.fp_comp_count_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_comp_count_sign = 1; - optarg++; - } + return rc; + } + node = node->cy_next; + } - param.fp_comp_count = strtoul(optarg, &endptr, 0); - if (*endptr != '\0') { - fprintf(stderr, "error: bad component count " - "'%s'\n", optarg); - goto err; - } - param.fp_check_comp_count = 1; - param.fp_exclude_comp_count = !!neg_opt; - break; - case LFS_COMP_FLAGS_OPT: - rc = comp_str2flags(¶m.fp_comp_flags, optarg); - if (rc || comp_flags_is_neg(param.fp_comp_flags)) { - fprintf(stderr, "error: bad component flags " - "'%s'\n", optarg); + return rc; +} + +static int lfs_comp_create_from_yaml(char *template, + struct llapi_layout **layout, + struct lfs_setstripe_args *lsa, + __u32 *osts) +{ + struct cYAML *tree = NULL, *err_rc = NULL; + int rc = 0; + + tree = cYAML_build_tree(template, NULL, 0, &err_rc, false); + if (!tree) { + fprintf(stderr, "%s: cannot parse YAML file %s\n", + progname, template); + cYAML_build_error(-EINVAL, -1, "yaml", "from comp yaml", + "can't parse", &err_rc); + cYAML_print_tree2file(stderr, err_rc); + cYAML_free_tree(err_rc); + rc = -EINVAL; + goto err; + } + + /* initialize lsa for plain file */ + setstripe_args_init(lsa); + lsa->lsa_tgts = osts; + + rc = build_layout_from_yaml_node(tree, layout, lsa, osts); + if (rc) { + fprintf(stderr, "%s: cannot build layout from YAML file %s.\n", + progname, template); + goto err; + } else { + rc = build_component(layout, lsa, *layout != NULL); + } + /* clean clean lsa */ + setstripe_args_init(lsa); + +err: + if (tree) + cYAML_free_tree(tree); + return rc; +} + +/* In 'lfs setstripe --component-add' mode, we need to fetch the extent + * end of the last component in the existing file, and adjust the + * first extent start of the components to be added accordingly. */ +static int adjust_first_extent(char *fname, struct llapi_layout *layout) +{ + struct llapi_layout *head; + uint64_t start, end, stripe_size, prev_end = 0; + int rc; + + if (layout == NULL) { + fprintf(stderr, + "%s setstripe: layout must be specified\n", + progname); + return -EINVAL; + } + + errno = 0; + head = llapi_layout_get_by_path(fname, 0); + if (head == NULL) { + fprintf(stderr, + "%s setstripe: cannot read layout from '%s': %s\n", + progname, fname, strerror(errno)); + return -EINVAL; + } else if (errno == ENODATA) { + /* file without LOVEA, this component-add will be turned + * into a component-create. */ + llapi_layout_free(head); + return -ENODATA; + } else if (!llapi_layout_is_composite(head)) { + fprintf(stderr, "%s setstripe: '%s' not a composite file\n", + progname, fname); + llapi_layout_free(head); + return -EINVAL; + } + + rc = llapi_layout_comp_extent_get(head, &start, &prev_end); + if (rc) { + fprintf(stderr, "%s setstripe: cannot get prev extent: %s\n", + progname, strerror(errno)); + llapi_layout_free(head); + return rc; + } + + llapi_layout_free(head); + + /* Make sure we use the first component of the layout to be added. */ + rc = llapi_layout_comp_use(layout, LLAPI_LAYOUT_COMP_USE_FIRST); + if (rc < 0) { + fprintf(stderr, + "%s setstripe: cannot move component cursor: %s\n", + progname, strerror(errno)); + return rc; + } + + rc = llapi_layout_comp_extent_get(layout, &start, &end); + if (rc) { + fprintf(stderr, "%s setstripe: cannot get extent: %s\n", + progname, strerror(errno)); + return rc; + } + + if (start > prev_end || end <= prev_end) { + fprintf(stderr, + "%s setstripe: first extent [%lu, %lu) not adjacent with extent end %lu\n", + progname, start, end, prev_end); + return -EINVAL; + } + + rc = llapi_layout_stripe_size_get(layout, &stripe_size); + if (rc) { + fprintf(stderr, "%s setstripe: cannot get stripe size: %s\n", + progname, strerror(errno)); + return rc; + } + + if (stripe_size != LLAPI_LAYOUT_DEFAULT && + (prev_end & (stripe_size - 1))) { + fprintf(stderr, + "%s setstripe: stripe size %lu not aligned with %lu\n", + progname, stripe_size, prev_end); + return -EINVAL; + } + + rc = llapi_layout_comp_extent_set(layout, prev_end, end); + if (rc) { + fprintf(stderr, + "%s setstripe: cannot set component extent [%lu, %lu): %s\n", + progname, prev_end, end, strerror(errno)); + return rc; + } + + return 0; +} + +static inline bool arg_is_eof(char *arg) +{ + return !strncmp(arg, "-1", strlen("-1")) || + !strncmp(arg, "EOF", strlen("EOF")) || + !strncmp(arg, "eof", strlen("eof")); +} + +/** + * lfs_mirror_alloc() - Allocate a mirror argument structure. + * + * Return: Valid mirror_args pointer on success and + * NULL if memory allocation fails. + */ +static struct mirror_args *lfs_mirror_alloc(void) +{ + struct mirror_args *mirror = NULL; + + while (1) { + mirror = calloc(1, sizeof(*mirror)); + if (mirror != NULL) + break; + + sleep(1); + } + + return mirror; +} + +/** + * lfs_mirror_free() - Free memory allocated for a mirror argument + * structure. + * @mirror: Previously allocated mirror argument structure by + * lfs_mirror_alloc(). + * + * Free memory allocated for @mirror. + * + * Return: void. + */ +static void lfs_mirror_free(struct mirror_args *mirror) +{ + if (mirror->m_layout != NULL) + llapi_layout_free(mirror->m_layout); + free(mirror); +} + +/** + * lfs_mirror_list_free() - Free memory allocated for a mirror list. + * @mirror_list: Previously allocated mirror list. + * + * Free memory allocated for @mirror_list. + * + * Return: void. + */ +static void lfs_mirror_list_free(struct mirror_args *mirror_list) +{ + struct mirror_args *next_mirror = NULL; + + while (mirror_list != NULL) { + next_mirror = mirror_list->m_next; + lfs_mirror_free(mirror_list); + mirror_list = next_mirror; + } +} + +enum { + LFS_POOL_OPT = 3, + LFS_COMP_COUNT_OPT, + LFS_COMP_START_OPT, + LFS_COMP_FLAGS_OPT, + LFS_COMP_DEL_OPT, + LFS_COMP_SET_OPT, + LFS_COMP_ADD_OPT, + LFS_COMP_NO_VERIFY_OPT, + LFS_PROJID_OPT, + LFS_MIRROR_FLAGS_OPT, + LFS_MIRROR_ID_OPT, + LFS_MIRROR_STATE_OPT, + LFS_LAYOUT_COPY, +}; + +/* functions */ +static int lfs_setstripe_internal(int argc, char **argv, + enum setstripe_origin opc) +{ + struct lfs_setstripe_args lsa = { 0 }; + struct llapi_stripe_param *param = NULL; + struct find_param migrate_mdt_param = { + .fp_max_depth = -1, + .fp_mdt_index = -1, + }; + char *fname; + int result = 0; + int result2 = 0; + char *end; + int c; + int delete = 0; + char *mdt_idx_arg = NULL; + unsigned long long size_units = 1; + bool migrate_mode = false; + bool migration_block = false; + __u64 migration_flags = 0; + __u32 osts[LOV_MAX_STRIPE_COUNT] = { 0 }; + int comp_del = 0, comp_set = 0; + int comp_add = 0; + __u32 comp_id = 0; + struct llapi_layout *layout = NULL; + struct llapi_layout **lpp = &layout; + bool mirror_mode = false; + bool has_m_file = false; + __u32 mirror_count = 0; + enum mirror_flags mirror_flags = 0; + struct mirror_args *mirror_list = NULL; + struct mirror_args *new_mirror = NULL; + struct mirror_args *last_mirror = NULL; + __u16 mirror_id = 0; + char cmd[PATH_MAX]; + bool from_yaml = false; + bool from_copy = false; + char *template = NULL; + + struct option long_opts[] = { +/* find { .val = 'A', .name = "atime", .has_arg = required_argument }*/ + /* --block is only valid in migrate mode */ + { .val = 'b', .name = "block", .has_arg = no_argument }, + { .val = LFS_COMP_ADD_OPT, + .name = "comp-add", .has_arg = no_argument }, + { .val = LFS_COMP_ADD_OPT, + .name = "component-add", .has_arg = no_argument }, + { .val = LFS_COMP_DEL_OPT, + .name = "comp-del", .has_arg = no_argument }, + { .val = LFS_COMP_DEL_OPT, + .name = "component-del", .has_arg = no_argument }, + { .val = LFS_COMP_FLAGS_OPT, + .name = "comp-flags", .has_arg = required_argument }, + { .val = LFS_COMP_FLAGS_OPT, + .name = "component-flags", + .has_arg = required_argument }, + { .val = LFS_COMP_SET_OPT, + .name = "comp-set", .has_arg = no_argument }, + { .val = LFS_COMP_SET_OPT, + .name = "component-set", + .has_arg = no_argument}, + { .val = LFS_COMP_NO_VERIFY_OPT, + .name = "no-verify", .has_arg = no_argument}, + { .val = LFS_MIRROR_FLAGS_OPT, + .name = "flags", .has_arg = required_argument}, + { .val = LFS_MIRROR_ID_OPT, + .name = "mirror-id", .has_arg = required_argument}, + { .val = LFS_LAYOUT_COPY, + .name = "copy", .has_arg = required_argument}, + { .val = 'c', .name = "stripe-count", .has_arg = required_argument}, + { .val = 'c', .name = "stripe_count", .has_arg = required_argument}, +/* find { .val = 'C', .name = "ctime", .has_arg = required_argument }*/ + { .val = 'd', .name = "delete", .has_arg = no_argument}, + { .val = 'd', .name = "destroy", .has_arg = no_argument}, + /* --non-direct is only valid in migrate mode */ + { .val = 'D', .name = "non-direct", .has_arg = no_argument }, + { .val = 'E', .name = "comp-end", .has_arg = required_argument}, + { .val = 'E', .name = "component-end", + .has_arg = required_argument}, + { .val = 'f', .name = "file", .has_arg = required_argument }, +/* find { .val = 'F', .name = "fid", .has_arg = no_argument }, */ +/* find { .val = 'g', .name = "gid", .has_arg = no_argument }, */ +/* find { .val = 'G', .name = "group", .has_arg = required_argument }*/ +/* dirstripe { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }*/ + { .val = 'i', .name = "stripe-index", .has_arg = required_argument}, + { .val = 'i', .name = "stripe_index", .has_arg = required_argument}, + { .val = 'I', .name = "comp-id", .has_arg = required_argument}, + { .val = 'I', .name = "component-id", .has_arg = required_argument}, + { .val = 'L', .name = "layout", .has_arg = required_argument }, + { .val = 'm', .name = "mdt", .has_arg = required_argument}, + { .val = 'm', .name = "mdt-index", .has_arg = required_argument}, + { .val = 'm', .name = "mdt_index", .has_arg = required_argument}, + /* --non-block is only valid in migrate mode */ + { .val = 'n', .name = "non-block", .has_arg = no_argument }, + { .val = 'N', .name = "mirror-count", .has_arg = optional_argument}, + { .val = 'o', .name = "ost", .has_arg = required_argument }, +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + { .val = 'o', .name = "ost-list", .has_arg = required_argument }, + { .val = 'o', .name = "ost_list", .has_arg = required_argument }, +#endif + { .val = 'p', .name = "pool", .has_arg = required_argument }, +/* find { .val = 'P', .name = "print", .has_arg = no_argument }, */ +/* getstripe { .val = 'q', .name = "quiet", .has_arg = no_argument }, */ +/* getstripe { .val = 'r', .name = "recursive", .has_arg = no_argument }, */ +/* getstripe { .val = 'R', .name = "raw", .has_arg = no_argument }, */ + { .val = 'S', .name = "stripe-size", .has_arg = required_argument }, + { .val = 'S', .name = "stripe_size", .has_arg = required_argument }, +/* find { .val = 't', .name = "type", .has_arg = required_argument }*/ +/* dirstripe { .val = 'T', .name = "mdt-count", .has_arg = required_argument }*/ +/* find { .val = 'u', .name = "uid", .has_arg = required_argument }*/ +/* find { .val = 'U', .name = "user", .has_arg = required_argument }*/ + /* --verbose is only valid in migrate mode */ + { .val = 'v', .name = "verbose", .has_arg = no_argument}, + { .val = 'y', .name = "yaml", .has_arg = required_argument }, + { .name = NULL } }; + + setstripe_args_init(&lsa); + + migrate_mode = (opc == SO_MIGRATE); + mirror_mode = (opc == SO_MIRROR_CREATE || opc == SO_MIRROR_EXTEND); + + snprintf(cmd, sizeof(cmd), "%s %s", progname, argv[0]); + progname = cmd; + while ((c = getopt_long(argc, argv, "bc:dDE:f:i:I:m:N::no:p:L:s:S:vy:", + long_opts, NULL)) >= 0) { + switch (c) { + case 0: + /* Long options. */ + break; + case LFS_COMP_ADD_OPT: + comp_add = 1; + break; + case LFS_COMP_DEL_OPT: + comp_del = 1; + break; + case LFS_COMP_FLAGS_OPT: + result = comp_str2flags(optarg, &lsa.lsa_comp_flags, + &lsa.lsa_comp_neg_flags); + if (result != 0) + goto usage_error; + if (mirror_mode && lsa.lsa_comp_neg_flags) { + fprintf(stderr, "%s: inverted flags are not supported\n", + progname); + goto usage_error; + } + if (lsa.lsa_comp_neg_flags & LCME_FL_STALE) { + fprintf(stderr, + "%s: cannot clear 'stale' flags from component. Please use lfs-mirror-resync(1) instead\n", + progname); + result = -EINVAL; + goto error; + } + + break; + case LFS_COMP_SET_OPT: + comp_set = 1; + break; + case LFS_COMP_NO_VERIFY_OPT: + mirror_flags |= MF_NO_VERIFY; + break; + case LFS_MIRROR_ID_OPT: + mirror_id = strtoul(optarg, &end, 0); + if (*end != '\0' || mirror_id == 0) { + fprintf(stderr, + "%s %s: invalid mirror ID '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + break; + case LFS_MIRROR_FLAGS_OPT: { + __u32 flags; + + if (!mirror_mode || !last_mirror) { + fprintf(stderr, "error: %s: --flags must be specified with --mirror-count|-N option\n", + progname); + goto usage_error; + } + + result = comp_str2flags(optarg, &last_mirror->m_flags, + &flags); + if (result != 0) + goto usage_error; + + if (flags) { + fprintf(stderr, "%s: inverted flags are not supported\n", + progname); + result = -EINVAL; + goto usage_error; + } + if (last_mirror->m_flags & ~LCME_USER_FLAGS) { + fprintf(stderr, + "%s: unsupported mirror flags: %s\n", + progname, optarg); + result = -EINVAL; + goto error; + } + break; + } + case LFS_LAYOUT_COPY: + from_copy = true; + template = optarg; + break; + case 'b': + if (!migrate_mode) { + fprintf(stderr, + "%s %s: -b|--block valid only for migrate command\n", + progname, argv[0]); + goto usage_error; + } + migration_block = true; + break; + case 'c': + lsa.lsa_stripe_count = strtoul(optarg, &end, 0); + if (*end != '\0') { + fprintf(stderr, + "%s %s: invalid stripe count '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + + if (lsa.lsa_stripe_count == -1) + lsa.lsa_stripe_count = LLAPI_LAYOUT_WIDE; + break; + case 'd': + /* delete the default striping pattern */ + delete = 1; + if (opc == SO_MIRROR_SPLIT) { + if (has_m_file) { + fprintf(stderr, + "%s %s: -d cannot used with -f\n", + progname, argv[0]); + goto usage_error; + } + mirror_flags |= MF_DESTROY; + } + break; + case 'D': + if (!migrate_mode) { + fprintf(stderr, + "%s %s: -D|--non-direct is valid " + "only for migrate command\n", + progname, argv[0]); + goto usage_error; + } + migration_flags |= MIGRATION_NONDIRECT; + break; + case 'E': + if (lsa.lsa_comp_end != 0) { + result = comp_args_to_layout(lpp, &lsa, true); + if (result) { + fprintf(stderr, + "%s %s: invalid layout\n", + progname, argv[0]); + goto usage_error; + } + + setstripe_args_init_inherit(&lsa); + } + + if (arg_is_eof(optarg)) { + lsa.lsa_comp_end = LUSTRE_EOF; + } else { + result = llapi_parse_size(optarg, + &lsa.lsa_comp_end, + &size_units, 0); + if (result) { + fprintf(stderr, + "%s %s: invalid component end '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + } + break; + case 'i': + lsa.lsa_stripe_off = strtol(optarg, &end, 0); + if (*end != '\0') { + fprintf(stderr, + "%s %s: invalid stripe offset '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + if (lsa.lsa_stripe_off == -1) + lsa.lsa_stripe_off = LLAPI_LAYOUT_DEFAULT; + break; + case 'I': + comp_id = strtoul(optarg, &end, 0); + if (*end != '\0' || comp_id == 0 || + comp_id > LCME_ID_MAX) { + fprintf(stderr, + "%s %s: invalid component ID '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + break; + case 'f': + if (opc != SO_MIRROR_EXTEND && opc != SO_MIRROR_SPLIT) { + fprintf(stderr, + "error: %s: invalid option: %s\n", + progname, argv[optopt + 1]); + goto usage_error; + } + if (opc == SO_MIRROR_EXTEND) { + if (last_mirror == NULL) { + fprintf(stderr, + "error: %s: '-N' must exist in front of '%s'\n", + progname, argv[optopt + 1]); + goto usage_error; + } + last_mirror->m_file = optarg; + last_mirror->m_count = 1; + } else { + /* mirror split */ + if (mirror_list == NULL) + mirror_list = lfs_mirror_alloc(); + mirror_list->m_file = optarg; + } + has_m_file = true; + break; + case 'L': + if (strcmp(argv[optind - 1], "mdt") == 0) { + /* Can be only the first component */ + if (layout != NULL) { + result = -EINVAL; + fprintf(stderr, "error: 'mdt' layout " + "can be only the first one\n"); + goto error; + } + if (lsa.lsa_comp_end > (1ULL << 30)) { /* 1Gb */ + result = -EFBIG; + fprintf(stderr, "error: 'mdt' layout " + "size is too big\n"); + goto error; + } + lsa.lsa_pattern = LLAPI_LAYOUT_MDT; + } else if (strcmp(argv[optind - 1], "raid0") != 0) { + result = -EINVAL; + fprintf(stderr, "error: layout '%s' is " + "unknown, supported layouts are: " + "'mdt', 'raid0'\n", argv[optind]); + goto error; + } + break; + case 'm': + if (!migrate_mode) { + fprintf(stderr, + "%s %s: -m|--mdt-index valid only for migrate command\n", + progname, argv[0]); + goto usage_error; + } + mdt_idx_arg = optarg; + break; + case 'n': + if (!migrate_mode) { + fprintf(stderr, + "%s %s: -n|--non-block valid only for migrate command\n", + progname, argv[0]); + goto usage_error; + } + migration_flags |= MIGRATION_NONBLOCK; + break; + case 'N': + if (opc == SO_SETSTRIPE) { + opc = SO_MIRROR_CREATE; + mirror_mode = true; + } + mirror_count = 1; + if (optarg != NULL) { + mirror_count = strtoul(optarg, &end, 0); + if (*end != '\0' || mirror_count == 0) { + fprintf(stderr, + "error: %s: bad mirror count: %s\n", + progname, optarg); + result = -EINVAL; + goto error; + } + } + + new_mirror = lfs_mirror_alloc(); + new_mirror->m_count = mirror_count; + + if (mirror_list == NULL) + mirror_list = new_mirror; + + if (last_mirror != NULL) { + /* wrap up last mirror */ + if (lsa.lsa_comp_end == 0) + lsa.lsa_comp_end = LUSTRE_EOF; + + result = comp_args_to_layout(lpp, &lsa, true); + if (result) { + lfs_mirror_free(new_mirror); + goto error; + } + + setstripe_args_init_inherit(&lsa); + + last_mirror->m_next = new_mirror; + } + + last_mirror = new_mirror; + lpp = &last_mirror->m_layout; + break; + case 'o': +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + if (strcmp(argv[optind - 1], "--ost-list") == 0) + fprintf(stderr, "warning: '--ost-list' is " + "deprecated, use '--ost' instead\n"); +#endif + lsa.lsa_nr_tgts = parse_targets(osts, + sizeof(osts) / sizeof(__u32), + lsa.lsa_nr_tgts, optarg); + if (lsa.lsa_nr_tgts < 0) { + fprintf(stderr, + "%s %s: invalid OST target(s) '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + + lsa.lsa_tgts = osts; + if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) + lsa.lsa_stripe_off = osts[0]; + break; + case 'p': + if (optarg == NULL) + goto usage_error; + lsa.lsa_pool_name = optarg; + + if (strlen(lsa.lsa_pool_name) == 0 || + strncmp(lsa.lsa_pool_name, "none", + LOV_MAXPOOLNAME) == 0) + lsa.lsa_pool_name = NULL; + break; + case 'S': + result = llapi_parse_size(optarg, &lsa.lsa_stripe_size, + &size_units, 0); + if (result) { + fprintf(stderr, + "%s %s: invalid stripe size '%s'\n", + progname, argv[0], optarg); + goto usage_error; + } + break; + case 'v': + if (!migrate_mode) { + fprintf(stderr, + "%s %s: -v|--verbose valid only for migrate command\n", + progname, argv[0]); + goto usage_error; + } + migrate_mdt_param.fp_verbose = VERBOSE_DETAIL; + break; + case 'y': + from_yaml = true; + template = optarg; + break; + default: + fprintf(stderr, "%s %s: unrecognized option '%s'\n", + progname, argv[0], argv[optind - 1]); + goto usage_error; + } + } + + fname = argv[optind]; + + if (optind == argc) { + fprintf(stderr, "%s %s: FILE must be specified\n", + progname, argv[0]); + goto usage_error; + } + + if (mirror_mode && mirror_count == 0) { + fprintf(stderr, + "error: %s: --mirror-count|-N option is required\n", + progname); + result = -EINVAL; + goto error; + } + + if (mirror_mode) { + if (lsa.lsa_comp_end == 0) + lsa.lsa_comp_end = LUSTRE_EOF; + } + + if (lsa.lsa_comp_end != 0) { + result = comp_args_to_layout(lpp, &lsa, true); + if (result) + goto error; + } + + if (mirror_flags & MF_NO_VERIFY) { + if (opc != SO_MIRROR_EXTEND) { + fprintf(stderr, + "error: %s: --no-verify is valid only for lfs mirror extend command\n", + progname); + result = -EINVAL; + goto error; + } else if (!has_m_file) { + fprintf(stderr, + "error: %s: --no-verify must be specified with -f option\n", + progname); + result = -EINVAL; + goto error; + } + } + + /* Only LCME_FL_INIT flags is used in PFL, and it shouldn't be + * altered by user space tool, so we don't need to support the + * --component-set for this moment. */ + if (comp_set && !comp_id) { + fprintf(stderr, "%s %s: --component-set doesn't have component-id set\n", + progname, argv[0]); + goto usage_error; + } + + if ((delete + comp_set + comp_del + comp_add) > 1) { + fprintf(stderr, + "%s %s: options --component-set, --component-del, --component-add and -d are mutually exclusive\n", + progname, argv[0]); + goto usage_error; + } + + if (delete && (setstripe_args_specified(&lsa) || comp_id != 0 || + lsa.lsa_comp_flags != 0 || layout != NULL)) { + fprintf(stderr, + "%s %s: option -d is mutually exclusive with -s, -c, -o, -p, -I, -F and -E options\n", + progname, argv[0]); + goto usage_error; + } + + if ((comp_set || comp_del) && + (setstripe_args_specified(&lsa) || layout != NULL)) { + fprintf(stderr, + "%s %s: options --component-del and --component-set are mutually exclusive when used with -c, -E, -o, -p, or -s\n", + progname, argv[0]); + goto usage_error; + } + + if (comp_del && comp_id != 0 && lsa.lsa_comp_flags != 0) { + fprintf(stderr, + "%s %s: options -I and -F are mutually exclusive when used with --component-del\n", + progname, argv[0]); + goto usage_error; + } + + if (comp_add || comp_del) { + struct stat st; + + result = lstat(fname, &st); + if (result == 0 && S_ISDIR(st.st_mode)) { + fprintf(stderr, + "%s setstripe: cannot use --component-add or --component-del for directory\n", + progname); + goto usage_error; + } + + if (mirror_mode) { + fprintf(stderr, "error: %s: can't use --component-add " + "or --component-del for mirror operation\n", + progname); + goto usage_error; + } + } + + if (comp_add) { + if (layout == NULL) { + fprintf(stderr, + "%s %s: option -E must be specified with --component-add\n", + progname, argv[0]); + goto usage_error; + } + + result = adjust_first_extent(fname, layout); + if (result == -ENODATA) + comp_add = 0; + else if (result != 0) + goto error; + } + + if (from_yaml && from_copy) { + fprintf(stderr, + "%s: can't specify --yaml and --copy together\n", + progname); + goto error; + } + + if ((from_yaml || from_copy) && + (setstripe_args_specified(&lsa) || layout != NULL)) { + fprintf(stderr, "error: %s: can't specify --yaml with " + "-c, -S, -i, -o, -p or -E options.\n", + argv[0]); + goto error; + } + + if (mdt_idx_arg != NULL && optind > 3) { + fprintf(stderr, + "%s %s: option -m cannot be used with other options\n", + progname, argv[0]); + goto usage_error; + } + + if ((migration_flags & MIGRATION_NONBLOCK) && migration_block) { + fprintf(stderr, + "%s %s: options --non-block and --block are mutually exclusive\n", + progname, argv[0]); + goto usage_error; + } + + if (!comp_del && !comp_set && comp_id != 0) { + fprintf(stderr, + "%s %s: option -I can only be used with --component-del\n", + progname, argv[0]); + goto usage_error; + } + + if (mdt_idx_arg != NULL) { + /* initialize migrate mdt parameters */ + migrate_mdt_param.fp_mdt_index = strtoul(mdt_idx_arg, &end, 0); + if (*end != '\0') { + fprintf(stderr, "%s %s: invalid MDT index '%s'\n", + progname, argv[0], mdt_idx_arg); + goto usage_error; + } + migrate_mdt_param.fp_migrate = 1; + } else if (layout == NULL) { + /* initialize stripe parameters */ + param = calloc(1, offsetof(typeof(*param), + lsp_osts[lsa.lsa_nr_tgts])); + if (param == NULL) { + fprintf(stderr, + "%s %s: cannot allocate memory for parameters: %s\n", + progname, argv[0], strerror(ENOMEM)); + result = -ENOMEM; + goto error; + } + + if (lsa.lsa_stripe_size != LLAPI_LAYOUT_DEFAULT) + param->lsp_stripe_size = lsa.lsa_stripe_size; + if (lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT) { + if (lsa.lsa_stripe_count == LLAPI_LAYOUT_WIDE) + param->lsp_stripe_count = -1; + else + param->lsp_stripe_count = lsa.lsa_stripe_count; + } + if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) + param->lsp_stripe_offset = -1; + else + param->lsp_stripe_offset = lsa.lsa_stripe_off; + param->lsp_pool = lsa.lsa_pool_name; + param->lsp_is_specific = false; + if (lsa.lsa_nr_tgts > 0) { + if (lsa.lsa_stripe_count > 0 && + lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT && + lsa.lsa_stripe_count != LLAPI_LAYOUT_WIDE && + lsa.lsa_nr_tgts != lsa.lsa_stripe_count) { + fprintf(stderr, "error: %s: stripe count %lld " + "doesn't match the number of OSTs: %d\n" + , argv[0], lsa.lsa_stripe_count, + lsa.lsa_nr_tgts); + free(param); + goto usage_error; + } + + param->lsp_is_specific = true; + param->lsp_stripe_count = lsa.lsa_nr_tgts; + memcpy(param->lsp_osts, osts, + sizeof(*osts) * lsa.lsa_nr_tgts); + } + } + + if (from_yaml) { + /* generate a layout from a YAML template */ + result = lfs_comp_create_from_yaml(template, &layout, + &lsa, osts); + if (result) { + fprintf(stderr, "error: %s: can't create composite " + "layout from template file %s\n", + argv[0], template); + goto error; + } + } else if (from_copy) { + layout = llapi_layout_get_by_path(template, 0); + if (layout == NULL) { + fprintf(stderr, + "%s: can't create composite layout from file %s.\n", + progname, template); + goto error; + } + } + + for (fname = argv[optind]; fname != NULL; fname = argv[++optind]) { + if (mdt_idx_arg != NULL) { + result = llapi_migrate_mdt(fname, &migrate_mdt_param); + } else if (migrate_mode) { + result = lfs_migrate(fname, migration_flags, param, + layout); + } else if (comp_set != 0) { + result = lfs_component_set(fname, comp_id, + lsa.lsa_comp_flags, + lsa.lsa_comp_neg_flags); + } else if (comp_del != 0) { + result = lfs_component_del(fname, comp_id, + lsa.lsa_comp_flags, + lsa.lsa_comp_neg_flags); + } else if (comp_add != 0) { + result = lfs_component_add(fname, layout); + } else if (opc == SO_MIRROR_CREATE) { + result = mirror_create(fname, mirror_list); + } else if (opc == SO_MIRROR_EXTEND) { + result = mirror_extend(fname, mirror_list, + mirror_flags); + } else if (opc == SO_MIRROR_SPLIT) { + if (mirror_id == 0) { + fprintf(stderr, + "%s %s: no mirror id is specified\n", + progname, argv[0]); + goto usage_error; + } + result = mirror_split(fname, mirror_id, mirror_flags, + has_m_file ? mirror_list->m_file : + NULL); + } else if (layout != NULL) { + result = lfs_component_create(fname, O_CREAT | O_WRONLY, + 0666, layout); + if (result >= 0) { + close(result); + result = 0; + } + } else { + result = llapi_file_open_param(fname, + O_CREAT | O_WRONLY, + 0666, param); + if (result >= 0) { + close(result); + result = 0; + } + } + if (result) { + /* Save the first error encountered. */ + if (result2 == 0) + result2 = result; + continue; + } + } + + free(param); + llapi_layout_free(layout); + lfs_mirror_list_free(mirror_list); + return result2; +usage_error: + result = CMD_HELP; +error: + llapi_layout_free(layout); + lfs_mirror_list_free(mirror_list); + return result; +} + +static int lfs_poollist(int argc, char **argv) +{ + if (argc != 2) + return CMD_HELP; + + return llapi_poollist(argv[1]); +} + +static int set_time(time_t *time, time_t *set, char *str) +{ + time_t t; + int res = 0; + char *endptr; + + if (str[0] == '+') + res = 1; + else if (str[0] == '-') + res = -1; + + if (res) + str++; + + t = strtol(str, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr, + "%s find: bad time '%s': %s\n", + progname, str, strerror(EINVAL)); + return INT_MAX; + } + if (*time < t * 24 * 60 * 60) { + if (res != 0) + str--; + fprintf(stderr, + "%s find: bad time '%s': too large\n", + progname, str); + return INT_MAX; + } + + *set = *time - t * 24 * 60 * 60; + return res; +} + +static int name2uid(unsigned int *id, const char *name) +{ + struct passwd *passwd; + + passwd = getpwnam(name); + if (passwd == NULL) + return -ENOENT; + *id = passwd->pw_uid; + + return 0; +} + +static int name2gid(unsigned int *id, const char *name) +{ + struct group *group; + + group = getgrnam(name); + if (group == NULL) + return -ENOENT; + *id = group->gr_gid; + + return 0; +} + +static inline int name2projid(unsigned int *id, const char *name) +{ + return -ENOTSUP; +} + +static int uid2name(char **name, unsigned int id) +{ + struct passwd *passwd; + + passwd = getpwuid(id); + if (passwd == NULL) + return -ENOENT; + *name = passwd->pw_name; + + return 0; +} + +static inline int gid2name(char **name, unsigned int id) +{ + struct group *group; + + group = getgrgid(id); + if (group == NULL) + return -ENOENT; + *name = group->gr_name; + + return 0; +} + +static int name2layout(__u32 *layout, char *name) +{ + char *ptr, *layout_name; + + *layout = 0; + for (ptr = name; ; ptr = NULL) { + layout_name = strtok(ptr, ","); + if (layout_name == NULL) + break; + if (strcmp(layout_name, "released") == 0) + *layout |= LOV_PATTERN_F_RELEASED; + else if (strcmp(layout_name, "raid0") == 0) + *layout |= LOV_PATTERN_RAID0; + else if (strcmp(layout_name, "mdt") == 0) + *layout |= LOV_PATTERN_MDT; + else + return -1; + } + return 0; +} + +static int lfs_find(int argc, char **argv) +{ + int c, rc; + int ret = 0; + time_t t; + struct find_param param = { + .fp_max_depth = -1, + .fp_quiet = 1, + }; + struct option long_opts[] = { + { .val = 'A', .name = "atime", .has_arg = required_argument }, + { .val = 'b', .name = "blocks", .has_arg = required_argument }, + { .val = LFS_COMP_COUNT_OPT, + .name = "comp-count", .has_arg = required_argument }, + { .val = LFS_COMP_COUNT_OPT, + .name = "component-count", + .has_arg = required_argument }, + { .val = LFS_COMP_FLAGS_OPT, + .name = "comp-flags", .has_arg = required_argument }, + { .val = LFS_COMP_FLAGS_OPT, + .name = "component-flags", + .has_arg = required_argument }, + { .val = LFS_COMP_START_OPT, + .name = "comp-start", .has_arg = required_argument }, + { .val = LFS_COMP_START_OPT, + .name = "component-start", + .has_arg = required_argument }, + { .val = LFS_MIRROR_STATE_OPT, + .name = "mirror-state", .has_arg = required_argument }, + { .val = 'c', .name = "stripe-count", .has_arg = required_argument }, + { .val = 'c', .name = "stripe_count", .has_arg = required_argument }, + { .val = 'C', .name = "ctime", .has_arg = required_argument }, +/* getstripe { .val = 'd', .name = "directory", .has_arg = no_argument }, */ + { .val = 'D', .name = "maxdepth", .has_arg = required_argument }, + { .val = 'E', .name = "comp-end", .has_arg = required_argument }, + { .val = 'E', .name = "component-end", + .has_arg = required_argument }, +/* find { .val = 'F', .name = "fid", .has_arg = no_argument }, */ + { .val = 'g', .name = "gid", .has_arg = required_argument }, + { .val = 'G', .name = "group", .has_arg = required_argument }, + { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }, + { .val = 'i', .name = "stripe-index", .has_arg = required_argument }, + { .val = 'i', .name = "stripe_index", .has_arg = required_argument }, +/* getstripe { .val = 'I', .name = "comp-id", .has_arg = required_argument }*/ + { .val = 'L', .name = "layout", .has_arg = required_argument }, + { .val = 'm', .name = "mdt", .has_arg = required_argument }, + { .val = 'm', .name = "mdt-index", .has_arg = required_argument }, + { .val = 'm', .name = "mdt_index", .has_arg = required_argument }, + { .val = 'M', .name = "mtime", .has_arg = required_argument }, + { .val = 'n', .name = "name", .has_arg = required_argument }, + { .val = 'N', .name = "mirror-count", .has_arg = required_argument }, +/* find { .val = 'o' .name = "or", .has_arg = no_argument }, like find(1) */ + { .val = 'O', .name = "obd", .has_arg = required_argument }, + { .val = 'O', .name = "ost", .has_arg = required_argument }, + /* no short option for pool yet, can be 'p' after 2.18 */ + { .val = LFS_POOL_OPT, + .name = "pool", .has_arg = required_argument }, + { .val = '0', .name = "print0", .has_arg = no_argument }, + { .val = 'P', .name = "print", .has_arg = no_argument }, + { .val = LFS_PROJID_OPT, + .name = "projid", .has_arg = required_argument }, +/* getstripe { .val = 'q', .name = "quiet", .has_arg = no_argument }, */ +/* getstripe { .val = 'r', .name = "recursive", .has_arg = no_argument }, */ +/* getstripe { .val = 'R', .name = "raw", .has_arg = no_argument }, */ + { .val = 's', .name = "size", .has_arg = required_argument }, + { .val = 'S', .name = "stripe-size", .has_arg = required_argument }, + { .val = 'S', .name = "stripe_size", .has_arg = required_argument }, + { .val = 't', .name = "type", .has_arg = required_argument }, + { .val = 'T', .name = "mdt-count", .has_arg = required_argument }, + { .val = 'u', .name = "uid", .has_arg = required_argument }, + { .val = 'U', .name = "user", .has_arg = required_argument }, +/* getstripe { .val = 'v', .name = "verbose", .has_arg = no_argument }, */ +/* getstripe { .val = 'y', .name = "yaml", .has_arg = no_argument }, */ + { .name = NULL } }; + int pathstart = -1; + int pathend = -1; + int neg_opt = 0; + time_t *xtime; + int *xsign; + int isoption; + char *endptr; + + time(&t); + + /* when getopt_long_only() hits '!' it returns 1, puts "!" in optarg */ + while ((c = getopt_long_only(argc, argv, + "-0A:b:c:C:D:E:g:G:H:i:L:m:M:n:N:O:Ppqrs:S:t:T:u:U:v", + long_opts, NULL)) >= 0) { + xtime = NULL; + xsign = NULL; + if (neg_opt) + --neg_opt; + /* '!' is part of option */ + /* when getopt_long_only() finds a string which is not + * an option nor a known option argument it returns 1 + * in that case if we already have found pathstart and pathend + * (i.e. we have the list of pathnames), + * the only supported value is "!" + */ + isoption = (c != 1) || (strcmp(optarg, "!") == 0); + if (!isoption && pathend != -1) { + fprintf(stderr, "err: %s: filename|dirname must either " + "precede options or follow options\n", + argv[0]); + ret = CMD_HELP; + goto err; + } + if (!isoption && pathstart == -1) + pathstart = optind - 1; + if (isoption && pathstart != -1 && pathend == -1) + pathend = optind - 2; + switch (c) { + case 0: + /* Long options. */ + break; + case 1: + /* unknown; opt is "!" or path component, + * checking done above. + */ + if (strcmp(optarg, "!") == 0) + neg_opt = 2; + break; + case 'A': + xtime = ¶m.fp_atime; + xsign = ¶m.fp_asign; + param.fp_exclude_atime = !!neg_opt; + /* no break, this falls through to 'C' for ctime */ + case 'C': + if (c == 'C') { + xtime = ¶m.fp_ctime; + xsign = ¶m.fp_csign; + param.fp_exclude_ctime = !!neg_opt; + } + /* no break, this falls through to 'M' for mtime */ + case 'M': + if (c == 'M') { + xtime = ¶m.fp_mtime; + xsign = ¶m.fp_msign; + param.fp_exclude_mtime = !!neg_opt; + } + rc = set_time(&t, xtime, optarg); + if (rc == INT_MAX) { + ret = -1; + goto err; + } + if (rc) + *xsign = rc; + break; + case 'b': + if (optarg[0] == '+') { + param.fp_blocks_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_blocks_sign = 1; + optarg++; + } + + param.fp_blocks_units = 1024; + ret = llapi_parse_size(optarg, ¶m.fp_blocks, + ¶m.fp_blocks_units, 0); + if (ret) { + fprintf(stderr, "error: bad blocks '%s'\n", + optarg); + goto err; + } + param.fp_check_blocks = 1; + param.fp_exclude_blocks = !!neg_opt; + break; + case LFS_COMP_COUNT_OPT: + if (optarg[0] == '+') { + param.fp_comp_count_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_comp_count_sign = 1; + optarg++; + } + + param.fp_comp_count = strtoul(optarg, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr, "error: bad component count " + "'%s'\n", optarg); + goto err; + } + param.fp_check_comp_count = 1; + param.fp_exclude_comp_count = !!neg_opt; + break; + case LFS_COMP_FLAGS_OPT: + rc = comp_str2flags(optarg, ¶m.fp_comp_flags, + ¶m.fp_comp_neg_flags); + if (rc) { + fprintf(stderr, "error: bad component flags " + "'%s'\n", optarg); + goto err; + } + param.fp_check_comp_flags = 1; + if (neg_opt) { + __u32 flags = param.fp_comp_neg_flags; + param.fp_comp_neg_flags = param.fp_comp_flags; + param.fp_comp_flags = flags; + } + break; + case LFS_COMP_START_OPT: + if (optarg[0] == '+') { + param.fp_comp_start_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_comp_start_sign = 1; + optarg++; + } + + rc = llapi_parse_size(optarg, ¶m.fp_comp_start, + ¶m.fp_comp_start_units, 0); + if (rc) { + fprintf(stderr, "error: bad component start " + "'%s'\n", optarg); + goto err; + } + param.fp_check_comp_start = 1; + param.fp_exclude_comp_start = !!neg_opt; + break; + case LFS_MIRROR_STATE_OPT: + rc = mirror_str2state(optarg, ¶m.fp_mirror_state, + ¶m.fp_mirror_neg_state); + if (rc) { + fprintf(stderr, + "error: bad mirrored file state '%s'\n", + optarg); + goto err; + } + param.fp_check_mirror_state = 1; + if (neg_opt) { + __u16 state = param.fp_mirror_neg_state; + param.fp_mirror_neg_state = + param.fp_mirror_state; + param.fp_mirror_state = state; + } + break; + case 'c': + if (optarg[0] == '+') { + param.fp_stripe_count_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_stripe_count_sign = 1; + optarg++; + } + + param.fp_stripe_count = strtoul(optarg, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr,"error: bad stripe_count '%s'\n", + optarg); + ret = -1; + goto err; + } + param.fp_check_stripe_count = 1; + param.fp_exclude_stripe_count = !!neg_opt; + break; + case 'D': + param.fp_max_depth = strtol(optarg, 0, 0); + break; + case 'E': + if (optarg[0] == '+') { + param.fp_comp_end_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_comp_end_sign = 1; + optarg++; + } + + if (arg_is_eof(optarg)) { + param.fp_comp_end = LUSTRE_EOF; + param.fp_comp_end_units = 1; + rc = 0; + } else { + rc = llapi_parse_size(optarg, + ¶m.fp_comp_end, + ¶m.fp_comp_end_units, 0); + } + if (rc) { + fprintf(stderr, "error: bad component end " + "'%s'\n", optarg); + goto err; + } + param.fp_check_comp_end = 1; + param.fp_exclude_comp_end = !!neg_opt; + break; + case 'g': + case 'G': + rc = name2gid(¶m.fp_gid, optarg); + if (rc) { + param.fp_gid = strtoul(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, "Group/GID: %s cannot " + "be found.\n", optarg); + ret = -1; + goto err; + } + } + param.fp_exclude_gid = !!neg_opt; + param.fp_check_gid = 1; + break; + case 'H': + param.fp_hash_type = check_hashtype(optarg); + if (param.fp_hash_type == 0) { + fprintf(stderr, "error: bad hash_type '%s'\n", + optarg); + ret = -1; + goto err; + } + param.fp_check_hash_type = 1; + param.fp_exclude_hash_type = !!neg_opt; + break; + case 'L': + ret = name2layout(¶m.fp_layout, optarg); + if (ret) + goto err; + param.fp_exclude_layout = !!neg_opt; + param.fp_check_layout = 1; + break; + case 'u': + case 'U': + rc = name2uid(¶m.fp_uid, optarg); + if (rc) { + param.fp_uid = strtoul(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, "User/UID: %s cannot " + "be found.\n", optarg); + ret = -1; + goto err; + } + } + param.fp_exclude_uid = !!neg_opt; + param.fp_check_uid = 1; + break; + case 'n': + param.fp_pattern = (char *)optarg; + param.fp_exclude_pattern = !!neg_opt; + break; + case 'N': + if (optarg[0] == '+') { + param.fp_mirror_count_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_mirror_count_sign = 1; + optarg++; + } + + param.fp_mirror_count = strtoul(optarg, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr, + "error: bad mirror count '%s'\n", + optarg); + goto err; + } + param.fp_check_mirror_count = 1; + param.fp_exclude_mirror_count = !!neg_opt; + break; + case 'm': + case 'i': + case 'O': { + char *buf, *token, *next, *p; + int len = 1; + void *tmp; + + buf = strdup(optarg); + if (buf == NULL) { + ret = -ENOMEM; + goto err; + } + + param.fp_exclude_obd = !!neg_opt; + + token = buf; + while (token && *token) { + token = strchr(token, ','); + if (token) { + len++; + token++; + } + } + if (c == 'm') { + param.fp_exclude_mdt = !!neg_opt; + param.fp_num_alloc_mdts += len; + tmp = realloc(param.fp_mdt_uuid, + param.fp_num_alloc_mdts * + sizeof(*param.fp_mdt_uuid)); + if (tmp == NULL) { + ret = -ENOMEM; + goto err_free; + } + + param.fp_mdt_uuid = tmp; + } else { + param.fp_exclude_obd = !!neg_opt; + param.fp_num_alloc_obds += len; + tmp = realloc(param.fp_obd_uuid, + param.fp_num_alloc_obds * + sizeof(*param.fp_obd_uuid)); + if (tmp == NULL) { + ret = -ENOMEM; + goto err_free; + } + + param.fp_obd_uuid = tmp; + } + for (token = buf; token && *token; token = next) { + struct obd_uuid *puuid; + if (c == 'm') { + puuid = + ¶m.fp_mdt_uuid[param.fp_num_mdts++]; + } else { + puuid = + ¶m.fp_obd_uuid[param.fp_num_obds++]; + } + p = strchr(token, ','); + next = 0; + if (p) { + *p = 0; + next = p+1; + } + + if (strlen(token) > sizeof(puuid->uuid) - 1) { + ret = -E2BIG; + goto err_free; + } + + strncpy(puuid->uuid, token, + sizeof(puuid->uuid)); + } +err_free: + if (buf) + free(buf); + break; + } +#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 18, 53, 0) + case 'p': +#endif + case LFS_POOL_OPT: + if (strlen(optarg) > LOV_MAXPOOLNAME) { + fprintf(stderr, + "Pool name %s is too long (max %d)\n", + optarg, LOV_MAXPOOLNAME); + ret = -1; + goto err; + } + /* + * We do check for empty pool because empty pool + * is used to find V1 LOV attributes + */ + strncpy(param.fp_poolname, optarg, LOV_MAXPOOLNAME); + param.fp_poolname[LOV_MAXPOOLNAME] = '\0'; + param.fp_exclude_pool = !!neg_opt; + param.fp_check_pool = 1; + break; +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 14, 53, 0) + case 'p': /* want this for --pool, to match getstripe/find */ + fprintf(stderr, + "warning: -p deprecated, use --print0 or -0\n"); +#endif + case '0': + param.fp_zero_end = 1; + break; + case 'P': /* we always print, this option is a no-op */ + break; + case LFS_PROJID_OPT: + rc = name2projid(¶m.fp_projid, optarg); + if (rc) { + param.fp_projid = strtoul(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, + "Invalid project ID: %s", + optarg); + ret = -1; + goto err; + } + } + param.fp_exclude_projid = !!neg_opt; + param.fp_check_projid = 1; + break; + case 's': + if (optarg[0] == '+') { + param.fp_size_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_size_sign = 1; + optarg++; + } + + ret = llapi_parse_size(optarg, ¶m.fp_size, + ¶m.fp_size_units, 0); + if (ret) { + fprintf(stderr, "error: bad file size '%s'\n", + optarg); + goto err; + } + param.fp_check_size = 1; + param.fp_exclude_size = !!neg_opt; + break; + case 'S': + if (optarg[0] == '+') { + param.fp_stripe_size_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_stripe_size_sign = 1; + optarg++; + } + + ret = llapi_parse_size(optarg, ¶m.fp_stripe_size, + ¶m.fp_stripe_size_units, 0); + if (ret) { + fprintf(stderr, "error: bad stripe_size '%s'\n", + optarg); + goto err; + } + param.fp_check_stripe_size = 1; + param.fp_exclude_stripe_size = !!neg_opt; + break; + case 't': + param.fp_exclude_type = !!neg_opt; + switch (optarg[0]) { + case 'b': + param.fp_type = S_IFBLK; + break; + case 'c': + param.fp_type = S_IFCHR; + break; + case 'd': + param.fp_type = S_IFDIR; + break; + case 'f': + param.fp_type = S_IFREG; + break; + case 'l': + param.fp_type = S_IFLNK; + break; + case 'p': + param.fp_type = S_IFIFO; + break; + case 's': + param.fp_type = S_IFSOCK; + break; + default: + fprintf(stderr, "error: %s: bad type '%s'\n", + argv[0], optarg); + ret = CMD_HELP; + goto err; + }; + break; + case 'T': + if (optarg[0] == '+') { + param.fp_mdt_count_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_mdt_count_sign = 1; + optarg++; + } + + param.fp_mdt_count = strtoul(optarg, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr, "error: bad mdt_count '%s'\n", + optarg); + ret = -1; goto err; } - param.fp_check_comp_flags = 1; - param.fp_exclude_comp_flags = !!neg_opt; + param.fp_check_mdt_count = 1; + param.fp_exclude_mdt_count = !!neg_opt; + break; + default: + ret = CMD_HELP; + goto err; + }; + } + + if (pathstart == -1) { + fprintf(stderr, "error: %s: no filename|pathname\n", + argv[0]); + ret = CMD_HELP; + goto err; + } else if (pathend == -1) { + /* no options */ + pathend = argc; + } + + do { + rc = llapi_find(argv[pathstart], ¶m); + if (rc != 0 && ret == 0) + ret = rc; + } while (++pathstart < pathend); + + if (ret) + fprintf(stderr, "error: %s failed for %s.\n", + argv[0], argv[optind - 1]); +err: + if (param.fp_obd_uuid && param.fp_num_alloc_obds) + free(param.fp_obd_uuid); + + if (param.fp_mdt_uuid && param.fp_num_alloc_mdts) + free(param.fp_mdt_uuid); + + return ret; +} + +static int lfs_getstripe_internal(int argc, char **argv, + struct find_param *param) +{ + struct option long_opts[] = { +/* find { .val = 'A', .name = "atime", .has_arg = required_argument }*/ +/* find { .val = 'b', .name = "blocks", .has_arg = required_argument }*/ + { .val = LFS_COMP_COUNT_OPT, + .name = "comp-count", .has_arg = no_argument }, + { .val = LFS_COMP_COUNT_OPT, + .name = "component-count", .has_arg = no_argument }, + { .val = LFS_COMP_FLAGS_OPT, + .name = "comp-flags", .has_arg = optional_argument }, + { .val = LFS_COMP_FLAGS_OPT, + .name = "component-flags", .has_arg = optional_argument }, + { .val = LFS_COMP_START_OPT, + .name = "comp-start", .has_arg = optional_argument }, + { .val = LFS_COMP_START_OPT, + .name = "component-start", .has_arg = optional_argument }, + { .val = 'c', .name = "stripe-count", .has_arg = no_argument }, + { .val = 'c', .name = "stripe_count", .has_arg = no_argument }, +/* find { .val = 'C', .name = "ctime", .has_arg = required_argument }*/ + { .val = 'd', .name = "directory", .has_arg = no_argument }, + { .val = 'D', .name = "default", .has_arg = no_argument }, + { .val = 'E', .name = "comp-end", .has_arg = optional_argument }, + { .val = 'E', .name = "component-end", .has_arg = optional_argument }, + { .val = 'F', .name = "fid", .has_arg = no_argument }, + { .val = 'g', .name = "generation", .has_arg = no_argument }, +/* find { .val = 'G', .name = "group", .has_arg = required_argument }*/ +/* dirstripe { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }*/ + { .val = 'i', .name = "stripe-index", .has_arg = no_argument }, + { .val = 'i', .name = "stripe_index", .has_arg = no_argument }, + { .val = 'I', .name = "comp-id", .has_arg = optional_argument }, + { .val = 'I', .name = "component-id", .has_arg = optional_argument }, + { .val = 'L', .name = "layout", .has_arg = no_argument }, + { .val = 'm', .name = "mdt", .has_arg = no_argument }, + { .val = 'm', .name = "mdt-index", .has_arg = no_argument }, + { .val = 'm', .name = "mdt_index", .has_arg = no_argument }, +/* find { .val = 'M', .name = "mtime", .has_arg = required_argument }*/ +/* find { .val = 'n', .name = "name", .has_arg = required_argument }*/ + { .val = 'O', .name = "obd", .has_arg = required_argument }, + { .val = 'O', .name = "ost", .has_arg = required_argument }, + { .val = 'p', .name = "pool", .has_arg = no_argument }, +/* find { .val = 'P', .name = "print", .has_arg = no_argument }, */ + { .val = 'q', .name = "quiet", .has_arg = no_argument }, + { .val = 'r', .name = "recursive", .has_arg = no_argument }, + { .val = 'R', .name = "raw", .has_arg = no_argument }, + { .val = 'S', .name = "stripe-size", .has_arg = no_argument }, + { .val = 'S', .name = "stripe_size", .has_arg = no_argument }, +/* find { .val = 't', .name = "type", .has_arg = required_argument }*/ +/* dirstripe { .val = 'T', .name = "mdt-count", .has_arg = required_argument }*/ +/* find { .val = 'u', .name = "uid", .has_arg = required_argument }*/ +/* find { .val = 'U', .name = "user", .has_arg = required_argument }*/ + { .val = 'v', .name = "verbose", .has_arg = no_argument }, + { .val = 'y', .name = "yaml", .has_arg = no_argument }, + { .name = NULL } }; + int c, rc; + char *end, *tmp; + + while ((c = getopt_long(argc, argv, "cdDE::FghiI::LmMoO:pqrRsSvy", + long_opts, NULL)) != -1) { + switch (c) { + case 'c': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_COUNT; + param->fp_max_depth = 0; + } + break; + case LFS_COMP_COUNT_OPT: + param->fp_verbose |= VERBOSE_COMP_COUNT; + param->fp_max_depth = 0; + break; + case LFS_COMP_FLAGS_OPT: + if (optarg != NULL) { + rc = comp_str2flags(optarg, + ¶m->fp_comp_flags, + ¶m->fp_comp_neg_flags); + if (rc != 0) { + fprintf(stderr, "error: %s bad " + "component flags '%s'.\n", + argv[0], optarg); + return CMD_HELP; + } + param->fp_check_comp_flags = 1; + } else { + param->fp_verbose |= VERBOSE_COMP_FLAGS; + param->fp_max_depth = 0; + } + break; + case LFS_COMP_START_OPT: + if (optarg != NULL) { + tmp = optarg; + if (tmp[0] == '+') { + param->fp_comp_start_sign = -1; + tmp++; + } else if (tmp[0] == '-') { + param->fp_comp_start_sign = 1; + tmp++; + } + rc = llapi_parse_size(tmp, + ¶m->fp_comp_start, + ¶m->fp_comp_start_units, 0); + if (rc != 0) { + fprintf(stderr, "error: %s bad " + "component start '%s'.\n", + argv[0], tmp); + return CMD_HELP; + } else { + param->fp_check_comp_start = 1; + } + } else { + param->fp_verbose |= VERBOSE_COMP_START; + param->fp_max_depth = 0; + } + break; + case 'd': + param->fp_max_depth = 0; + break; + case 'D': + param->fp_get_default_lmv = 1; + break; + case 'E': + if (optarg != NULL) { + tmp = optarg; + if (tmp[0] == '+') { + param->fp_comp_end_sign = -1; + tmp++; + } else if (tmp[0] == '-') { + param->fp_comp_end_sign = 1; + tmp++; + } + + if (arg_is_eof(tmp)) { + param->fp_comp_end = LUSTRE_EOF; + param->fp_comp_end_units = 1; + rc = 0; + } else { + rc = llapi_parse_size(tmp, + ¶m->fp_comp_end, + ¶m->fp_comp_end_units, 0); + } + if (rc != 0) { + fprintf(stderr, "error: %s bad " + "component end '%s'.\n", + argv[0], tmp); + return CMD_HELP; + } + param->fp_check_comp_end = 1; + } else { + param->fp_verbose |= VERBOSE_COMP_END; + param->fp_max_depth = 0; + } + break; + case 'F': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_DFID; + param->fp_max_depth = 0; + } + break; + case 'g': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_GENERATION; + param->fp_max_depth = 0; + } + break; + case 'i': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_OFFSET; + param->fp_max_depth = 0; + } + break; + case 'I': + if (optarg != NULL) { + param->fp_comp_id = strtoul(optarg, &end, 0); + if (*end != '\0' || param->fp_comp_id == 0 || + param->fp_comp_id > LCME_ID_MAX) { + fprintf(stderr, "error: %s bad " + "component id '%s'\n", + argv[0], optarg); + return CMD_HELP; + } else { + param->fp_check_comp_id = 1; + } + } else { + param->fp_max_depth = 0; + param->fp_verbose |= VERBOSE_COMP_ID; + } + break; + case 'L': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_LAYOUT; + param->fp_max_depth = 0; + } + break; +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + case 'M': + fprintf(stderr, "warning: '-M' deprecated" + ", use '--mdt-index' or '-m' instead\n"); +#endif + case 'm': + if (!(param->fp_verbose & VERBOSE_DETAIL)) + param->fp_max_depth = 0; + param->fp_verbose |= VERBOSE_MDTINDEX; + break; + case 'O': + if (param->fp_obd_uuid) { + fprintf(stderr, + "error: %s: only one obduuid allowed", + argv[0]); + return CMD_HELP; + } + param->fp_obd_uuid = (struct obd_uuid *)optarg; + break; + case 'p': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_POOL; + param->fp_max_depth = 0; + } + break; + case 'q': + param->fp_quiet++; + break; + case 'r': + param->fp_recursive = 1; + break; + case 'R': + param->fp_raw = 1; + break; + case 'S': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_SIZE; + param->fp_max_depth = 0; + } + break; + case 'v': + param->fp_verbose = VERBOSE_DEFAULT | VERBOSE_DETAIL; + break; + case 'y': + param->fp_yaml = 1; + break; + default: + return CMD_HELP; + } + } + + if (optind >= argc) + return CMD_HELP; + + if (param->fp_recursive) + param->fp_max_depth = -1; + else if (param->fp_verbose & VERBOSE_DETAIL) + param->fp_max_depth = 1; + + if (!param->fp_verbose) + param->fp_verbose = VERBOSE_DEFAULT; + if (param->fp_quiet) + param->fp_verbose = VERBOSE_OBJID; + + do { + rc = llapi_getstripe(argv[optind], param); + } while (++optind < argc && !rc); + + if (rc) + fprintf(stderr, "error: %s failed for %s.\n", + argv[0], argv[optind - 1]); + return rc; +} + +static int lfs_tgts(int argc, char **argv) +{ + char mntdir[PATH_MAX] = {'\0'}, path[PATH_MAX] = {'\0'}; + struct find_param param; + int index = 0, rc=0; + + if (argc > 2) + return CMD_HELP; + + if (argc == 2 && !realpath(argv[1], path)) { + rc = -errno; + fprintf(stderr, "error: invalid path '%s': %s\n", + argv[1], strerror(-rc)); + return rc; + } + + while (!llapi_search_mounts(path, index++, mntdir, NULL)) { + /* Check if we have a mount point */ + if (mntdir[0] == '\0') + continue; + + memset(¶m, 0, sizeof(param)); + if (!strcmp(argv[0], "mdts")) + param.fp_get_lmv = 1; + + rc = llapi_ostlist(mntdir, ¶m); + if (rc) { + fprintf(stderr, "error: %s: failed on %s\n", + argv[0], mntdir); + } + if (path[0] != '\0') + break; + memset(mntdir, 0, PATH_MAX); + } + + return rc; +} + +static int lfs_getstripe(int argc, char **argv) +{ + struct find_param param = { 0 }; + + param.fp_max_depth = 1; + return lfs_getstripe_internal(argc, argv, ¶m); +} + +/* functions */ +static int lfs_getdirstripe(int argc, char **argv) +{ + struct find_param param = { 0 }; + struct option long_opts[] = { + { .val = 'c', .name = "mdt-count", .has_arg = no_argument }, + { .val = 'D', .name = "default", .has_arg = no_argument }, + { .val = 'H', .name = "mdt-hash", .has_arg = no_argument }, + { .val = 'i', .name = "mdt-index", .has_arg = no_argument }, + { .val = 'm', .name = "mdt-index", .has_arg = no_argument }, + { .val = 'O', .name = "obd", .has_arg = required_argument }, + { .val = 'r', .name = "recursive", .has_arg = no_argument }, + { .val = 'T', .name = "mdt-count", .has_arg = no_argument }, + { .val = 'y', .name = "yaml", .has_arg = no_argument }, + { .name = NULL } }; + int c, rc; + + param.fp_get_lmv = 1; + + while ((c = getopt_long(argc, argv, + "cDHimO:rtTy", long_opts, NULL)) != -1) + { + switch (c) { + case 'c': + case 'T': + param.fp_verbose |= VERBOSE_COUNT; + break; + case 'D': + param.fp_get_default_lmv = 1; + break; + case 'i': + case 'm': + param.fp_verbose |= VERBOSE_OFFSET; + break; +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + case 't': + fprintf(stderr, "warning: '-t' deprecated, " + "use '--mdt-hash' or '-H' instead\n"); +#endif + case 'H': + param.fp_verbose |= VERBOSE_HASH_TYPE; + break; + case 'O': + if (param.fp_obd_uuid) { + fprintf(stderr, + "error: %s: only one obduuid allowed", + argv[0]); + return CMD_HELP; + } + param.fp_obd_uuid = (struct obd_uuid *)optarg; + break; + case 'r': + param.fp_recursive = 1; + break; + case 'y': + param.fp_yaml = 1; + break; + default: + return CMD_HELP; + } + } + + if (optind >= argc) + return CMD_HELP; + + if (param.fp_recursive) + param.fp_max_depth = -1; + + if (!param.fp_verbose) + param.fp_verbose = VERBOSE_DEFAULT; + + do { + rc = llapi_getstripe(argv[optind], ¶m); + } while (++optind < argc && !rc); + + if (rc) + fprintf(stderr, "error: %s failed for %s.\n", + argv[0], argv[optind - 1]); + return rc; +} + +enum mntdf_flags { + MNTDF_INODES = 0x0001, + MNTDF_COOKED = 0x0002, + MNTDF_LAZY = 0x0004, + MNTDF_VERBOSE = 0x0008, + MNTDF_SHOW = 0x0010, +}; + +#define COOK(value) \ +({ \ + int radix = 0; \ + while (value > 1024) { \ + value /= 1024; \ + radix++; \ + } \ + radix; \ +}) +#define UUF "%-20s" +#define CSF "%11s" +#define CDF "%11llu" +#define HDF "%8.1f%c" +#define RSF "%4s" +#define RDF "%3d%%" + +static inline int obd_statfs_ratio(const struct obd_statfs *st) +{ + double avail, used, ratio = 0; + + avail = st->os_bavail; + used = st->os_blocks - st->os_bfree; + if (avail + used > 0) + ratio = used / (used + avail) * 100 + 0.5; + + return (int)ratio; +} + +static int showdf(char *mntdir, struct obd_statfs *stat, + char *uuid, enum mntdf_flags flags, + char *type, int index, int rc) +{ + long long avail, used, total; + int ratio = 0; + char *suffix = "KMGTPEZY"; + /* Note if we have >2^64 bytes/fs these buffers will need to be grown */ + char tbuf[3 * sizeof(__u64)]; + char ubuf[3 * sizeof(__u64)]; + char abuf[3 * sizeof(__u64)]; + char rbuf[3 * sizeof(__u64)]; + + if (!uuid || !stat) + return -EINVAL; + + switch (rc) { + case 0: + if (flags & MNTDF_INODES) { + avail = stat->os_ffree; + used = stat->os_files - stat->os_ffree; + total = stat->os_files; + } else { + int shift = flags & MNTDF_COOKED ? 0 : 10; + + avail = (stat->os_bavail * stat->os_bsize) >> shift; + used = ((stat->os_blocks - stat->os_bfree) * + stat->os_bsize) >> shift; + total = (stat->os_blocks * stat->os_bsize) >> shift; + } + + ratio = obd_statfs_ratio(stat); + + if (flags & MNTDF_COOKED) { + int i; + double cook_val; + + cook_val = (double)total; + i = COOK(cook_val); + if (i > 0) + snprintf(tbuf, sizeof(tbuf), HDF, cook_val, + suffix[i - 1]); + else + snprintf(tbuf, sizeof(tbuf), CDF, total); + + cook_val = (double)used; + i = COOK(cook_val); + if (i > 0) + snprintf(ubuf, sizeof(ubuf), HDF, cook_val, + suffix[i - 1]); + else + snprintf(ubuf, sizeof(ubuf), CDF, used); + + cook_val = (double)avail; + i = COOK(cook_val); + if (i > 0) + snprintf(abuf, sizeof(abuf), HDF, cook_val, + suffix[i - 1]); + else + snprintf(abuf, sizeof(abuf), CDF, avail); + } else { + snprintf(tbuf, sizeof(tbuf), CDF, total); + snprintf(ubuf, sizeof(tbuf), CDF, used); + snprintf(abuf, sizeof(tbuf), CDF, avail); + } + + sprintf(rbuf, RDF, ratio); + printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s", + uuid, tbuf, ubuf, abuf, rbuf, mntdir); + if (type) + printf("[%s:%d]", type, index); + + if (stat->os_state) { + /* + * Each character represents the matching + * OS_STATE_* bit. + */ + const char state_names[] = "DRSI"; + __u32 state; + __u32 i; + + printf(" "); + for (i = 0, state = stat->os_state; + state && i < sizeof(state_names); i++) { + if (!(state & (1 << i))) + continue; + printf("%c", state_names[i]); + state ^= 1 << i; + } + } + + printf("\n"); + break; + case -ENODATA: + printf(UUF": inactive device\n", uuid); + break; + default: + printf(UUF": %s\n", uuid, strerror(-rc)); + break; + } + + return 0; +} + +struct ll_stat_type { + int st_op; + char *st_name; +}; + +#define LL_STATFS_MAX LOV_MAX_STRIPE_COUNT + +struct ll_statfs_data { + int sd_index; + struct obd_statfs sd_st; +}; + +struct ll_statfs_buf { + int sb_count; + struct ll_statfs_data sb_buf[LL_STATFS_MAX]; +}; + +static int mntdf(char *mntdir, char *fsname, char *pool, enum mntdf_flags flags, + int ops, struct ll_statfs_buf *lsb) +{ + struct obd_statfs stat_buf, sum = { .os_bsize = 1 }; + struct obd_uuid uuid_buf; + char *poolname = NULL; + struct ll_stat_type types[] = { + { .st_op = LL_STATFS_LMV, .st_name = "MDT" }, + { .st_op = LL_STATFS_LOV, .st_name = "OST" }, + { .st_name = NULL } }; + struct ll_stat_type *tp; + __u64 ost_ffree = 0; + __u32 index; + __u32 type; + int fd; + int rc = 0; + int rc2; + + if (pool) { + poolname = strchr(pool, '.'); + if (poolname != NULL) { + if (strncmp(fsname, pool, strlen(fsname))) { + fprintf(stderr, "filesystem name incorrect\n"); + return -ENODEV; + } + poolname++; + } else + poolname = pool; + } + + fd = open(mntdir, O_RDONLY); + if (fd < 0) { + rc = -errno; + fprintf(stderr, "%s: cannot open '%s': %s\n", progname, mntdir, + strerror(errno)); + return rc; + } + + if (flags & MNTDF_SHOW) { + if (flags & MNTDF_INODES) + printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", + "UUID", "Inodes", "IUsed", "IFree", + "IUse%", "Mounted on"); + else + printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", + "UUID", + flags & MNTDF_COOKED ? "bytes" : "1K-blocks", + "Used", "Available", "Use%", "Mounted on"); + } + + for (tp = types; tp->st_name != NULL; tp++) { + if (!(tp->st_op & ops)) + continue; + + for (index = 0; ; index++) { + memset(&stat_buf, 0, sizeof(struct obd_statfs)); + memset(&uuid_buf, 0, sizeof(struct obd_uuid)); + type = flags & MNTDF_LAZY ? + tp->st_op | LL_STATFS_NODELAY : tp->st_op; + rc2 = llapi_obd_fstatfs(fd, type, index, + &stat_buf, &uuid_buf); + if (rc2 == -ENODEV) + break; + if (rc2 == -EAGAIN) + continue; + if (rc2 == -ENODATA) { /* Inactive device, OK. */ + if (!(flags & MNTDF_VERBOSE)) + continue; + } else if (rc2 < 0 && rc == 0) { + rc = rc2; + } + + if (poolname && tp->st_op == LL_STATFS_LOV && + llapi_search_ost(fsname, poolname, + obd_uuid2str(&uuid_buf)) != 1) + continue; + + /* the llapi_obd_statfs() call may have returned with + * an error, but if it filled in uuid_buf we will at + * lease use that to print out a message for that OBD. + * If we didn't get anything in the uuid_buf, then fill + * it in so that we can print an error message. */ + if (uuid_buf.uuid[0] == '\0') + snprintf(uuid_buf.uuid, sizeof(uuid_buf.uuid), + "%s%04x", tp->st_name, index); + if (!rc && lsb) { + lsb->sb_buf[lsb->sb_count].sd_index = index; + lsb->sb_buf[lsb->sb_count].sd_st = stat_buf; + lsb->sb_count++; + } + if (flags & MNTDF_SHOW) + showdf(mntdir, &stat_buf, + obd_uuid2str(&uuid_buf), flags, + tp->st_name, index, rc2); + + if (rc2 == 0) { + if (tp->st_op == LL_STATFS_LMV) { + sum.os_ffree += stat_buf.os_ffree; + sum.os_files += stat_buf.os_files; + } else /* if (tp->st_op == LL_STATFS_LOV) */ { + sum.os_blocks += stat_buf.os_blocks * + stat_buf.os_bsize; + sum.os_bfree += stat_buf.os_bfree * + stat_buf.os_bsize; + sum.os_bavail += stat_buf.os_bavail * + stat_buf.os_bsize; + ost_ffree += stat_buf.os_ffree; + } + } + } + } + + close(fd); + + /* If we don't have as many objects free on the OST as inodes + * on the MDS, we reduce the total number of inodes to + * compensate, so that the "inodes in use" number is correct. + * Matches ll_statfs_internal() so the results are consistent. */ + if (ost_ffree < sum.os_ffree) { + sum.os_files = (sum.os_files - sum.os_ffree) + ost_ffree; + sum.os_ffree = ost_ffree; + } + if (flags & MNTDF_SHOW) { + printf("\n"); + showdf(mntdir, &sum, "filesystem_summary:", flags, NULL, 0, 0); + printf("\n"); + } + + return rc; +} + +static int ll_statfs_data_comp(const void *sd1, const void *sd2) +{ + const struct obd_statfs *st1 = &((const struct ll_statfs_data *)sd1)-> + sd_st; + const struct obd_statfs *st2 = &((const struct ll_statfs_data *)sd2)-> + sd_st; + int r1 = obd_statfs_ratio(st1); + int r2 = obd_statfs_ratio(st2); + int64_t result = r1 - r2; + + /* if both space usage are above 90, compare free inodes */ + if (r1 > 90 && r2 > 90) + result = st2->os_ffree - st1->os_ffree; + + if (result < 0) + return -1; + else if (result == 0) + return 0; + else + return 1; +} + +/* functions */ +static int lfs_setdirstripe(int argc, char **argv) +{ + char *dname; + int result; + struct lfs_setstripe_args lsa = { 0 }; + struct llapi_stripe_param *param = NULL; + __u32 mdts[LMV_MAX_STRIPE_COUNT] = { 0 }; + char *end; + int c; + char *mode_opt = NULL; + bool default_stripe = false; + mode_t mode = S_IRWXU | S_IRWXG | S_IRWXO; + mode_t previous_mode = 0; + bool delete = false; + struct ll_statfs_buf *lsb = NULL; + char mntdir[PATH_MAX] = ""; + bool auto_distributed = false; + + struct option long_opts[] = { + { .val = 'c', .name = "count", .has_arg = required_argument }, + { .val = 'c', .name = "mdt-count", .has_arg = required_argument }, + { .val = 'd', .name = "delete", .has_arg = no_argument }, + { .val = 'D', .name = "default", .has_arg = no_argument }, + { .val = 'D', .name = "default_stripe", .has_arg = no_argument }, + { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }, + { .val = 'i', .name = "mdt-index", .has_arg = required_argument }, +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + { .val = 'i', .name = "index", .has_arg = required_argument }, +#endif + { .val = 'o', .name = "mode", .has_arg = required_argument }, +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + { .val = 't', .name = "hash-type", .has_arg = required_argument }, +#endif + { .val = 'T', .name = "mdt-count", .has_arg = required_argument }, +/* setstripe { .val = 'y', .name = "yaml", .has_arg = no_argument }, */ + { .name = NULL } }; + + setstripe_args_init(&lsa); + + while ((c = getopt_long(argc, argv, "c:dDi:H:m:o:t:T:", long_opts, + NULL)) >= 0) { + switch (c) { + case 0: + /* Long options. */ + break; + case 'c': + case 'T': + lsa.lsa_stripe_count = strtoul(optarg, &end, 0); + if (*end != '\0') { + fprintf(stderr, + "%s %s: invalid stripe count '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; + } break; - case LFS_COMP_START_OPT: - if (optarg[0] == '+') { - param.fp_comp_start_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_comp_start_sign = 1; - optarg++; + case 'd': + delete = true; + default_stripe = true; + break; + case 'D': + default_stripe = true; + break; +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + case 't': + fprintf(stderr, "warning: '--hash-type' and '-t' " + "deprecated, use '--mdt-hash' or '-H' instead\n"); +#endif + case 'H': + lsa.lsa_pattern = check_hashtype(optarg); + if (lsa.lsa_pattern == 0) { + fprintf(stderr, + "%s %s: bad stripe hash type '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; + } + break; + case 'i': +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + if (strcmp(argv[optind - 1], "--index") == 0) + fprintf(stderr, + "%s %s: warning: '--index' deprecated, use '--mdt-index' instead\n", + progname, argv[0]); +#endif + lsa.lsa_nr_tgts = parse_targets(mdts, + sizeof(mdts) / sizeof(__u32), + lsa.lsa_nr_tgts, optarg); + if (lsa.lsa_nr_tgts < 0) { + fprintf(stderr, + "%s %s: invalid MDT target(s) '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; } - rc = llapi_parse_size(optarg, ¶m.fp_comp_start, - ¶m.fp_comp_start_units, 0); - if (rc) { - fprintf(stderr, "error: bad component start " - "'%s'\n", optarg); - goto err; + lsa.lsa_tgts = mdts; + if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) + lsa.lsa_stripe_off = mdts[0]; + break; +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 16, 53, 0) + case 'm': + fprintf(stderr, "warning: '-m' is deprecated, " + "use '--mode' or '-o' instead\n"); +#endif + case 'o': + mode_opt = optarg; + break; + default: + fprintf(stderr, "%s %s: unrecognized option '%s'\n", + progname, argv[0], argv[optind - 1]); + return CMD_HELP; + } + } + + if (optind == argc) { + fprintf(stderr, "%s %s: DIR must be specified\n", + progname, argv[0]); + return CMD_HELP; + } + + if (!delete && lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT && + lsa.lsa_stripe_count == LLAPI_LAYOUT_DEFAULT) { + fprintf(stderr, + "%s %s: stripe offset and count must be specified\n", + progname, argv[0]); + return CMD_HELP; + } + + if (delete && + (lsa.lsa_stripe_off != LLAPI_LAYOUT_DEFAULT || + lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT)) { + fprintf(stderr, + "%s %s: cannot specify -d with -c or -i options\n", + progname, argv[0]); + return CMD_HELP; + } + + if (mode_opt != NULL) { + mode = strtoul(mode_opt, &end, 8); + if (*end != '\0') { + fprintf(stderr, + "%s %s: bad MODE '%s'\n", + progname, argv[0], mode_opt); + return CMD_HELP; + } + previous_mode = umask(0); + } + + /* + * initialize stripe parameters, in case param is converted to specific, + * i.e, 'lfs mkdir -i -1 -c N', always allocate space for lsp_tgts. + */ + param = calloc(1, offsetof(typeof(*param), + lsp_tgts[lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT ? + lsa.lsa_stripe_count : lsa.lsa_nr_tgts])); + if (param == NULL) { + fprintf(stderr, + "%s %s: cannot allocate memory for parameters: %s\n", + progname, argv[0], strerror(ENOMEM)); + return CMD_HELP; + } + + if (lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT) + param->lsp_stripe_count = lsa.lsa_stripe_count; + if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) + param->lsp_stripe_offset = -1; + else + param->lsp_stripe_offset = lsa.lsa_stripe_off; + if (lsa.lsa_pattern != LLAPI_LAYOUT_RAID0) + param->lsp_stripe_pattern = lsa.lsa_pattern; + else + param->lsp_stripe_pattern = LMV_HASH_TYPE_FNV_1A_64; + param->lsp_pool = lsa.lsa_pool_name; + param->lsp_is_specific = false; + if (lsa.lsa_nr_tgts > 1) { + if (lsa.lsa_stripe_count > 0 && + lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT && + lsa.lsa_stripe_count != lsa.lsa_nr_tgts) { + fprintf(stderr, "error: %s: stripe count %lld doesn't " + "match the number of MDTs: %d\n", + argv[0], lsa.lsa_stripe_count, lsa.lsa_nr_tgts); + free(param); + return CMD_HELP; + } + + param->lsp_is_specific = true; + param->lsp_stripe_count = lsa.lsa_nr_tgts; + memcpy(param->lsp_tgts, mdts, sizeof(*mdts) * lsa.lsa_nr_tgts); + } + + dname = argv[optind]; + do { + if (default_stripe) { + result = llapi_dir_set_default_lmv(dname, param); + } else { + /* if current \a dname isn't under the same \a mntdir + * as the last one, and the last one was + * auto-distributed, restore \a param. + */ + if (mntdir[0] != '\0' && + strncmp(dname, mntdir, strlen(mntdir)) && + auto_distributed) { + param->lsp_is_specific = false; + param->lsp_stripe_offset = -1; + auto_distributed = false; } - param.fp_check_comp_start = 1; - param.fp_exclude_comp_start = !!neg_opt; + + if (!param->lsp_is_specific && + param->lsp_stripe_offset == -1) { + char path[PATH_MAX] = ""; + + if (!lsb) { + lsb = malloc(sizeof(*lsb)); + if (!lsb) { + result = -ENOMEM; + break; + } + } + lsb->sb_count = 0; + + /* use mntdir for dirname() temporarily */ + strncpy(mntdir, dname, sizeof(mntdir)); + if (!realpath(dirname(mntdir), path)) { + result = -errno; + fprintf(stderr, + "error: invalid path '%s': %s\n", + argv[optind], strerror(errno)); + break; + } + mntdir[0] = '\0'; + + result = llapi_search_mounts(path, 0, mntdir, + NULL); + if (result < 0 || mntdir[0] == '\0') { + fprintf(stderr, + "No suitable Lustre mount found\n"); + break; + } + + result = mntdf(mntdir, NULL, NULL, 0, + LL_STATFS_LMV, lsb); + if (result < 0) + break; + + if (param->lsp_stripe_count > lsb->sb_count) { + fprintf(stderr, + "error: stripe count %d is too big\n", + param->lsp_stripe_count); + result = -ERANGE; + break; + } + + qsort(lsb->sb_buf, lsb->sb_count, + sizeof(struct ll_statfs_data), + ll_statfs_data_comp); + + auto_distributed = true; + } + + if (auto_distributed) { + int r; + int nr = MAX(param->lsp_stripe_count, + lsb->sb_count / 2); + + /* don't use server whose usage is above 90% */ + while (nr != param->lsp_stripe_count && + obd_statfs_ratio(&lsb->sb_buf[nr].sd_st) + > 90) + nr = MAX(param->lsp_stripe_count, + nr / 2); + + /* get \a r between [0, nr) */ + r = rand() % nr; + + param->lsp_stripe_offset = + lsb->sb_buf[r].sd_index; + if (param->lsp_stripe_count > 1) { + int i = 0; + + param->lsp_is_specific = true; + for (; i < param->lsp_stripe_count; i++) + param->lsp_tgts[(i + r) % nr] = + lsb->sb_buf[i].sd_index; + } + } + + result = llapi_dir_create(dname, mode, param); + } + + if (result) { + fprintf(stderr, + "%s setdirstripe: cannot create stripe dir '%s': %s\n", + progname, dname, strerror(-result)); break; - case 'c': - if (optarg[0] == '+') { - param.fp_stripe_count_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_stripe_count_sign = 1; - optarg++; - } + } + dname = argv[++optind]; + } while (dname != NULL); - param.fp_stripe_count = strtoul(optarg, &endptr, 0); - if (*endptr != '\0') { - fprintf(stderr,"error: bad stripe_count '%s'\n", - optarg); - ret = -1; - goto err; - } - param.fp_check_stripe_count = 1; - param.fp_exclude_stripe_count = !!neg_opt; - break; - case 'D': - param.fp_max_depth = strtol(optarg, 0, 0); + if (mode_opt != NULL) + umask(previous_mode); + + free(lsb); + free(param); + return result; +} + +/* functions */ +static int lfs_rmentry(int argc, char **argv) +{ + char *dname; + int index; + int result = 0; + + if (argc <= 1) { + fprintf(stderr, "error: %s: missing dirname\n", + argv[0]); + return CMD_HELP; + } + + index = 1; + dname = argv[index]; + while (dname != NULL) { + result = llapi_direntry_remove(dname); + if (result) { + fprintf(stderr, "error: %s: remove dir entry '%s' " + "failed\n", argv[0], dname); break; - case 'E': - if (optarg[0] == '+') { - param.fp_comp_end_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_comp_end_sign = 1; - optarg++; + } + dname = argv[++index]; + } + return result; +} + +static int lfs_mv(int argc, char **argv) +{ + struct find_param param = { + .fp_max_depth = -1, + .fp_mdt_index = -1, + }; + char *end; + int c; + int rc = 0; + struct option long_opts[] = { + { .val = 'm', .name = "mdt-index", .has_arg = required_argument }, + { .val = 'v', .name = "verbose", .has_arg = no_argument }, + { .name = NULL } }; + + while ((c = getopt_long(argc, argv, "m:M:v", long_opts, NULL)) != -1) { + switch (c) { +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + case 'M': + fprintf(stderr, "warning: '-M' deprecated" + ", use '--mdt-index' or '-m' instead\n"); +#endif + case 'm': + param.fp_mdt_index = strtoul(optarg, &end, 0); + if (*end != '\0') { + fprintf(stderr, "%s mv: bad MDT index '%s'\n", + progname, optarg); + return CMD_HELP; } + break; + case 'v': + param.fp_verbose = VERBOSE_DETAIL; + break; + default: + fprintf(stderr, "%s mv: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; + } + } + + if (param.fp_mdt_index == -1) { + fprintf(stderr, "%s mv: MDT index must be specified\n", + progname); + return CMD_HELP; + } + + if (optind >= argc) { + fprintf(stderr, "%s mv: DIR must be specified\n", progname); + return CMD_HELP; + } + + param.fp_migrate = 1; + rc = llapi_migrate_mdt(argv[optind], ¶m); + if (rc != 0) + fprintf(stderr, "%s mv: cannot migrate '%s' to MDT%04x: %s\n", + progname, argv[optind], param.fp_mdt_index, + strerror(-rc)); + return rc; +} + +static int lfs_osts(int argc, char **argv) +{ + return lfs_tgts(argc, argv); +} + +static int lfs_mdts(int argc, char **argv) +{ + return lfs_tgts(argc, argv); +} + +static int lfs_df(int argc, char **argv) +{ + char mntdir[PATH_MAX] = {'\0'}, path[PATH_MAX] = {'\0'}; + enum mntdf_flags flags = MNTDF_SHOW; + int ops = LL_STATFS_LMV | LL_STATFS_LOV; + int c, rc = 0, index = 0; + char fsname[PATH_MAX] = "", *pool_name = NULL; + struct option long_opts[] = { + { .val = 'h', .name = "human-readable", + .has_arg = no_argument }, + { .val = 'i', .name = "inodes", .has_arg = no_argument }, + { .val = 'l', .name = "lazy", .has_arg = no_argument }, + { .val = 'p', .name = "pool", .has_arg = required_argument }, + { .val = 'v', .name = "verbose", .has_arg = no_argument }, + { .name = NULL} }; - if (arg_is_eof(optarg)) { - param.fp_comp_end = LUSTRE_EOF; - param.fp_comp_end_units = 1; - rc = 0; - } else { - rc = llapi_parse_size(optarg, - ¶m.fp_comp_end, - ¶m.fp_comp_end_units, 0); - } - if (rc) { - fprintf(stderr, "error: bad component end " - "'%s'\n", optarg); - goto err; - } - param.fp_check_comp_end = 1; - param.fp_exclude_comp_end = !!neg_opt; + while ((c = getopt_long(argc, argv, "hilp:v", long_opts, NULL)) != -1) { + switch (c) { + case 'h': + flags |= MNTDF_COOKED; break; - case 'g': - case 'G': - rc = name2gid(¶m.fp_gid, optarg); - if (rc) { - param.fp_gid = strtoul(optarg, &endptr, 10); - if (*endptr != '\0') { - fprintf(stderr, "Group/GID: %s cannot " - "be found.\n", optarg); - ret = -1; - goto err; - } - } - param.fp_exclude_gid = !!neg_opt; - param.fp_check_gid = 1; - break; - case 'H': - param.fp_hash_type = check_hashtype(optarg); - if (param.fp_hash_type == 0) { - fprintf(stderr, "error: bad hash_type '%s'\n", - optarg); - ret = -1; - goto err; - } - param.fp_check_hash_type = 1; - param.fp_exclude_hash_type = !!neg_opt; + case 'i': + flags |= MNTDF_INODES; break; - case 'L': - ret = name2layout(¶m.fp_layout, optarg); - if (ret) - goto err; - param.fp_exclude_layout = !!neg_opt; - param.fp_check_layout = 1; + case 'l': + flags |= MNTDF_LAZY; break; - case 'u': - case 'U': - rc = name2uid(¶m.fp_uid, optarg); - if (rc) { - param.fp_uid = strtoul(optarg, &endptr, 10); - if (*endptr != '\0') { - fprintf(stderr, "User/UID: %s cannot " - "be found.\n", optarg); - ret = -1; - goto err; - } + case 'p': + pool_name = optarg; + break; + case 'v': + flags |= MNTDF_VERBOSE; + break; + default: + return CMD_HELP; + } + } + if (optind < argc && !realpath(argv[optind], path)) { + rc = -errno; + fprintf(stderr, "error: invalid path '%s': %s\n", + argv[optind], strerror(-rc)); + return rc; + } + + while (!llapi_search_mounts(path, index++, mntdir, fsname)) { + /* Check if we have a mount point */ + if (mntdir[0] == '\0') + continue; + + rc = mntdf(mntdir, fsname, pool_name, flags, ops, NULL); + if (rc || path[0] != '\0') + break; + fsname[0] = '\0'; /* avoid matching in next loop */ + mntdir[0] = '\0'; /* avoid matching in next loop */ + } + + return rc; +} + +static int lfs_getname(int argc, char **argv) +{ + char mntdir[PATH_MAX] = "", path[PATH_MAX] = "", fsname[PATH_MAX] = ""; + int rc = 0, index = 0, c; + char buf[sizeof(struct obd_uuid)]; + + while ((c = getopt(argc, argv, "h")) != -1) + return CMD_HELP; + + if (optind == argc) { /* no paths specified, get all paths. */ + while (!llapi_search_mounts(path, index++, mntdir, fsname)) { + rc = llapi_getname(mntdir, buf, sizeof(buf)); + if (rc < 0) { + fprintf(stderr, + "cannot get name for `%s': %s\n", + mntdir, strerror(-rc)); + break; } - param.fp_exclude_uid = !!neg_opt; - param.fp_check_uid = 1; - break; - case LFS_POOL_OPT: - if (strlen(optarg) > LOV_MAXPOOLNAME) { + + printf("%s %s\n", buf, mntdir); + + path[0] = fsname[0] = mntdir[0] = 0; + } + } else { /* paths specified, only attempt to search these. */ + for (; optind < argc; optind++) { + rc = llapi_getname(argv[optind], buf, sizeof(buf)); + if (rc < 0) { fprintf(stderr, - "Pool name %s is too long" - " (max is %d)\n", optarg, - LOV_MAXPOOLNAME); - ret = -1; - goto err; + "cannot get name for `%s': %s\n", + argv[optind], strerror(-rc)); + break; } - /* we do check for empty pool because empty pool - * is used to find V1 lov attributes */ - strncpy(param.fp_poolname, optarg, LOV_MAXPOOLNAME); - param.fp_poolname[LOV_MAXPOOLNAME] = '\0'; - param.fp_exclude_pool = !!neg_opt; - param.fp_check_pool = 1; - break; - case 'n': - param.fp_pattern = (char *)optarg; - param.fp_exclude_pattern = !!neg_opt; - break; - case 'm': - case 'i': - case 'O': { - char *buf, *token, *next, *p; - int len = 1; - void *tmp; - buf = strdup(optarg); - if (buf == NULL) { - ret = -ENOMEM; - goto err; - } + printf("%s %s\n", buf, argv[optind]); + } + } + return rc; +} + +static int lfs_check(int argc, char **argv) +{ + int rc; + char mntdir[PATH_MAX] = {'\0'}; + int num_types = 1; + char *obd_types[2]; + char obd_type1[4]; + char obd_type2[4]; + + if (argc != 2) { + fprintf(stderr, "%s check: server type must be specified\n", + progname); + return CMD_HELP; + } + + obd_types[0] = obd_type1; + obd_types[1] = obd_type2; + + if (strcmp(argv[1], "osts") == 0) { + strcpy(obd_types[0], "osc"); + } else if (strcmp(argv[1], "mds") == 0) { + strcpy(obd_types[0], "mdc"); + } else if (strcmp(argv[1], "servers") == 0) { + num_types = 2; + strcpy(obd_types[0], "osc"); + strcpy(obd_types[1], "mdc"); + } else { + fprintf(stderr, "%s check: unrecognized option '%s'\n", + progname, argv[1]); + return CMD_HELP; + } + + rc = llapi_search_mounts(NULL, 0, mntdir, NULL); + if (rc < 0 || mntdir[0] == '\0') { + fprintf(stderr, + "%s check: cannot find mounted Lustre filesystem: %s\n", + progname, (rc < 0) ? strerror(-rc) : strerror(ENODEV)); + return rc; + } + + rc = llapi_target_check(num_types, obd_types, mntdir); + if (rc) + fprintf(stderr, "%s check: cannot check target '%s': %s\n", + progname, argv[1], strerror(-rc)); + + return rc; + +} + +#ifdef HAVE_SYS_QUOTA_H +#define ARG2INT(nr, str, msg) \ +do { \ + char *endp; \ + nr = strtol(str, &endp, 0); \ + if (*endp != '\0') { \ + fprintf(stderr, "%s: bad %s '%s'\n", \ + progname, msg, str); \ + return CMD_HELP; \ + } \ +} while (0) + +#define ADD_OVERFLOW(a,b) ((a + b) < a) ? (a = ULONG_MAX) : (a = a + b) + +/* Convert format time string "XXwXXdXXhXXmXXs" into seconds value + * returns the value or ULONG_MAX on integer overflow or incorrect format + * Notes: + * 1. the order of specifiers is arbitrary (may be: 5w3s or 3s5w) + * 2. specifiers may be encountered multiple times (2s3s is 5 seconds) + * 3. empty integer value is interpreted as 0 + */ +static unsigned long str2sec(const char* timestr) +{ + const char spec[] = "smhdw"; + const unsigned long mult[] = {1, 60, 60*60, 24*60*60, 7*24*60*60}; + unsigned long val = 0; + char *tail; + + if (strpbrk(timestr, spec) == NULL) { + /* no specifiers inside the time string, + should treat it as an integer value */ + val = strtoul(timestr, &tail, 10); + return *tail ? ULONG_MAX : val; + } + + /* format string is XXwXXdXXhXXmXXs */ + while (*timestr) { + unsigned long v; + int ind; + char* ptr; + + v = strtoul(timestr, &tail, 10); + if (v == ULONG_MAX || *tail == '\0') + /* value too large (ULONG_MAX or more) + or missing specifier */ + goto error; + + ptr = strchr(spec, *tail); + if (ptr == NULL) + /* unknown specifier */ + goto error; + + ind = ptr - spec; + + /* check if product will overflow the type */ + if (!(v < ULONG_MAX / mult[ind])) + goto error; + + ADD_OVERFLOW(val, mult[ind] * v); + if (val == ULONG_MAX) + goto error; + + timestr = tail + 1; + } + + return val; - param.fp_exclude_obd = !!neg_opt; +error: + return ULONG_MAX; +} - token = buf; - while (token && *token) { - token = strchr(token, ','); - if (token) { - len++; - token++; - } - } - if (c == 'm') { - param.fp_exclude_mdt = !!neg_opt; - param.fp_num_alloc_mdts += len; - tmp = realloc(param.fp_mdt_uuid, - param.fp_num_alloc_mdts * - sizeof(*param.fp_mdt_uuid)); - if (tmp == NULL) { - ret = -ENOMEM; - goto err_free; - } +#define ARG2ULL(nr, str, def_units) \ +do { \ + unsigned long long limit, units = def_units; \ + int rc; \ + \ + rc = llapi_parse_size(str, &limit, &units, 1); \ + if (rc < 0) { \ + fprintf(stderr, "%s: invalid limit '%s'\n", \ + progname, str); \ + return CMD_HELP; \ + } \ + nr = limit; \ +} while (0) - param.fp_mdt_uuid = tmp; - } else { - param.fp_exclude_obd = !!neg_opt; - param.fp_num_alloc_obds += len; - tmp = realloc(param.fp_obd_uuid, - param.fp_num_alloc_obds * - sizeof(*param.fp_obd_uuid)); - if (tmp == NULL) { - ret = -ENOMEM; - goto err_free; - } +static inline int has_times_option(int argc, char **argv) +{ + int i; - param.fp_obd_uuid = tmp; - } - for (token = buf; token && *token; token = next) { - struct obd_uuid *puuid; - if (c == 'm') { - puuid = - ¶m.fp_mdt_uuid[param.fp_num_mdts++]; - } else { - puuid = - ¶m.fp_obd_uuid[param.fp_num_obds++]; - } - p = strchr(token, ','); - next = 0; - if (p) { - *p = 0; - next = p+1; - } + for (i = 1; i < argc; i++) + if (!strcmp(argv[i], "-t")) + return 1; - if (strlen(token) > sizeof(puuid->uuid) - 1) { - ret = -E2BIG; - goto err_free; - } + return 0; +} - strncpy(puuid->uuid, token, - sizeof(puuid->uuid)); - } -err_free: - if (buf) - free(buf); - break; - } - case 'p': - param.fp_zero_end = 1; - break; - case 'P': - break; - case LFS_PROJID_OPT: - rc = name2projid(¶m.fp_projid, optarg); - if (rc) { - param.fp_projid = strtoul(optarg, &endptr, 10); - if (*endptr != '\0') { - fprintf(stderr, - "Invalid project ID: %s", - optarg); - ret = -1; - goto err; - } - } - param.fp_exclude_projid = !!neg_opt; - param.fp_check_projid = 1; - break; - case 's': - if (optarg[0] == '+') { - param.fp_size_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_size_sign = 1; - optarg++; - } +int lfs_setquota_times(int argc, char **argv) +{ + int c, rc; + struct if_quotactl qctl; + char *mnt, *obd_type = (char *)qctl.obd_type; + struct obd_dqblk *dqb = &qctl.qc_dqblk; + struct obd_dqinfo *dqi = &qctl.qc_dqinfo; + struct option long_opts[] = { + { .val = 'b', .name = "block-grace", .has_arg = required_argument }, + { .val = 'g', .name = "group", .has_arg = no_argument }, + { .val = 'i', .name = "inode-grace", .has_arg = required_argument }, + { .val = 'p', .name = "projid", .has_arg = no_argument }, + { .val = 't', .name = "times", .has_arg = no_argument }, + { .val = 'u', .name = "user", .has_arg = no_argument }, + { .name = NULL } }; + int qtype; - ret = llapi_parse_size(optarg, ¶m.fp_size, - ¶m.fp_size_units, 0); - if (ret) { - fprintf(stderr, "error: bad file size '%s'\n", - optarg); - goto err; - } - param.fp_check_size = 1; - param.fp_exclude_size = !!neg_opt; - break; - case 'S': - if (optarg[0] == '+') { - param.fp_stripe_size_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_stripe_size_sign = 1; - optarg++; - } + memset(&qctl, 0, sizeof(qctl)); + qctl.qc_cmd = LUSTRE_Q_SETINFO; + qctl.qc_type = ALLQUOTA; - ret = llapi_parse_size(optarg, ¶m.fp_stripe_size, - ¶m.fp_stripe_size_units, 0); - if (ret) { - fprintf(stderr, "error: bad stripe_size '%s'\n", - optarg); - goto err; + while ((c = getopt_long(argc, argv, "b:gi:ptu", + long_opts, NULL)) != -1) { + switch (c) { + case 'u': + qtype = USRQUOTA; + goto quota_type; + case 'g': + qtype = GRPQUOTA; + goto quota_type; + case 'p': + qtype = PRJQUOTA; +quota_type: + if (qctl.qc_type != ALLQUOTA) { + fprintf(stderr, "error: -u/g/p can't be used " + "more than once\n"); + return CMD_HELP; } - param.fp_check_stripe_size = 1; - param.fp_exclude_stripe_size = !!neg_opt; - break; - case 't': - param.fp_exclude_type = !!neg_opt; - switch (optarg[0]) { - case 'b': - param.fp_type = S_IFBLK; - break; - case 'c': - param.fp_type = S_IFCHR; - break; - case 'd': - param.fp_type = S_IFDIR; - break; - case 'f': - param.fp_type = S_IFREG; - break; - case 'l': - param.fp_type = S_IFLNK; - break; - case 'p': - param.fp_type = S_IFIFO; - break; - case 's': - param.fp_type = S_IFSOCK; - break; - default: - fprintf(stderr, "error: %s: bad type '%s'\n", - argv[0], optarg); - ret = CMD_HELP; - goto err; - }; + qctl.qc_type = qtype; break; - case 'T': - if (optarg[0] == '+') { - param.fp_mdt_count_sign = -1; - optarg++; - } else if (optarg[0] == '-') { - param.fp_mdt_count_sign = 1; - optarg++; - } + case 'b': + if ((dqi->dqi_bgrace = str2sec(optarg)) == ULONG_MAX) { + fprintf(stderr, "error: bad block-grace: %s\n", + optarg); + return CMD_HELP; + } + dqb->dqb_valid |= QIF_BTIME; + break; + case 'i': + if ((dqi->dqi_igrace = str2sec(optarg)) == ULONG_MAX) { + fprintf(stderr, "error: bad inode-grace: %s\n", + optarg); + return CMD_HELP; + } + dqb->dqb_valid |= QIF_ITIME; + break; + case 't': /* Yes, of course! */ + break; + default: /* getopt prints error message for us when opterr != 0 */ + return CMD_HELP; + } + } - param.fp_mdt_count = strtoul(optarg, &endptr, 0); - if (*endptr != '\0') { - fprintf(stderr, "error: bad mdt_count '%s'\n", - optarg); - ret = -1; - goto err; - } - param.fp_check_mdt_count = 1; - param.fp_exclude_mdt_count = !!neg_opt; - break; - default: - ret = CMD_HELP; - goto err; - }; + if (qctl.qc_type == ALLQUOTA) { + fprintf(stderr, "error: neither -u, -g nor -p specified\n"); + return CMD_HELP; } - if (pathstart == -1) { - fprintf(stderr, "error: %s: no filename|pathname\n", - argv[0]); - ret = CMD_HELP; - goto err; - } else if (pathend == -1) { - /* no options */ - pathend = argc; + if (optind != argc - 1) { + fprintf(stderr, "error: unexpected parameters encountered\n"); + return CMD_HELP; } - do { - rc = llapi_find(argv[pathstart], ¶m); - if (rc != 0 && ret == 0) - ret = rc; - } while (++pathstart < pathend); - - if (ret) - fprintf(stderr, "error: %s failed for %s.\n", - argv[0], argv[optind - 1]); -err: - if (param.fp_obd_uuid && param.fp_num_alloc_obds) - free(param.fp_obd_uuid); + if ((dqb->dqb_valid | QIF_BTIME && dqi->dqi_bgrace >= UINT_MAX) || + (dqb->dqb_valid | QIF_ITIME && dqi->dqi_igrace >= UINT_MAX)) { + fprintf(stderr, "error: grace time is too large\n"); + return CMD_HELP; + } - if (param.fp_mdt_uuid && param.fp_num_alloc_mdts) - free(param.fp_mdt_uuid); + mnt = argv[optind]; + rc = llapi_quotactl(mnt, &qctl); + if (rc) { + if (*obd_type) + fprintf(stderr, "%s %s ", obd_type, + obd_uuid2str(&qctl.obd_uuid)); + fprintf(stderr, "setquota failed: %s\n", strerror(-rc)); + return rc; + } - return ret; + return 0; } -static int lfs_getstripe_internal(int argc, char **argv, - struct find_param *param) +#define BSLIMIT (1 << 0) +#define BHLIMIT (1 << 1) +#define ISLIMIT (1 << 2) +#define IHLIMIT (1 << 3) + +int lfs_setquota(int argc, char **argv) { + int c, rc = 0; + struct if_quotactl qctl; + char *mnt, *obd_type = (char *)qctl.obd_type; + struct obd_dqblk *dqb = &qctl.qc_dqblk; struct option long_opts[] = { - { .val = LFS_COMP_COUNT_OPT, - .name = "comp-count", .has_arg = no_argument }, - { .val = LFS_COMP_COUNT_OPT, - .name = "component-count", .has_arg = no_argument }, - { .val = LFS_COMP_FLAGS_OPT, - .name = "comp-flags", .has_arg = optional_argument }, - { .val = LFS_COMP_FLAGS_OPT, - .name = "component-flags", .has_arg = optional_argument }, - { .val = LFS_COMP_START_OPT, - .name = "comp-start", .has_arg = optional_argument }, - { .val = LFS_COMP_START_OPT, - .name = "component-start", .has_arg = optional_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "stripe-count", but was explicitly - * made "stripe-count" for consistency with other options, - * and to separate it from "mdt-count" when DNE arrives. */ - { .val = 'c', .name = "count", .has_arg = no_argument }, -#endif - { .val = 'c', .name = "stripe-count", .has_arg = no_argument }, - { .val = 'c', .name = "stripe_count", .has_arg = no_argument }, - { .val = 'd', .name = "directory", .has_arg = no_argument }, - { .val = 'D', .name = "default", .has_arg = no_argument }, - { .val = 'E', .name = "comp-end", .has_arg = optional_argument }, - { .val = 'E', .name = "component-end", - .has_arg = optional_argument }, - { .val = 'F', .name = "fid", .has_arg = no_argument }, - { .val = 'g', .name = "generation", .has_arg = no_argument }, - /* dirstripe { .val = 'H', .name = "mdt-hash", - * .has_arg = required_argument }, */ -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "stripe-index", but was explicitly - * made "stripe-index" for consistency with other options, - * and to separate it from "mdt-index" when DNE arrives. */ - { .val = 'i', .name = "index", .has_arg = no_argument }, -#endif - { .val = 'i', .name = "stripe-index", .has_arg = no_argument }, - { .val = 'i', .name = "stripe_index", .has_arg = no_argument }, - { .val = 'I', .name = "comp-id", .has_arg = optional_argument }, - { .val = 'I', .name = "component-id", .has_arg = optional_argument }, - { .val = 'L', .name = "layout", .has_arg = no_argument }, - { .val = 'm', .name = "mdt", .has_arg = no_argument }, - { .val = 'm', .name = "mdt-index", .has_arg = no_argument }, - { .val = 'm', .name = "mdt_index", .has_arg = no_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 'M', .name = "mdt-index", .has_arg = no_argument }, - { .val = 'M', .name = "mdt_index", .has_arg = no_argument }, -#endif -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "stripe-index", but was confusing - * with "file offset" (which will eventually be needed for - * with different layouts by offset), so deprecate it. */ - { .val = 'o', .name = "offset", .has_arg = no_argument }, -#endif - { .val = 'O', .name = "obd", .has_arg = required_argument }, - { .val = 'O', .name = "ost", .has_arg = required_argument }, - { .val = 'p', .name = "pool", .has_arg = no_argument }, - { .val = 'q', .name = "quiet", .has_arg = no_argument }, - { .val = 'r', .name = "recursive", .has_arg = no_argument }, - { .val = 'R', .name = "raw", .has_arg = no_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - /* This formerly implied "--stripe-size", but was confusing - * with "lfs find --size|-s", which means "file size", so use - * the consistent "--stripe-size|-S" for all commands. */ - { .val = 's', .name = "size", .has_arg = no_argument }, -#endif - { .val = 'S', .name = "stripe-size", .has_arg = no_argument }, - { .val = 'S', .name = "stripe_size", .has_arg = no_argument }, - /* dirstripe { .val = 'T', .name = "mdt-count", - * .has_arg = required_argument }, */ - { .val = 'v', .name = "verbose", .has_arg = no_argument }, - { .val = 'y', .name = "yaml", .has_arg = no_argument }, + { .val = 'b', .name = "block-softlimit", + .has_arg = required_argument }, + { .val = 'B', .name = "block-hardlimit", + .has_arg = required_argument }, + { .val = 'd', .name = "default", .has_arg = no_argument }, + { .val = 'g', .name = "group", .has_arg = required_argument }, + { .val = 'G', .name = "default-grp", .has_arg = no_argument }, + { .val = 'i', .name = "inode-softlimit", + .has_arg = required_argument }, + { .val = 'I', .name = "inode-hardlimit", + .has_arg = required_argument }, + { .val = 'p', .name = "projid", .has_arg = required_argument }, + { .val = 'P', .name = "default-prj", .has_arg = no_argument }, + { .val = 'u', .name = "user", .has_arg = required_argument }, + { .val = 'U', .name = "default-usr", .has_arg = no_argument }, { .name = NULL } }; - int c, rc; - char *end, *tmp; + unsigned limit_mask = 0; + char *endptr; + bool use_default = false; + int qtype; - while ((c = getopt_long(argc, argv, "cdDE::FghiI::LmMoO:pqrRsSvy", - long_opts, NULL)) != -1) { - switch (c) { - case 'c': - if (strcmp(argv[optind - 1], "--count") == 0) - fprintf(stderr, "warning: '--count' deprecated," - " use '--stripe-count' instead\n"); - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_COUNT; - param->fp_max_depth = 0; - } - break; - case LFS_COMP_COUNT_OPT: - param->fp_verbose |= VERBOSE_COMP_COUNT; - param->fp_max_depth = 0; - break; - case LFS_COMP_FLAGS_OPT: - if (optarg != NULL) { - __u32 *flags = ¶m->fp_comp_flags; - rc = comp_str2flags(flags, optarg); - if (rc != 0) { - fprintf(stderr, "error: %s bad " - "component flags '%s'.\n", - argv[0], optarg); - return CMD_HELP; - } else { - param->fp_check_comp_flags = 1; - param->fp_exclude_comp_flags = - comp_flags_is_neg(*flags); - comp_flags_clear_neg(flags); - } - } else { - param->fp_verbose |= VERBOSE_COMP_FLAGS; - param->fp_max_depth = 0; - } - break; - case LFS_COMP_START_OPT: - if (optarg != NULL) { - tmp = optarg; - if (tmp[0] == '+') { - param->fp_comp_start_sign = -1; - tmp++; - } else if (tmp[0] == '-') { - param->fp_comp_start_sign = 1; - tmp++; - } - rc = llapi_parse_size(tmp, - ¶m->fp_comp_start, - ¶m->fp_comp_start_units, 0); - if (rc != 0) { - fprintf(stderr, "error: %s bad " - "component start '%s'.\n", - argv[0], tmp); - return CMD_HELP; - } else { - param->fp_check_comp_start = 1; - } - } else { - param->fp_verbose |= VERBOSE_COMP_START; - param->fp_max_depth = 0; - } - break; - case 'd': - param->fp_max_depth = 0; - break; - case 'D': - param->fp_get_default_lmv = 1; - break; - case 'E': - if (optarg != NULL) { - tmp = optarg; - if (tmp[0] == '+') { - param->fp_comp_end_sign = -1; - tmp++; - } else if (tmp[0] == '-') { - param->fp_comp_end_sign = 1; - tmp++; - } + if (has_times_option(argc, argv)) + return lfs_setquota_times(argc, argv); - if (arg_is_eof(tmp)) { - param->fp_comp_end = LUSTRE_EOF; - param->fp_comp_end_units = 1; - rc = 0; - } else { - rc = llapi_parse_size(tmp, - ¶m->fp_comp_end, - ¶m->fp_comp_end_units, 0); - } - if (rc != 0) { - fprintf(stderr, "error: %s bad " - "component end '%s'.\n", - argv[0], tmp); - return CMD_HELP; - } - param->fp_check_comp_end = 1; - } else { - param->fp_verbose |= VERBOSE_COMP_END; - param->fp_max_depth = 0; - } - break; - case 'F': - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_DFID; - param->fp_max_depth = 0; - } - break; - case 'g': - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_GENERATION; - param->fp_max_depth = 0; - } - break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - case 'o': - fprintf(stderr, "warning: '--offset|-o' deprecated, " - "use '--stripe-index|-i' instead\n"); -#endif - case 'i': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 6, 53, 0) - if (strcmp(argv[optind - 1], "--index") == 0) - fprintf(stderr, "warning: '--index' deprecated" - ", use '--stripe-index' instead\n"); -#endif - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_OFFSET; - param->fp_max_depth = 0; - } - break; - case 'I': - if (optarg != NULL) { - param->fp_comp_id = strtoul(optarg, &end, 0); - if (*end != '\0' || param->fp_comp_id == 0 || - param->fp_comp_id > LCME_ID_MAX) { - fprintf(stderr, "error: %s bad " - "component id '%s'\n", - argv[0], optarg); - return CMD_HELP; - } else { - param->fp_check_comp_id = 1; + memset(&qctl, 0, sizeof(qctl)); + qctl.qc_cmd = LUSTRE_Q_SETQUOTA; + qctl.qc_type = ALLQUOTA; /* ALLQUOTA makes no sense for setquota, + * so it can be used as a marker that qc_type + * isn't reinitialized from command line */ + + while ((c = getopt_long(argc, argv, "b:B:dg:Gi:I:p:Pu:U", + long_opts, NULL)) != -1) { + switch (c) { + case 'U': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + qtype = USRQUOTA; + qctl.qc_id = 0; + goto quota_type_def; + case 'u': + qtype = USRQUOTA; + rc = name2uid(&qctl.qc_id, optarg); + goto quota_type; + case 'G': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + qtype = GRPQUOTA; + qctl.qc_id = 0; + goto quota_type_def; + case 'g': + qtype = GRPQUOTA; + rc = name2gid(&qctl.qc_id, optarg); + goto quota_type; + case 'P': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + qtype = PRJQUOTA; + qctl.qc_id = 0; + goto quota_type_def; + case 'p': + qtype = PRJQUOTA; + rc = name2projid(&qctl.qc_id, optarg); +quota_type: + if (rc) { + qctl.qc_id = strtoul(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, "%s setquota: invalid" + " id '%s'\n", progname, optarg); + return -1; } - } else { - param->fp_max_depth = 0; - param->fp_verbose |= VERBOSE_COMP_ID; } - break; - case 'L': - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_LAYOUT; - param->fp_max_depth = 0; + + if (qctl.qc_id == 0) { + fprintf(stderr, "%s setquota: can't set quota" + " for root usr/group/project.\n", + progname); + return -1; } - break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - case 'M': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 11, 53, 0) - fprintf(stderr, "warning: '-M' deprecated" - ", use '-m' instead\n"); -#endif -#endif - case 'm': - if (!(param->fp_verbose & VERBOSE_DETAIL)) - param->fp_max_depth = 0; - param->fp_verbose |= VERBOSE_MDTINDEX; - break; - case 'O': - if (param->fp_obd_uuid) { + +quota_type_def: + if (qctl.qc_type != ALLQUOTA) { fprintf(stderr, - "error: %s: only one obduuid allowed", - argv[0]); + "%s setquota: only one of -u, -U, -g," + " -G, -p or -P may be specified\n", + progname); return CMD_HELP; } - param->fp_obd_uuid = (struct obd_uuid *)optarg; - break; - case 'p': - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_POOL; - param->fp_max_depth = 0; - } - break; - case 'q': - param->fp_quiet++; + qctl.qc_type = qtype; break; - case 'r': - param->fp_recursive = 1; + case 'd': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + use_default = true; break; - case 'R': - param->fp_raw = 1; + case 'b': + ARG2ULL(dqb->dqb_bsoftlimit, optarg, 1024); + dqb->dqb_bsoftlimit >>= 10; + limit_mask |= BSLIMIT; + if (dqb->dqb_bsoftlimit && + dqb->dqb_bsoftlimit <= 1024) /* <= 1M? */ + fprintf(stderr, + "%s setquota: warning: block softlimit '%llu' smaller than minimum qunit size\n" + "See '%s help setquota' or Lustre manual for details\n", + progname, dqb->dqb_bsoftlimit, + progname); break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) - case 's': - fprintf(stderr, "warning: '--size|-s' deprecated, " - "use '--stripe-size|-S' instead\n"); -#endif /* LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 9, 59, 0) */ - case 'S': - if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_SIZE; - param->fp_max_depth = 0; - } + case 'B': + ARG2ULL(dqb->dqb_bhardlimit, optarg, 1024); + dqb->dqb_bhardlimit >>= 10; + limit_mask |= BHLIMIT; + if (dqb->dqb_bhardlimit && + dqb->dqb_bhardlimit <= 1024) /* <= 1M? */ + fprintf(stderr, + "%s setquota: warning: block hardlimit '%llu' smaller than minimum qunit size\n" + "See '%s help setquota' or Lustre manual for details\n", + progname, dqb->dqb_bhardlimit, + progname); break; - case 'v': - param->fp_verbose = VERBOSE_DEFAULT | VERBOSE_DETAIL; + case 'i': + ARG2ULL(dqb->dqb_isoftlimit, optarg, 1); + limit_mask |= ISLIMIT; + if (dqb->dqb_isoftlimit && + dqb->dqb_isoftlimit <= 1024) /* <= 1K inodes? */ + fprintf(stderr, + "%s setquota: warning: inode softlimit '%llu' smaller than minimum qunit size\n" + "See '%s help setquota' or Lustre manual for details\n", + progname, dqb->dqb_isoftlimit, + progname); break; - case 'y': - param->fp_yaml = 1; + case 'I': + ARG2ULL(dqb->dqb_ihardlimit, optarg, 1); + limit_mask |= IHLIMIT; + if (dqb->dqb_ihardlimit && + dqb->dqb_ihardlimit <= 1024) /* <= 1K inodes? */ + fprintf(stderr, + "%s setquota: warning: inode hardlimit '%llu' smaller than minimum qunit size\n" + "See '%s help setquota' or Lustre manual for details\n", + progname, dqb->dqb_ihardlimit, + progname); break; default: + fprintf(stderr, + "%s setquota: unrecognized option '%s'\n", + progname, argv[optind - 1]); return CMD_HELP; } } - if (optind >= argc) - return CMD_HELP; + if (qctl.qc_type == ALLQUOTA) { + fprintf(stderr, + "%s setquota: either -u or -g must be specified\n", + progname); + return CMD_HELP; + } + + if (!use_default && limit_mask == 0) { + fprintf(stderr, + "%s setquota: at least one limit must be specified\n", + progname); + return CMD_HELP; + } + + if (use_default && limit_mask != 0) { + fprintf(stderr, + "%s setquota: limits should not be specified when" + " using default quota\n", + progname); + return CMD_HELP; + } + + if (use_default && qctl.qc_id == 0) { + fprintf(stderr, + "%s setquota: can not set default quota for root" + " user/group/project\n", + progname); + return CMD_HELP; + } + + if (optind != argc - 1) { + fprintf(stderr, + "%s setquota: filesystem not specified or unexpected argument '%s'\n", + progname, argv[optind]); + return CMD_HELP; + } + + mnt = argv[optind]; + + if (use_default) { + dqb->dqb_bhardlimit = 0; + dqb->dqb_bsoftlimit = 0; + dqb->dqb_ihardlimit = 0; + dqb->dqb_isoftlimit = 0; + dqb->dqb_itime = 0; + dqb->dqb_btime = 0; + dqb->dqb_valid |= QIF_LIMITS | QIF_TIMES; + } else if ((!(limit_mask & BHLIMIT) ^ !(limit_mask & BSLIMIT)) || + (!(limit_mask & IHLIMIT) ^ !(limit_mask & ISLIMIT))) { + /* sigh, we can't just set blimits/ilimits */ + struct if_quotactl tmp_qctl = {.qc_cmd = LUSTRE_Q_GETQUOTA, + .qc_type = qctl.qc_type, + .qc_id = qctl.qc_id}; + + rc = llapi_quotactl(mnt, &tmp_qctl); + if (rc < 0) + return rc; + + if (!(limit_mask & BHLIMIT)) + dqb->dqb_bhardlimit = tmp_qctl.qc_dqblk.dqb_bhardlimit; + if (!(limit_mask & BSLIMIT)) + dqb->dqb_bsoftlimit = tmp_qctl.qc_dqblk.dqb_bsoftlimit; + if (!(limit_mask & IHLIMIT)) + dqb->dqb_ihardlimit = tmp_qctl.qc_dqblk.dqb_ihardlimit; + if (!(limit_mask & ISLIMIT)) + dqb->dqb_isoftlimit = tmp_qctl.qc_dqblk.dqb_isoftlimit; + + /* Keep grace times if we have got no softlimit arguments */ + if ((limit_mask & BHLIMIT) && !(limit_mask & BSLIMIT)) { + dqb->dqb_valid |= QIF_BTIME; + dqb->dqb_btime = tmp_qctl.qc_dqblk.dqb_btime; + } + + if ((limit_mask & IHLIMIT) && !(limit_mask & ISLIMIT)) { + dqb->dqb_valid |= QIF_ITIME; + dqb->dqb_itime = tmp_qctl.qc_dqblk.dqb_itime; + } + } + + dqb->dqb_valid |= (limit_mask & (BHLIMIT | BSLIMIT)) ? QIF_BLIMITS : 0; + dqb->dqb_valid |= (limit_mask & (IHLIMIT | ISLIMIT)) ? QIF_ILIMITS : 0; + + rc = llapi_quotactl(mnt, &qctl); + if (rc) { + if (*obd_type) + fprintf(stderr, + "%s setquota: cannot quotactl '%s' '%s': %s", + progname, obd_type, + obd_uuid2str(&qctl.obd_uuid), strerror(-rc)); + return rc; + } + + return 0; +} + +/* Converts seconds value into format string + * result is returned in buf + * Notes: + * 1. result is in descenting order: 1w2d3h4m5s + * 2. zero fields are not filled (except for p. 3): 5d1s + * 3. zero seconds value is presented as "0s" + */ +static char * __sec2str(time_t seconds, char *buf) +{ + const char spec[] = "smhdw"; + const unsigned long mult[] = {1, 60, 60*60, 24*60*60, 7*24*60*60}; + unsigned long c; + char *tail = buf; + int i; + + for (i = sizeof(mult) / sizeof(mult[0]) - 1 ; i >= 0; i--) { + c = seconds / mult[i]; + + if (c > 0 || (i == 0 && buf == tail)) + tail += snprintf(tail, 40-(tail-buf), "%lu%c", c, spec[i]); + + seconds %= mult[i]; + } + + return tail; +} + +static void sec2str(time_t seconds, char *buf, int rc) +{ + char *tail = buf; + + if (rc) + *tail++ = '['; + + tail = __sec2str(seconds, tail); + + if (rc && tail - buf < 39) { + *tail++ = ']'; + *tail++ = 0; + } +} + +static void diff2str(time_t seconds, char *buf, time_t now) +{ + + buf[0] = 0; + if (!seconds) + return; + if (seconds <= now) { + strcpy(buf, "none"); + return; + } + __sec2str(seconds - now, buf); +} + +static void print_quota_title(char *name, struct if_quotactl *qctl, + bool human_readable, bool show_default) +{ + if (show_default) { + printf("Disk default %s quota:\n", qtype_name(qctl->qc_type)); + printf("%15s %8s%8s%8s %8s%8s%8s\n", + "Filesystem", "bquota", "blimit", "bgrace", + "iquota", "ilimit", "igrace"); + } else { + printf("Disk quotas for %s %s (%cid %u):\n", + qtype_name(qctl->qc_type), name, + *qtype_name(qctl->qc_type), qctl->qc_id); + printf("%15s%8s %7s%8s%8s%8s %7s%8s%8s\n", + "Filesystem", human_readable ? "used" : "kbytes", + "quota", "limit", "grace", + "files", "quota", "limit", "grace"); + } +} + +static void kbytes2str(__u64 num, char *buf, int buflen, bool h) +{ + if (!h) { + snprintf(buf, buflen, "%ju", (uintmax_t)num); + } else { + if (num >> 40) + snprintf(buf, buflen, "%5.4gP", + (double)num / ((__u64)1 << 40)); + else if (num >> 30) + snprintf(buf, buflen, "%5.4gT", + (double)num / (1 << 30)); + else if (num >> 20) + snprintf(buf, buflen, "%5.4gG", + (double)num / (1 << 20)); + else if (num >> 10) + snprintf(buf, buflen, "%5.4gM", + (double)num / (1 << 10)); + else + snprintf(buf, buflen, "%ju%s", (uintmax_t)num, "k"); + } +} + +#define STRBUF_LEN 32 +static void print_quota(char *mnt, struct if_quotactl *qctl, int type, + int rc, bool h, bool show_default) +{ + time_t now; + + time(&now); + + if (qctl->qc_cmd == LUSTRE_Q_GETQUOTA || qctl->qc_cmd == Q_GETOQUOTA || + qctl->qc_cmd == LUSTRE_Q_GETDEFAULT) { + int bover = 0, iover = 0; + struct obd_dqblk *dqb = &qctl->qc_dqblk; + char numbuf[3][STRBUF_LEN]; + char timebuf[40]; + char strbuf[STRBUF_LEN]; + + if (dqb->dqb_bhardlimit && + lustre_stoqb(dqb->dqb_curspace) >= dqb->dqb_bhardlimit) { + bover = 1; + } else if (dqb->dqb_bsoftlimit && dqb->dqb_btime) { + if (dqb->dqb_btime > now) { + bover = 2; + } else { + bover = 3; + } + } + + if (dqb->dqb_ihardlimit && + dqb->dqb_curinodes >= dqb->dqb_ihardlimit) { + iover = 1; + } else if (dqb->dqb_isoftlimit && dqb->dqb_itime) { + if (dqb->dqb_itime > now) { + iover = 2; + } else { + iover = 3; + } + } + + + if (strlen(mnt) > 15) + printf("%s\n%15s", mnt, ""); + else + printf("%15s", mnt); + + if (bover) + diff2str(dqb->dqb_btime, timebuf, now); + else if (show_default) + snprintf(timebuf, sizeof(timebuf), "%llu", + dqb->dqb_btime); + + kbytes2str(lustre_stoqb(dqb->dqb_curspace), + strbuf, sizeof(strbuf), h); + if (rc == -EREMOTEIO) + sprintf(numbuf[0], "%s*", strbuf); + else + sprintf(numbuf[0], (dqb->dqb_valid & QIF_SPACE) ? + "%s" : "[%s]", strbuf); + + kbytes2str(dqb->dqb_bsoftlimit, strbuf, sizeof(strbuf), h); + if (type == QC_GENERAL) + sprintf(numbuf[1], (dqb->dqb_valid & QIF_BLIMITS) ? + "%s" : "[%s]", strbuf); + else + sprintf(numbuf[1], "%s", "-"); + + kbytes2str(dqb->dqb_bhardlimit, strbuf, sizeof(strbuf), h); + sprintf(numbuf[2], (dqb->dqb_valid & QIF_BLIMITS) ? + "%s" : "[%s]", strbuf); + + if (show_default) + printf(" %6s %7s %7s", numbuf[1], numbuf[2], timebuf); + else + printf(" %7s%c %6s %7s %7s", + numbuf[0], bover ? '*' : ' ', numbuf[1], + numbuf[2], bover > 1 ? timebuf : "-"); - if (param->fp_recursive) - param->fp_max_depth = -1; - else if (param->fp_verbose & VERBOSE_DETAIL) - param->fp_max_depth = 1; - if (!param->fp_verbose) - param->fp_verbose = VERBOSE_DEFAULT; - if (param->fp_quiet) - param->fp_verbose = VERBOSE_OBJID; + if (iover) + diff2str(dqb->dqb_itime, timebuf, now); + else if (show_default) + snprintf(timebuf, sizeof(timebuf), "%llu", + dqb->dqb_itime); - do { - rc = llapi_getstripe(argv[optind], param); - } while (++optind < argc && !rc); + snprintf(numbuf[0], sizeof(numbuf), + (dqb->dqb_valid & QIF_INODES) ? "%ju" : "[%ju]", + (uintmax_t)dqb->dqb_curinodes); - if (rc) - fprintf(stderr, "error: %s failed for %s.\n", - argv[0], argv[optind - 1]); - return rc; -} + if (type == QC_GENERAL) + sprintf(numbuf[1], (dqb->dqb_valid & QIF_ILIMITS) ? + "%ju" : "[%ju]", + (uintmax_t)dqb->dqb_isoftlimit); + else + sprintf(numbuf[1], "%s", "-"); -static int lfs_tgts(int argc, char **argv) -{ - char mntdir[PATH_MAX] = {'\0'}, path[PATH_MAX] = {'\0'}; - struct find_param param; - int index = 0, rc=0; + sprintf(numbuf[2], (dqb->dqb_valid & QIF_ILIMITS) ? + "%ju" : "[%ju]", (uintmax_t)dqb->dqb_ihardlimit); - if (argc > 2) - return CMD_HELP; + if (show_default) + printf(" %6s %7s %7s", numbuf[1], numbuf[2], timebuf); + else if (type != QC_OSTIDX) + printf(" %7s%c %6s %7s %7s", + numbuf[0], iover ? '*' : ' ', numbuf[1], + numbuf[2], iover > 1 ? timebuf : "-"); + else + printf(" %7s %7s %7s %7s", "-", "-", "-", "-"); + printf("\n"); - if (argc == 2 && !realpath(argv[1], path)) { - rc = -errno; - fprintf(stderr, "error: invalid path '%s': %s\n", - argv[1], strerror(-rc)); - return rc; + } else if (qctl->qc_cmd == LUSTRE_Q_GETINFO || + qctl->qc_cmd == Q_GETOINFO) { + char bgtimebuf[40]; + char igtimebuf[40]; + + sec2str(qctl->qc_dqinfo.dqi_bgrace, bgtimebuf, rc); + sec2str(qctl->qc_dqinfo.dqi_igrace, igtimebuf, rc); + printf("Block grace time: %s; Inode grace time: %s\n", + bgtimebuf, igtimebuf); } +} - while (!llapi_search_mounts(path, index++, mntdir, NULL)) { - /* Check if we have a mount point */ - if (mntdir[0] == '\0') - continue; +static int print_obd_quota(char *mnt, struct if_quotactl *qctl, int is_mdt, + bool h, __u64 *total) +{ + int rc = 0, rc1 = 0, count = 0; + __u32 valid = qctl->qc_valid; - memset(¶m, 0, sizeof(param)); - if (!strcmp(argv[0], "mdts")) - param.fp_get_lmv = 1; + rc = llapi_get_obd_count(mnt, &count, is_mdt); + if (rc) { + fprintf(stderr, "can not get %s count: %s\n", + is_mdt ? "mdt": "ost", strerror(-rc)); + return rc; + } - rc = llapi_ostlist(mntdir, ¶m); + for (qctl->qc_idx = 0; qctl->qc_idx < count; qctl->qc_idx++) { + qctl->qc_valid = is_mdt ? QC_MDTIDX : QC_OSTIDX; + rc = llapi_quotactl(mnt, qctl); if (rc) { - fprintf(stderr, "error: %s: failed on %s\n", - argv[0], mntdir); + /* It is remote client case. */ + if (rc == -EOPNOTSUPP) { + rc = 0; + goto out; + } + + if (!rc1) + rc1 = rc; + fprintf(stderr, "quotactl %s%d failed.\n", + is_mdt ? "mdt": "ost", qctl->qc_idx); + continue; } - if (path[0] != '\0') - break; - memset(mntdir, 0, PATH_MAX); - } - return rc; + print_quota(obd_uuid2str(&qctl->obd_uuid), qctl, + qctl->qc_valid, 0, h, false); + *total += is_mdt ? qctl->qc_dqblk.dqb_ihardlimit : + qctl->qc_dqblk.dqb_bhardlimit; + } +out: + qctl->qc_valid = valid; + return rc ? : rc1; } -static int lfs_getstripe(int argc, char **argv) +static int get_print_quota(char *mnt, char *name, struct if_quotactl *qctl, + int verbose, int quiet, bool human_readable, + bool show_default) { - struct find_param param = { 0 }; + int rc1 = 0, rc2 = 0, rc3 = 0; + char *obd_type = (char *)qctl->obd_type; + char *obd_uuid = (char *)qctl->obd_uuid.uuid; + __u64 total_ialloc = 0, total_balloc = 0; + bool use_default_for_blk = false; + bool use_default_for_file = false; + int inacc; - param.fp_max_depth = 1; - return lfs_getstripe_internal(argc, argv, ¶m); -} + rc1 = llapi_quotactl(mnt, qctl); + if (rc1 < 0) { + switch (rc1) { + case -ESRCH: + fprintf(stderr, "%s quotas are not enabled.\n", + qtype_name(qctl->qc_type)); + goto out; + case -EPERM: + fprintf(stderr, "Permission denied.\n"); + case -ENODEV: + case -ENOENT: + /* We already got error message. */ + goto out; + default: + fprintf(stderr, "Unexpected quotactl error: %s\n", + strerror(-rc1)); + } + } -/* functions */ -static int lfs_getdirstripe(int argc, char **argv) -{ - struct find_param param = { 0 }; - struct option long_opts[] = { -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 'c', .name = "mdt-count", .has_arg = no_argument }, -#endif - { .val = 'D', .name = "default", .has_arg = no_argument }, - { .val = 'H', .name = "mdt-hash", .has_arg = no_argument }, - { .val = 'i', .name = "mdt-index", .has_arg = no_argument }, - { .val = 'O', .name = "obd", .has_arg = required_argument }, - { .val = 'r', .name = "recursive", .has_arg = no_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 't', .name = "mdt-hash", .has_arg = no_argument }, -#endif - { .val = 'T', .name = "mdt-count", .has_arg = no_argument }, - { .val = 'y', .name = "yaml", .has_arg = no_argument }, - { .name = NULL } }; - int c, rc; + if (!show_default && qctl->qc_id == 0) { + qctl->qc_dqblk.dqb_bhardlimit = 0; + qctl->qc_dqblk.dqb_bsoftlimit = 0; + qctl->qc_dqblk.dqb_ihardlimit = 0; + qctl->qc_dqblk.dqb_isoftlimit = 0; + qctl->qc_dqblk.dqb_btime = 0; + qctl->qc_dqblk.dqb_itime = 0; + qctl->qc_dqblk.dqb_valid |= QIF_LIMITS | QIF_TIMES; + } - param.fp_get_lmv = 1; + if (qctl->qc_dqblk.dqb_valid & QIF_BTIME && + LQUOTA_FLAG(qctl->qc_dqblk.dqb_btime) & LQUOTA_FLAG_DEFAULT) { + use_default_for_blk = true; + qctl->qc_dqblk.dqb_btime &= LQUOTA_GRACE_MASK; + } - while ((c = getopt_long(argc, argv, - "cDHiO:rtTy", long_opts, NULL)) != -1) - { - switch (c) { - case 'O': - if (param.fp_obd_uuid) { - fprintf(stderr, - "error: %s: only one obduuid allowed", - argv[0]); - return CMD_HELP; - } - param.fp_obd_uuid = (struct obd_uuid *)optarg; - break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - case 'c': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 10, 50, 0) - fprintf(stderr, "warning: '-c' deprecated" - ", use '-T' instead\n"); -#endif -#endif - case 'T': - param.fp_verbose |= VERBOSE_COUNT; - break; - case 'i': - param.fp_verbose |= VERBOSE_OFFSET; - break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - case 't': -#endif - case 'H': - param.fp_verbose |= VERBOSE_HASH_TYPE; - break; - case 'D': - param.fp_get_default_lmv = 1; - break; - case 'r': - param.fp_recursive = 1; - break; - case 'y': - param.fp_yaml = 1; - break; - default: - return CMD_HELP; - } + if (qctl->qc_dqblk.dqb_valid & QIF_ITIME && + LQUOTA_FLAG(qctl->qc_dqblk.dqb_itime) & LQUOTA_FLAG_DEFAULT) { + use_default_for_file = true; + qctl->qc_dqblk.dqb_itime &= LQUOTA_GRACE_MASK; } - if (optind >= argc) - return CMD_HELP; + if ((qctl->qc_cmd == LUSTRE_Q_GETQUOTA || + qctl->qc_cmd == LUSTRE_Q_GETDEFAULT) && !quiet) + print_quota_title(name, qctl, human_readable, show_default); - if (param.fp_recursive) - param.fp_max_depth = -1; + if (rc1 && *obd_type) + fprintf(stderr, "%s %s ", obd_type, obd_uuid); - if (!param.fp_verbose) - param.fp_verbose = VERBOSE_DEFAULT; + if (qctl->qc_valid != QC_GENERAL) + mnt = ""; - do { - rc = llapi_getstripe(argv[optind], ¶m); - } while (++optind < argc && !rc); + inacc = (qctl->qc_cmd == LUSTRE_Q_GETQUOTA) && + ((qctl->qc_dqblk.dqb_valid & (QIF_LIMITS|QIF_USAGE)) != + (QIF_LIMITS|QIF_USAGE)); + + print_quota(mnt, qctl, QC_GENERAL, rc1, human_readable, show_default); + + if (!show_default && verbose && + qctl->qc_valid == QC_GENERAL && qctl->qc_cmd != LUSTRE_Q_GETINFO) { + char strbuf[STRBUF_LEN]; + + rc2 = print_obd_quota(mnt, qctl, 1, human_readable, + &total_ialloc); + rc3 = print_obd_quota(mnt, qctl, 0, human_readable, + &total_balloc); + kbytes2str(total_balloc, strbuf, sizeof(strbuf), + human_readable); + printf("Total allocated inode limit: %ju, total " + "allocated block limit: %s\n", (uintmax_t)total_ialloc, + strbuf); + } + + if (use_default_for_blk) + printf("%cid %u is using default block quota setting\n", + *qtype_name(qctl->qc_type), qctl->qc_id); + + if (use_default_for_file) + printf("%cid %u is using default file quota setting\n", + *qtype_name(qctl->qc_type), qctl->qc_id); + + if (rc1 || rc2 || rc3 || inacc) + printf("Some errors happened when getting quota info. " + "Some devices may be not working or deactivated. " + "The data in \"[]\" is inaccurate.\n"); +out: + return rc1; - if (rc) - fprintf(stderr, "error: %s failed for %s.\n", - argv[0], argv[optind - 1]); - return rc; } -/* functions */ -static int lfs_setdirstripe(int argc, char **argv) +static int lfs_project(int argc, char **argv) { - char *dname; - int result; - unsigned int stripe_offset = -1; - unsigned int stripe_count = 1; - enum lmv_hash_type hash_type; - char *end; - int c; - char *stripe_offset_opt = NULL; - char *stripe_count_opt = NULL; - char *stripe_hash_opt = NULL; - char *mode_opt = NULL; - bool default_stripe = false; - mode_t mode = S_IRWXU | S_IRWXG | S_IRWXO; - mode_t previous_mode = 0; - bool delete = false; - - struct option long_opts[] = { -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 'c', .name = "count", .has_arg = required_argument }, -#endif - { .val = 'c', .name = "mdt-count", .has_arg = required_argument }, - { .val = 'd', .name = "delete", .has_arg = no_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 'i', .name = "index", .has_arg = required_argument }, -#endif - { .val = 'i', .name = "mdt-index", .has_arg = required_argument }, - { .val = 'm', .name = "mode", .has_arg = required_argument }, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 't', .name = "hash-type", .has_arg = required_argument }, - { .val = 't', .name = "mdt-hash", .has_arg = required_argument }, -#endif - {"mdt-hash", required_argument, 0, 'H'}, -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - { .val = 'D', .name = "default_stripe", - .has_arg = no_argument }, -#endif - { .val = 'D', .name = "default", .has_arg = no_argument }, - { .name = NULL } }; + int ret = 0, err = 0, c, i; + struct project_handle_control phc = { 0 }; + enum lfs_project_ops_t op; - while ((c = getopt_long(argc, argv, "c:dDi:H:m:t:", long_opts, - NULL)) >= 0) { + phc.newline = true; + phc.assign_projid = false; + /* default action */ + op = LFS_PROJECT_LIST; + + while ((c = getopt(argc, argv, "p:cCsdkr0")) != -1) { switch (c) { - case 0: - /* Long options. */ - break; case 'c': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 11, 53, 0) - if (strcmp(argv[optind - 1], "--count") == 0) + if (op != LFS_PROJECT_LIST) { fprintf(stderr, - "%s %s: warning: '--count' deprecated, use '--mdt-count' instead\n", - progname, argv[0]); -#endif - stripe_count_opt = optarg; + "%s: cannot specify '-c' '-C' '-s' together\n", + progname); + return CMD_HELP; + } + + op = LFS_PROJECT_CHECK; + break; + case 'C': + if (op != LFS_PROJECT_LIST) { + fprintf(stderr, + "%s: cannot specify '-c' '-C' '-s' together\n", + progname); + return CMD_HELP; + } + + op = LFS_PROJECT_CLEAR; + break; + case 's': + if (op != LFS_PROJECT_LIST) { + fprintf(stderr, + "%s: cannot specify '-c' '-C' '-s' together\n", + progname); + return CMD_HELP; + } + + phc.set_inherit = true; + op = LFS_PROJECT_SET; break; case 'd': - delete = true; - default_stripe = true; + phc.dironly = true; break; - case 'D': - default_stripe = true; + case 'k': + phc.keep_projid = true; break; - case 'i': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 11, 53, 0) - if (strcmp(argv[optind - 1], "--index") == 0) - fprintf(stderr, - "%s %s: warning: '--index' deprecated, use '--mdt-index' instead\n", - progname, argv[0]); -#endif - stripe_offset_opt = optarg; + case 'r': + phc.recursive = true; break; - case 'm': - mode_opt = optarg; + case 'p': + phc.projid = strtoul(optarg, NULL, 0); + phc.assign_projid = true; + break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - case 't': -#endif - case 'H': -#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 11, 53, 0) - if (strcmp(argv[optind - 1], "--hash-type") == 0) - fprintf(stderr, - "%s %s: warning: '--hash-type' deprecated, use '--mdt-hash' instead\n", - progname, argv[0]); -#endif - stripe_hash_opt = optarg; + case '0': + phc.newline = false; break; default: - fprintf(stderr, "%s %s: unrecognized option '%s'\n", - progname, argv[0], argv[optind - 1]); + fprintf(stderr, "%s: invalid option '%c'\n", + progname, optopt); return CMD_HELP; } } - if (optind == argc) { - fprintf(stderr, "%s %s: DIR must be specified\n", - progname, argv[0]); - return CMD_HELP; - } - - if (!delete && stripe_offset_opt == NULL && stripe_count_opt == NULL) { - fprintf(stderr, - "%s %s: stripe offset and count must be specified\n", - progname, argv[0]); - return CMD_HELP; + if (phc.assign_projid && op == LFS_PROJECT_LIST) { + op = LFS_PROJECT_SET; + phc.set_projid = true; + } else if (phc.assign_projid && op == LFS_PROJECT_SET) { + phc.set_projid = true; } - if (stripe_offset_opt != NULL) { - /* get the stripe offset */ - stripe_offset = strtoul(stripe_offset_opt, &end, 0); - if (*end != '\0') { + switch (op) { + case LFS_PROJECT_CHECK: + if (phc.keep_projid) { fprintf(stderr, - "%s %s: bad stripe offset '%s'\n", - progname, argv[0], stripe_offset_opt); + "%s: '-k' is useless together with '-c'\n", + progname); return CMD_HELP; } - } - - if (delete) { - if (stripe_offset_opt != NULL || stripe_count_opt != NULL) { + break; + case LFS_PROJECT_CLEAR: + if (!phc.newline) { fprintf(stderr, - "%s %s: cannot specify -d with -c or -i options\n", - progname, argv[0]); + "%s: '-0' is useless together with '-C'\n", + progname); return CMD_HELP; - } else { - stripe_count = 0; } - } - - - if (mode_opt != NULL) { - mode = strtoul(mode_opt, &end, 8); - if (*end != '\0') { + if (phc.assign_projid) { fprintf(stderr, - "%s %s: bad MODE '%s'\n", - progname, argv[0], mode_opt); + "%s: '-p' is useless together with '-C'\n", + progname); return CMD_HELP; } - previous_mode = umask(0); - } - - if (stripe_hash_opt == NULL) { - hash_type = LMV_HASH_TYPE_FNV_1A_64; - } else { - hash_type = check_hashtype(stripe_hash_opt); - if (hash_type == 0) { - fprintf(stderr, "%s %s: bad stripe hash type '%s'\n", - progname, argv[0], stripe_hash_opt); + break; + case LFS_PROJECT_SET: + if (!phc.newline) { + fprintf(stderr, + "%s: '-0' is useless together with '-s'\n", + progname); return CMD_HELP; } - } - - /* get the stripe count */ - if (stripe_count_opt != NULL) { - stripe_count = strtoul(stripe_count_opt, &end, 0); - if (*end != '\0') { + if (phc.keep_projid) { fprintf(stderr, - "%s %s: bad stripe count '%s'\n", - progname, argv[0], stripe_count_opt); + "%s: '-k' is useless together with '-s'\n", + progname); return CMD_HELP; } - } - - dname = argv[optind]; - do { - if (default_stripe) { - result = llapi_dir_set_default_lmv_stripe(dname, - stripe_offset, stripe_count, - hash_type, NULL); - } else { - result = llapi_dir_create_pool(dname, mode, - stripe_offset, - stripe_count, hash_type, - NULL); - } - - if (result) { + break; + default: + if (!phc.newline) { fprintf(stderr, - "%s setdirstripe: cannot create stripe dir '%s': %s\n", - progname, dname, strerror(-result)); - break; + "%s: '-0' is useless for list operations\n", + progname); + return CMD_HELP; } - dname = argv[++optind]; - } while (dname != NULL); - - if (mode_opt != NULL) - umask(previous_mode); - - return result; -} - -/* functions */ -static int lfs_rmentry(int argc, char **argv) -{ - char *dname; - int index; - int result = 0; + break; + } - if (argc <= 1) { - fprintf(stderr, "error: %s: missing dirname\n", - argv[0]); + argv += optind; + argc -= optind; + if (argc == 0) { + fprintf(stderr, "%s: missing file or directory target(s)\n", + progname); return CMD_HELP; } - index = 1; - dname = argv[index]; - while (dname != NULL) { - result = llapi_direntry_remove(dname); - if (result) { - fprintf(stderr, "error: %s: remove dir entry '%s' " - "failed\n", argv[0], dname); + for (i = 0; i < argc; i++) { + switch (op) { + case LFS_PROJECT_CHECK: + err = lfs_project_check(argv[i], &phc); break; - } - dname = argv[++index]; - } - return result; -} - -static int lfs_mv(int argc, char **argv) -{ - struct find_param param = { - .fp_max_depth = -1, - .fp_mdt_index = -1, - }; - char *end; - int c; - int rc = 0; - struct option long_opts[] = { - { .val = 'M', .name = "mdt-index", .has_arg = required_argument }, - { .val = 'v', .name = "verbose", .has_arg = no_argument }, - { .name = NULL } }; - - while ((c = getopt_long(argc, argv, "M:v", long_opts, NULL)) != -1) { - switch (c) { - case 'M': { - param.fp_mdt_index = strtoul(optarg, &end, 0); - if (*end != '\0') { - fprintf(stderr, "%s: invalid MDT index'%s'\n", - argv[0], optarg); - return CMD_HELP; - } + case LFS_PROJECT_LIST: + err = lfs_project_list(argv[i], &phc); break; - } - case 'v': { - param.fp_verbose = VERBOSE_DETAIL; + case LFS_PROJECT_CLEAR: + err = lfs_project_clear(argv[i], &phc); + break; + case LFS_PROJECT_SET: + err = lfs_project_set(argv[i], &phc); break; - } default: - fprintf(stderr, "error: %s: unrecognized option '%s'\n", - argv[0], argv[optind - 1]); - return CMD_HELP; + break; } + if (err && !ret) + ret = err; } - if (param.fp_mdt_index == -1) { - fprintf(stderr, "%s: MDT index must be specified\n", argv[0]); - return CMD_HELP; - } - - if (optind >= argc) { - fprintf(stderr, "%s: missing operand path\n", argv[0]); - return CMD_HELP; - } - - param.fp_migrate = 1; - rc = llapi_migrate_mdt(argv[optind], ¶m); - if (rc != 0) - fprintf(stderr, "%s: cannot migrate '%s' to MDT%04x: %s\n", - argv[0], argv[optind], param.fp_mdt_index, - strerror(-rc)); - return rc; -} - -static int lfs_osts(int argc, char **argv) -{ - return lfs_tgts(argc, argv); -} - -static int lfs_mdts(int argc, char **argv) -{ - return lfs_tgts(argc, argv); + return ret; } -#define COOK(value) \ -({ \ - int radix = 0; \ - while (value > 1024) { \ - value /= 1024; \ - radix++; \ - } \ - radix; \ -}) -#define UUF "%-20s" -#define CSF "%11s" -#define CDF "%11llu" -#define HDF "%8.1f%c" -#define RSF "%4s" -#define RDF "%3d%%" - -enum mntdf_flags { - MNTDF_INODES = 0x0001, - MNTDF_COOKED = 0x0002, - MNTDF_LAZY = 0x0004, - MNTDF_VERBOSE = 0x0008, -}; - -static int showdf(char *mntdir, struct obd_statfs *stat, - char *uuid, enum mntdf_flags flags, - char *type, int index, int rc) +static int lfs_quota(int argc, char **argv) { - long long avail, used, total; - double ratio = 0; - char *suffix = "KMGTPEZY"; - /* Note if we have >2^64 bytes/fs these buffers will need to be grown */ - char tbuf[3 * sizeof(__u64)]; - char ubuf[3 * sizeof(__u64)]; - char abuf[3 * sizeof(__u64)]; - char rbuf[3 * sizeof(__u64)]; - - if (!uuid || !stat) - return -EINVAL; - - switch (rc) { - case 0: - if (flags & MNTDF_INODES) { - avail = stat->os_ffree; - used = stat->os_files - stat->os_ffree; - total = stat->os_files; - } else { - int shift = flags & MNTDF_COOKED ? 0 : 10; + int c; + char *mnt, *name = NULL; + struct if_quotactl qctl = { .qc_cmd = LUSTRE_Q_GETQUOTA, + .qc_type = ALLQUOTA }; + char *obd_uuid = (char *)qctl.obd_uuid.uuid; + int rc = 0, rc1 = 0, verbose = 0, quiet = 0; + char *endptr; + __u32 valid = QC_GENERAL, idx = 0; + bool human_readable = false; + bool show_default = false; + int qtype; - avail = (stat->os_bavail * stat->os_bsize) >> shift; - used = ((stat->os_blocks - stat->os_bfree) * - stat->os_bsize) >> shift; - total = (stat->os_blocks * stat->os_bsize) >> shift; + while ((c = getopt(argc, argv, "gGi:I:o:pPqtuUvh")) != -1) { + switch (c) { + case 'U': + show_default = true; + case 'u': + qtype = USRQUOTA; + goto quota_type; + case 'G': + show_default = true; + case 'g': + qtype = GRPQUOTA; + goto quota_type; + case 'P': + show_default = true; + case 'p': + qtype = PRJQUOTA; +quota_type: + if (qctl.qc_type != ALLQUOTA) { + fprintf(stderr, + "%s quota: only one of -u, -g, or -p may be specified\n", + progname); + return CMD_HELP; + } + qctl.qc_type = qtype; + break; + case 't': + qctl.qc_cmd = LUSTRE_Q_GETINFO; + break; + case 'o': + valid = qctl.qc_valid = QC_UUID; + snprintf(obd_uuid, sizeof(qctl.obd_uuid), "%s", optarg); + break; + case 'i': + valid = qctl.qc_valid = QC_MDTIDX; + idx = qctl.qc_idx = atoi(optarg); + if (idx == 0 && *optarg != '0') { + fprintf(stderr, + "%s quota: invalid MDT index '%s'\n", + progname, optarg); + return CMD_HELP; + } + break; + case 'I': + valid = qctl.qc_valid = QC_OSTIDX; + idx = qctl.qc_idx = atoi(optarg); + if (idx == 0 && *optarg != '0') { + fprintf(stderr, + "%s quota: invalid OST index '%s'\n", + progname, optarg); + return CMD_HELP; + } + break; + case 'v': + verbose = 1; + break; + case 'q': + quiet = 1; + break; + case 'h': + human_readable = true; + break; + default: + fprintf(stderr, "%s quota: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; } + } - if ((used + avail) > 0) - ratio = (double)used / (double)(used + avail); - - if (flags & MNTDF_COOKED) { - int i; - double cook_val; + /* current uid/gid info for "lfs quota /path/to/lustre/mount" */ + if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA && qctl.qc_type == ALLQUOTA && + optind == argc - 1 && !show_default) { - cook_val = (double)total; - i = COOK(cook_val); - if (i > 0) - snprintf(tbuf, sizeof(tbuf), HDF, cook_val, - suffix[i - 1]); - else - snprintf(tbuf, sizeof(tbuf), CDF, total); + qctl.qc_cmd = LUSTRE_Q_GETQUOTA; + qctl.qc_valid = valid; + qctl.qc_idx = idx; - cook_val = (double)used; - i = COOK(cook_val); - if (i > 0) - snprintf(ubuf, sizeof(ubuf), HDF, cook_val, - suffix[i - 1]); - else - snprintf(ubuf, sizeof(ubuf), CDF, used); + for (qtype = USRQUOTA; qtype <= GRPQUOTA; qtype++) { + qctl.qc_type = qtype; + if (qtype == USRQUOTA) { + qctl.qc_id = geteuid(); + rc = uid2name(&name, qctl.qc_id); + } else { + qctl.qc_id = getegid(); + rc = gid2name(&name, qctl.qc_id); + } + if (rc) + name = ""; + mnt = argv[optind]; + rc1 = get_print_quota(mnt, name, &qctl, verbose, quiet, + human_readable, show_default); + if (rc1 && !rc) + rc = rc1; + } + return rc; + /* lfs quota -u username /path/to/lustre/mount */ + } else if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA) { + /* options should be followed by u/g-name and mntpoint */ + if ((!show_default && optind + 2 != argc) || + (show_default && optind + 1 != argc) || + qctl.qc_type == ALLQUOTA) { + fprintf(stderr, + "%s quota: name and mount point must be specified\n", + progname); + return CMD_HELP; + } - cook_val = (double)avail; - i = COOK(cook_val); - if (i > 0) - snprintf(abuf, sizeof(abuf), HDF, cook_val, - suffix[i - 1]); - else - snprintf(abuf, sizeof(abuf), CDF, avail); + if (!show_default) { + name = argv[optind++]; + switch (qctl.qc_type) { + case USRQUOTA: + rc = name2uid(&qctl.qc_id, name); + break; + case GRPQUOTA: + rc = name2gid(&qctl.qc_id, name); + break; + case PRJQUOTA: + rc = name2projid(&qctl.qc_id, name); + break; + default: + rc = -ENOTSUP; + break; + } } else { - snprintf(tbuf, sizeof(tbuf), CDF, total); - snprintf(ubuf, sizeof(tbuf), CDF, used); - snprintf(abuf, sizeof(tbuf), CDF, avail); + qctl.qc_valid = QC_GENERAL; + qctl.qc_cmd = LUSTRE_Q_GETDEFAULT; + qctl.qc_id = 0; } - sprintf(rbuf, RDF, (int)(ratio * 100 + 0.5)); - printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s", - uuid, tbuf, ubuf, abuf, rbuf, mntdir); - if (type) - printf("[%s:%d]", type, index); - - if (stat->os_state) { - /* - * Each character represents the matching - * OS_STATE_* bit. - */ - const char state_names[] = "DRSI"; - __u32 state; - __u32 i; - - printf(" "); - for (i = 0, state = stat->os_state; - state && i < sizeof(state_names); i++) { - if (!(state & (1 << i))) - continue; - printf("%c", state_names[i]); - state ^= 1 << i; + if (rc) { + qctl.qc_id = strtoul(name, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, "%s quota: invalid id '%s'\n", + progname, name); + return CMD_HELP; } } - - printf("\n"); - break; - case -ENODATA: - printf(UUF": inactive device\n", uuid); - break; - default: - printf(UUF": %s\n", uuid, strerror(-rc)); - break; + } else if (optind + 1 != argc || qctl.qc_type == ALLQUOTA) { + fprintf(stderr, "%s quota: missing quota info argument(s)\n", + progname); + return CMD_HELP; } - return 0; + mnt = argv[optind]; + rc = get_print_quota(mnt, name, &qctl, verbose, quiet, + human_readable, show_default); + return rc; } +#endif /* HAVE_SYS_QUOTA_H! */ -struct ll_stat_type { - int st_op; - char *st_name; -}; - -static int mntdf(char *mntdir, char *fsname, char *pool, enum mntdf_flags flags) +static int flushctx_ioctl(char *mp) { - struct obd_statfs stat_buf, sum = { .os_bsize = 1 }; - struct obd_uuid uuid_buf; - char *poolname = NULL; - struct ll_stat_type types[] = { - { .st_op = LL_STATFS_LMV, .st_name = "MDT" }, - { .st_op = LL_STATFS_LOV, .st_name = "OST" }, - { .st_name = NULL } }; - struct ll_stat_type *tp; - __u64 ost_ffree = 0; - __u32 index; - __u32 type; - int fd; - int rc = 0; - int rc2; + int fd, rc; - if (pool) { - poolname = strchr(pool, '.'); - if (poolname != NULL) { - if (strncmp(fsname, pool, strlen(fsname))) { - fprintf(stderr, "filesystem name incorrect\n"); - return -ENODEV; - } - poolname++; - } else - poolname = pool; - } + fd = open(mp, O_RDONLY); + if (fd == -1) { + fprintf(stderr, "flushctx: error open %s: %s\n", + mp, strerror(errno)); + return -1; + } - fd = open(mntdir, O_RDONLY); - if (fd < 0) { - rc = -errno; - fprintf(stderr, "%s: cannot open '%s': %s\n", progname, mntdir, - strerror(errno)); - return rc; - } + rc = ioctl(fd, LL_IOC_FLUSHCTX); + if (rc == -1) + fprintf(stderr, "flushctx: error ioctl %s: %s\n", + mp, strerror(errno)); - if (flags & MNTDF_INODES) - printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", - "UUID", "Inodes", "IUsed", "IFree", - "IUse%", "Mounted on"); - else - printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", - "UUID", flags & MNTDF_COOKED ? "bytes" : "1K-blocks", - "Used", "Available", "Use%", "Mounted on"); + close(fd); + return rc; +} - for (tp = types; tp->st_name != NULL; tp++) { - for (index = 0; ; index++) { - memset(&stat_buf, 0, sizeof(struct obd_statfs)); - memset(&uuid_buf, 0, sizeof(struct obd_uuid)); - type = flags & MNTDF_LAZY ? - tp->st_op | LL_STATFS_NODELAY : tp->st_op; - rc2 = llapi_obd_fstatfs(fd, type, index, - &stat_buf, &uuid_buf); - if (rc2 == -ENODEV) - break; - if (rc2 == -EAGAIN) - continue; - if (rc2 == -ENODATA) { /* Inactive device, OK. */ - if (!(flags & MNTDF_VERBOSE)) - continue; - } else if (rc2 < 0 && rc == 0) { - rc = rc2; - } +static int lfs_flushctx(int argc, char **argv) +{ + int kdestroy = 0, c; + char mntdir[PATH_MAX] = {'\0'}; + int index = 0; + int rc = 0; - if (poolname && tp->st_op == LL_STATFS_LOV && - llapi_search_ost(fsname, poolname, - obd_uuid2str(&uuid_buf)) != 1) - continue; + while ((c = getopt(argc, argv, "k")) != -1) { + switch (c) { + case 'k': + kdestroy = 1; + break; + default: + fprintf(stderr, "error: %s: option '-%c' " + "unrecognized\n", argv[0], c); + return CMD_HELP; + } + } - /* the llapi_obd_statfs() call may have returned with - * an error, but if it filled in uuid_buf we will at - * lease use that to print out a message for that OBD. - * If we didn't get anything in the uuid_buf, then fill - * it in so that we can print an error message. */ - if (uuid_buf.uuid[0] == '\0') - snprintf(uuid_buf.uuid, sizeof(uuid_buf.uuid), - "%s%04x", tp->st_name, index); - showdf(mntdir, &stat_buf, obd_uuid2str(&uuid_buf), - flags, tp->st_name, index, rc2); + if (kdestroy) { + if ((rc = system("kdestroy > /dev/null")) != 0) { + rc = WEXITSTATUS(rc); + fprintf(stderr, "error destroying tickets: %d, continuing\n", rc); + } + } - if (rc2 == 0) { - if (tp->st_op == LL_STATFS_LMV) { - sum.os_ffree += stat_buf.os_ffree; - sum.os_files += stat_buf.os_files; - } else /* if (tp->st_op == LL_STATFS_LOV) */ { - sum.os_blocks += stat_buf.os_blocks * - stat_buf.os_bsize; - sum.os_bfree += stat_buf.os_bfree * - stat_buf.os_bsize; - sum.os_bavail += stat_buf.os_bavail * - stat_buf.os_bsize; - ost_ffree += stat_buf.os_ffree; - } - } - } - } + if (optind >= argc) { + /* flush for all mounted lustre fs. */ + while (!llapi_search_mounts(NULL, index++, mntdir, NULL)) { + /* Check if we have a mount point */ + if (mntdir[0] == '\0') + continue; - close(fd); + if (flushctx_ioctl(mntdir)) + rc = -1; - /* If we don't have as many objects free on the OST as inodes - * on the MDS, we reduce the total number of inodes to - * compensate, so that the "inodes in use" number is correct. - * Matches ll_statfs_internal() so the results are consistent. */ - if (ost_ffree < sum.os_ffree) { - sum.os_files = (sum.os_files - sum.os_ffree) + ost_ffree; - sum.os_ffree = ost_ffree; - } - printf("\n"); - showdf(mntdir, &sum, "filesystem_summary:", flags, NULL, 0, 0); - printf("\n"); + mntdir[0] = '\0'; /* avoid matching in next loop */ + } + } else { + /* flush fs as specified */ + while (optind < argc) { + if (flushctx_ioctl(argv[optind++])) + rc = -1; + } + } + return rc; +} - return rc; +static int lfs_cp(int argc, char **argv) +{ + fprintf(stderr, "remote client copy file(s).\n" + "obsolete, does not support it anymore.\n"); + return 0; } -static int lfs_df(int argc, char **argv) +static int lfs_ls(int argc, char **argv) { - char mntdir[PATH_MAX] = {'\0'}, path[PATH_MAX] = {'\0'}; - enum mntdf_flags flags = 0; - int c, rc = 0, index = 0; - char fsname[PATH_MAX] = "", *pool_name = NULL; + fprintf(stderr, "remote client lists directory contents.\n" + "obsolete, does not support it anymore.\n"); + return 0; +} + +static int lfs_changelog(int argc, char **argv) +{ + void *changelog_priv; + struct changelog_rec *rec; + long long startrec = 0, endrec = 0; + char *mdd; struct option long_opts[] = { - { .val = 'h', .name = "human-readable", - .has_arg = no_argument }, - { .val = 'i', .name = "inodes", .has_arg = no_argument }, - { .val = 'l', .name = "lazy", .has_arg = no_argument }, - { .val = 'p', .name = "pool", .has_arg = required_argument }, - { .val = 'v', .name = "verbose", .has_arg = no_argument }, - { .name = NULL} }; + { .val = 'f', .name = "follow", .has_arg = no_argument }, + { .name = NULL } }; + char short_opts[] = "f"; + int rc, follow = 0; - while ((c = getopt_long(argc, argv, "hilp:v", long_opts, NULL)) != -1) { - switch (c) { - case 'h': - flags |= MNTDF_COOKED; - break; - case 'i': - flags |= MNTDF_INODES; - break; - case 'l': - flags |= MNTDF_LAZY; - break; - case 'p': - pool_name = optarg; - break; - case 'v': - flags |= MNTDF_VERBOSE; - break; - default: - return CMD_HELP; - } + while ((rc = getopt_long(argc, argv, short_opts, + long_opts, NULL)) != -1) { + switch (rc) { + case 'f': + follow++; + break; + default: + fprintf(stderr, + "%s changelog: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; + } + } + if (optind >= argc) { + fprintf(stderr, "%s changelog: mdtname must be specified\n", + progname); + return CMD_HELP; } - if (optind < argc && !realpath(argv[optind], path)) { - rc = -errno; - fprintf(stderr, "error: invalid path '%s': %s\n", - argv[optind], strerror(-rc)); + + mdd = argv[optind++]; + if (argc > optind) + startrec = strtoll(argv[optind++], NULL, 10); + if (argc > optind) + endrec = strtoll(argv[optind++], NULL, 10); + + rc = llapi_changelog_start(&changelog_priv, + CHANGELOG_FLAG_BLOCK | + CHANGELOG_FLAG_JOBID | + CHANGELOG_FLAG_EXTRA_FLAGS | + (follow ? CHANGELOG_FLAG_FOLLOW : 0), + mdd, startrec); + if (rc < 0) { + fprintf(stderr, "%s changelog: cannot start changelog: %s\n", + progname, strerror(errno = -rc)); return rc; } - while (!llapi_search_mounts(path, index++, mntdir, fsname)) { - /* Check if we have a mount point */ - if (mntdir[0] == '\0') - continue; + rc = llapi_changelog_set_xflags(changelog_priv, + CHANGELOG_EXTRA_FLAG_UIDGID | + CHANGELOG_EXTRA_FLAG_NID | + CHANGELOG_EXTRA_FLAG_OMODE | + CHANGELOG_EXTRA_FLAG_XATTR); + if (rc < 0) { + fprintf(stderr, + "%s changelog: cannot set xflags for changelog: %s\n", + progname, strerror(errno = -rc)); + return rc; + } - rc = mntdf(mntdir, fsname, pool_name, flags); - if (rc || path[0] != '\0') + while ((rc = llapi_changelog_recv(changelog_priv, &rec)) == 0) { + time_t secs; + struct tm ts; + + if (endrec && rec->cr_index > endrec) { + llapi_changelog_free(&rec); break; - fsname[0] = '\0'; /* avoid matching in next loop */ - mntdir[0] = '\0'; /* avoid matching in next loop */ - } + } + if (rec->cr_index < startrec) { + llapi_changelog_free(&rec); + continue; + } - return rc; -} + secs = rec->cr_time >> 30; + gmtime_r(&secs, &ts); + printf("%ju %02d%-5s %02d:%02d:%02d.%09d %04d.%02d.%02d " + "0x%x t="DFID, (uintmax_t)rec->cr_index, rec->cr_type, + changelog_type2str(rec->cr_type), + ts.tm_hour, ts.tm_min, ts.tm_sec, + (int)(rec->cr_time & ((1 << 30) - 1)), + ts.tm_year + 1900, ts.tm_mon + 1, ts.tm_mday, + rec->cr_flags & CLF_FLAGMASK, PFID(&rec->cr_tfid)); -static int lfs_getname(int argc, char **argv) -{ - char mntdir[PATH_MAX] = "", path[PATH_MAX] = "", fsname[PATH_MAX] = ""; - int rc = 0, index = 0, c; - char buf[sizeof(struct obd_uuid)]; + if (rec->cr_flags & CLF_JOBID) { + struct changelog_ext_jobid *jid = + changelog_rec_jobid(rec); - while ((c = getopt(argc, argv, "h")) != -1) - return CMD_HELP; + if (jid->cr_jobid[0] != '\0') + printf(" j=%s", jid->cr_jobid); + } - if (optind == argc) { /* no paths specified, get all paths. */ - while (!llapi_search_mounts(path, index++, mntdir, fsname)) { - rc = llapi_getname(mntdir, buf, sizeof(buf)); - if (rc < 0) { - fprintf(stderr, - "cannot get name for `%s': %s\n", - mntdir, strerror(-rc)); - break; - } + if (rec->cr_flags & CLF_EXTRA_FLAGS) { + struct changelog_ext_extra_flags *ef = + changelog_rec_extra_flags(rec); - printf("%s %s\n", buf, mntdir); + printf(" ef=0x%llx", ef->cr_extra_flags); - path[0] = fsname[0] = mntdir[0] = 0; - } - } else { /* paths specified, only attempt to search these. */ - for (; optind < argc; optind++) { - rc = llapi_getname(argv[optind], buf, sizeof(buf)); - if (rc < 0) { - fprintf(stderr, - "cannot get name for `%s': %s\n", - argv[optind], strerror(-rc)); - break; - } + if (ef->cr_extra_flags & CLFE_UIDGID) { + struct changelog_ext_uidgid *uidgid = + changelog_rec_uidgid(rec); - printf("%s %s\n", buf, argv[optind]); - } - } - return rc; -} + printf(" u=%llu:%llu", + uidgid->cr_uid, uidgid->cr_gid); + } + if (ef->cr_extra_flags & CLFE_NID) { + struct changelog_ext_nid *nid = + changelog_rec_nid(rec); -static int lfs_check(int argc, char **argv) -{ - int rc; - char mntdir[PATH_MAX] = {'\0'}; - int num_types = 1; - char *obd_types[2]; - char obd_type1[4]; - char obd_type2[4]; + printf(" nid=%s", + libcfs_nid2str(nid->cr_nid)); + } - if (argc != 2) - return CMD_HELP; + if (ef->cr_extra_flags & CLFE_OPEN) { + struct changelog_ext_openmode *omd = + changelog_rec_openmode(rec); + char mode[] = "---"; - obd_types[0] = obd_type1; - obd_types[1] = obd_type2; + /* exec mode must be exclusive */ + if (omd->cr_openflags & MDS_FMODE_EXEC) { + mode[2] = 'x'; + } else { + if (omd->cr_openflags & MDS_FMODE_READ) + mode[0] = 'r'; + if (omd->cr_openflags & + (MDS_FMODE_WRITE | + MDS_OPEN_TRUNC | + MDS_OPEN_APPEND)) + mode[1] = 'w'; + } - if (strcmp(argv[1], "osts") == 0) { - strcpy(obd_types[0], "osc"); - } else if (strcmp(argv[1], "mds") == 0) { - strcpy(obd_types[0], "mdc"); - } else if (strcmp(argv[1], "servers") == 0) { - num_types = 2; - strcpy(obd_types[0], "osc"); - strcpy(obd_types[1], "mdc"); - } else { - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[1]); - return CMD_HELP; - } + if (strcmp(mode, "---") != 0) + printf(" m=%s", mode); - rc = llapi_search_mounts(NULL, 0, mntdir, NULL); - if (rc < 0 || mntdir[0] == '\0') { - fprintf(stderr, "No suitable Lustre mount found\n"); - return rc; - } + } - rc = llapi_target_check(num_types, obd_types, mntdir); - if (rc) - fprintf(stderr, "error: %s: %s status failed\n", - argv[0],argv[1]); + if (ef->cr_extra_flags & CLFE_XATTR) { + struct changelog_ext_xattr *xattr = + changelog_rec_xattr(rec); - return rc; + if (xattr->cr_xattr[0] != '\0') + printf(" x=%s", xattr->cr_xattr); + } + } -} + if (rec->cr_namelen) + printf(" p="DFID" %.*s", PFID(&rec->cr_pfid), + rec->cr_namelen, changelog_rec_name(rec)); -#ifdef HAVE_SYS_QUOTA_H -#define ARG2INT(nr, str, msg) \ -do { \ - char *endp; \ - nr = strtol(str, &endp, 0); \ - if (*endp) { \ - fprintf(stderr, "error: bad %s: %s\n", msg, str); \ - return CMD_HELP; \ - } \ -} while (0) + if (rec->cr_flags & CLF_RENAME) { + struct changelog_ext_rename *rnm = + changelog_rec_rename(rec); -#define ADD_OVERFLOW(a,b) ((a + b) < a) ? (a = ULONG_MAX) : (a = a + b) + if (!fid_is_zero(&rnm->cr_sfid)) + printf(" s="DFID" sp="DFID" %.*s", + PFID(&rnm->cr_sfid), + PFID(&rnm->cr_spfid), + (int)changelog_rec_snamelen(rec), + changelog_rec_sname(rec)); + } + printf("\n"); -/* Convert format time string "XXwXXdXXhXXmXXs" into seconds value - * returns the value or ULONG_MAX on integer overflow or incorrect format - * Notes: - * 1. the order of specifiers is arbitrary (may be: 5w3s or 3s5w) - * 2. specifiers may be encountered multiple times (2s3s is 5 seconds) - * 3. empty integer value is interpreted as 0 - */ -static unsigned long str2sec(const char* timestr) + llapi_changelog_free(&rec); + } + + llapi_changelog_fini(&changelog_priv); + + if (rc < 0) + fprintf(stderr, "%s changelog: cannot access changelog: %s\n", + progname, strerror(errno = -rc)); + + return (rc == 1 ? 0 : rc); +} + +static int lfs_changelog_clear(int argc, char **argv) { - const char spec[] = "smhdw"; - const unsigned long mult[] = {1, 60, 60*60, 24*60*60, 7*24*60*60}; - unsigned long val = 0; - char *tail; + long long endrec; + int rc; - if (strpbrk(timestr, spec) == NULL) { - /* no specifiers inside the time string, - should treat it as an integer value */ - val = strtoul(timestr, &tail, 10); - return *tail ? ULONG_MAX : val; - } + if (argc != 4) + return CMD_HELP; - /* format string is XXwXXdXXhXXmXXs */ - while (*timestr) { - unsigned long v; - int ind; - char* ptr; + endrec = strtoll(argv[3], NULL, 10); - v = strtoul(timestr, &tail, 10); - if (v == ULONG_MAX || *tail == '\0') - /* value too large (ULONG_MAX or more) - or missing specifier */ - goto error; + rc = llapi_changelog_clear(argv[1], argv[2], endrec); - ptr = strchr(spec, *tail); - if (ptr == NULL) - /* unknown specifier */ - goto error; + if (rc == -EINVAL) + fprintf(stderr, "%s: record out of range: %llu\n", + argv[0], endrec); + else if (rc == -ENOENT) + fprintf(stderr, "%s: no changelog user: %s\n", + argv[0], argv[2]); + else if (rc) + fprintf(stderr, "%s error: %s\n", argv[0], + strerror(-rc)); - ind = ptr - spec; + if (rc) + errno = -rc; - /* check if product will overflow the type */ - if (!(v < ULONG_MAX / mult[ind])) - goto error; + return rc; +} - ADD_OVERFLOW(val, mult[ind] * v); - if (val == ULONG_MAX) - goto error; +static int lfs_fid2path(int argc, char **argv) +{ + struct option long_opts[] = { + { .val = 'c', .name = "cur", .has_arg = no_argument }, + { .val = 'l', .name = "link", .has_arg = required_argument }, + { .val = 'r', .name = "rec", .has_arg = required_argument }, + { .name = NULL } }; + char short_opts[] = "cl:r:"; + char *device, *fid, *path; + long long recno = -1; + int linkno = -1; + int lnktmp; + int printcur = 0; + int rc = 0; + char *endptr = NULL; - timestr = tail + 1; - } + while ((rc = getopt_long(argc, argv, short_opts, + long_opts, NULL)) != -1) { + switch (rc) { + case 'c': + printcur++; + break; + case 'l': + linkno = strtol(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, + "%s fid2path: invalid linkno '%s'\n", + progname, optarg); + return CMD_HELP; + } + break; + case 'r': + recno = strtoll(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, + "%s fid2path: invalid recno '%s'\n", + progname, optarg); + return CMD_HELP; + } + break; + default: + fprintf(stderr, + "%s fid2path: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; + } + } - return val; + if (argc < 3) { + fprintf(stderr, + "%s fid2path: and ... must be specified\n", + progname); + return CMD_HELP; + } -error: - return ULONG_MAX; -} + device = argv[optind++]; + path = calloc(1, PATH_MAX); + if (path == NULL) { + rc = -errno; + fprintf(stderr, + "%s fid2path: cannot allocate memory for path: %s\n", + progname, strerror(-rc)); + return rc; + } -#define ARG2ULL(nr, str, def_units) \ -do { \ - unsigned long long limit, units = def_units; \ - int rc; \ - \ - rc = llapi_parse_size(str, &limit, &units, 1); \ - if (rc < 0) { \ - fprintf(stderr, "error: bad limit value %s\n", str); \ - return CMD_HELP; \ - } \ - nr = limit; \ -} while (0) + rc = 0; + while (optind < argc) { + fid = argv[optind++]; -static inline int has_times_option(int argc, char **argv) -{ - int i; + lnktmp = (linkno >= 0) ? linkno : 0; + while (1) { + int oldtmp = lnktmp; + long long rectmp = recno; + int rc2; + rc2 = llapi_fid2path(device, fid, path, PATH_MAX, + &rectmp, &lnktmp); + if (rc2 < 0) { + fprintf(stderr, + "%s fid2path: cannot find '%s': %s\n", + progname, fid, strerror(errno = -rc2)); + if (rc == 0) + rc = rc2; + break; + } - for (i = 1; i < argc; i++) - if (!strcmp(argv[i], "-t")) - return 1; + if (printcur) + fprintf(stdout, "%lld ", rectmp); + if (device[0] == '/') { + fprintf(stdout, "%s", device); + if (device[strlen(device) - 1] != '/') + fprintf(stdout, "/"); + } else if (path[0] == '\0') { + fprintf(stdout, "/"); + } + fprintf(stdout, "%s\n", path); - return 0; + if (linkno >= 0) + /* specified linkno */ + break; + if (oldtmp == lnktmp) + /* no more links */ + break; + } + } + + free(path); + return rc; } -int lfs_setquota_times(int argc, char **argv) +static int lfs_path2fid(int argc, char **argv) { - int c, rc; - struct if_quotactl qctl; - char *mnt, *obd_type = (char *)qctl.obd_type; - struct obd_dqblk *dqb = &qctl.qc_dqblk; - struct obd_dqinfo *dqi = &qctl.qc_dqinfo; - struct option long_opts[] = { - { .val = 'b', .name = "block-grace", .has_arg = required_argument }, - { .val = 'g', .name = "group", .has_arg = no_argument }, - { .val = 'i', .name = "inode-grace", .has_arg = required_argument }, - { .val = 'p', .name = "projid", .has_arg = no_argument }, - { .val = 't', .name = "times", .has_arg = no_argument }, - { .val = 'u', .name = "user", .has_arg = no_argument }, - { .name = NULL } }; - int qtype; - - memset(&qctl, 0, sizeof(qctl)); - qctl.qc_cmd = LUSTRE_Q_SETINFO; - qctl.qc_type = ALLQUOTA; + struct option long_opts[] = { + { .val = 'p', .name = "parents", .has_arg = no_argument }, + { .name = NULL } }; + char **path; + const char short_opts[] = "p"; + const char *sep = ""; + struct lu_fid fid; + int rc = 0; + bool show_parents = false; - while ((c = getopt_long(argc, argv, "b:gi:ptu", - long_opts, NULL)) != -1) { - switch (c) { - case 'u': - qtype = USRQUOTA; - goto quota_type; - case 'g': - qtype = GRPQUOTA; - goto quota_type; + while ((rc = getopt_long(argc, argv, short_opts, + long_opts, NULL)) != -1) { + switch (rc) { case 'p': - qtype = PRJQUOTA; -quota_type: - if (qctl.qc_type != ALLQUOTA) { - fprintf(stderr, "error: -u/g/p can't be used " - "more than once\n"); - return CMD_HELP; - } - qctl.qc_type = qtype; + show_parents = true; break; - case 'b': - if ((dqi->dqi_bgrace = str2sec(optarg)) == ULONG_MAX) { - fprintf(stderr, "error: bad block-grace: %s\n", - optarg); - return CMD_HELP; - } - dqb->dqb_valid |= QIF_BTIME; - break; - case 'i': - if ((dqi->dqi_igrace = str2sec(optarg)) == ULONG_MAX) { - fprintf(stderr, "error: bad inode-grace: %s\n", - optarg); - return CMD_HELP; - } - dqb->dqb_valid |= QIF_ITIME; - break; - case 't': /* Yes, of course! */ - break; - default: /* getopt prints error message for us when opterr != 0 */ - return CMD_HELP; - } - } + default: + fprintf(stderr, + "%s path2fid: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; + } + } - if (qctl.qc_type == ALLQUOTA) { - fprintf(stderr, "error: neither -u, -g nor -p specified\n"); - return CMD_HELP; - } + if (optind > argc - 1) { + fprintf(stderr, "%s path2fid: FILE... must be specified\n", + progname); + return CMD_HELP; + } + else if (optind < argc - 1) + sep = ": "; - if (optind != argc - 1) { - fprintf(stderr, "error: unexpected parameters encountered\n"); - return CMD_HELP; - } + rc = 0; + for (path = argv + optind; *path != NULL; path++) { + int err = 0; + if (!show_parents) { + err = llapi_path2fid(*path, &fid); + if (!err) + printf("%s%s"DFID"\n", + *sep != '\0' ? *path : "", sep, + PFID(&fid)); + } else { + char name[NAME_MAX + 1]; + unsigned int linkno = 0; - mnt = argv[optind]; - rc = llapi_quotactl(mnt, &qctl); - if (rc) { - if (*obd_type) - fprintf(stderr, "%s %s ", obd_type, - obd_uuid2str(&qctl.obd_uuid)); - fprintf(stderr, "setquota failed: %s\n", strerror(-rc)); - return rc; - } + while ((err = llapi_path2parent(*path, linkno, &fid, + name, sizeof(name))) == 0) { + if (*sep != '\0' && linkno == 0) + printf("%s%s", *path, sep); + + printf("%s"DFID"/%s", linkno != 0 ? "\t" : "", + PFID(&fid), name); + linkno++; + } + + /* err == -ENODATA is end-of-loop */ + if (linkno > 0 && err == -ENODATA) { + printf("\n"); + err = 0; + } + } - return 0; -} + if (err) { + fprintf(stderr, + "%s path2fid: cannot get %sfid for '%s': %s\n", + progname, show_parents ? "parent " : "", *path, + strerror(-err)); + if (rc == 0) { + rc = err; + errno = -err; + } + } + } -#define BSLIMIT (1 << 0) -#define BHLIMIT (1 << 1) -#define ISLIMIT (1 << 2) -#define IHLIMIT (1 << 3) + return rc; +} -int lfs_setquota(int argc, char **argv) +static int lfs_data_version(int argc, char **argv) { - int c, rc; - struct if_quotactl qctl; - char *mnt, *obd_type = (char *)qctl.obd_type; - struct obd_dqblk *dqb = &qctl.qc_dqblk; - struct option long_opts[] = { - { .val = 'b', .name = "block-softlimit", - .has_arg = required_argument }, - { .val = 'B', .name = "block-hardlimit", - .has_arg = required_argument }, - { .val = 'g', .name = "group", .has_arg = required_argument }, - { .val = 'i', .name = "inode-softlimit", - .has_arg = required_argument }, - { .val = 'I', .name = "inode-hardlimit", - .has_arg = required_argument }, - { .val = 'p', .name = "projid", .has_arg = required_argument }, - { .val = 'u', .name = "user", .has_arg = required_argument }, - { .name = NULL } }; - unsigned limit_mask = 0; - char *endptr; - int qtype; - - if (has_times_option(argc, argv)) - return lfs_setquota_times(argc, argv); + char *path; + __u64 data_version; + int fd; + int rc; + int c; + int data_version_flags = LL_DV_RD_FLUSH; /* Read by default */ - memset(&qctl, 0, sizeof(qctl)); - qctl.qc_cmd = LUSTRE_Q_SETQUOTA; - qctl.qc_type = ALLQUOTA; /* ALLQUOTA makes no sense for setquota, - * so it can be used as a marker that qc_type - * isn't reinitialized from command line */ + if (argc < 2) { + fprintf(stderr, "%s data_version: FILE must be specified\n", + progname); + return CMD_HELP; + } - while ((c = getopt_long(argc, argv, "b:B:g:i:I:p:u:", - long_opts, NULL)) != -1) { + while ((c = getopt(argc, argv, "nrw")) != -1) { switch (c) { - case 'u': - qtype = USRQUOTA; - rc = name2uid(&qctl.qc_id, optarg); - goto quota_type; - case 'g': - qtype = GRPQUOTA; - rc = name2gid(&qctl.qc_id, optarg); - goto quota_type; - case 'p': - qtype = PRJQUOTA; - rc = name2projid(&qctl.qc_id, optarg); -quota_type: - if (qctl.qc_type != ALLQUOTA) { - fprintf(stderr, "error: -u and -g can't be used" - " more than once\n"); - return CMD_HELP; - } - qctl.qc_type = qtype; - if (rc) { - qctl.qc_id = strtoul(optarg, &endptr, 10); - if (*endptr != '\0') { - fprintf(stderr, "error: can't find id " - "for name %s\n", optarg); - return CMD_HELP; - } - } + case 'n': + data_version_flags = 0; break; - case 'b': - ARG2ULL(dqb->dqb_bsoftlimit, optarg, 1024); - dqb->dqb_bsoftlimit >>= 10; - limit_mask |= BSLIMIT; - if (dqb->dqb_bsoftlimit && - dqb->dqb_bsoftlimit <= 1024) /* <= 1M? */ - fprintf(stderr, "warning: block softlimit is " - "smaller than the miminal qunit size, " - "please see the help of setquota or " - "Lustre manual for details.\n"); - break; - case 'B': - ARG2ULL(dqb->dqb_bhardlimit, optarg, 1024); - dqb->dqb_bhardlimit >>= 10; - limit_mask |= BHLIMIT; - if (dqb->dqb_bhardlimit && - dqb->dqb_bhardlimit <= 1024) /* <= 1M? */ - fprintf(stderr, "warning: block hardlimit is " - "smaller than the miminal qunit size, " - "please see the help of setquota or " - "Lustre manual for details.\n"); - break; - case 'i': - ARG2ULL(dqb->dqb_isoftlimit, optarg, 1); - limit_mask |= ISLIMIT; - if (dqb->dqb_isoftlimit && - dqb->dqb_isoftlimit <= 1024) /* <= 1K inodes? */ - fprintf(stderr, "warning: inode softlimit is " - "smaller than the miminal qunit size, " - "please see the help of setquota or " - "Lustre manual for details.\n"); - break; - case 'I': - ARG2ULL(dqb->dqb_ihardlimit, optarg, 1); - limit_mask |= IHLIMIT; - if (dqb->dqb_ihardlimit && - dqb->dqb_ihardlimit <= 1024) /* <= 1K inodes? */ - fprintf(stderr, "warning: inode hardlimit is " - "smaller than the miminal qunit size, " - "please see the help of setquota or " - "Lustre manual for details.\n"); - break; - default: /* getopt prints error message for us when opterr != 0 */ + case 'r': + data_version_flags |= LL_DV_RD_FLUSH; + break; + case 'w': + data_version_flags |= LL_DV_WR_FLUSH; + break; + default: + fprintf(stderr, + "%s data_version: unrecognized option '%s'\n", + progname, argv[optind - 1]); return CMD_HELP; } } - - if (qctl.qc_type == ALLQUOTA) { - fprintf(stderr, "error: neither -u, -g nor -p was specified\n"); + if (optind == argc) { + fprintf(stderr, "%s data_version: FILE must be specified\n", + progname); return CMD_HELP; } - if (limit_mask == 0) { - fprintf(stderr, "error: at least one limit must be specified\n"); - return CMD_HELP; - } - - if (optind != argc - 1) { - fprintf(stderr, "error: unexpected parameters encountered\n"); - return CMD_HELP; - } - - mnt = argv[optind]; + path = argv[optind]; + fd = open(path, O_RDONLY); + if (fd < 0) { + rc = -errno; + fprintf(stderr, "%s data_version: cannot open file '%s': %s\n", + progname, path, strerror(-rc)); + return rc; + } - if ((!(limit_mask & BHLIMIT) ^ !(limit_mask & BSLIMIT)) || - (!(limit_mask & IHLIMIT) ^ !(limit_mask & ISLIMIT))) { - /* sigh, we can't just set blimits/ilimits */ - struct if_quotactl tmp_qctl = {.qc_cmd = LUSTRE_Q_GETQUOTA, - .qc_type = qctl.qc_type, - .qc_id = qctl.qc_id}; - - rc = llapi_quotactl(mnt, &tmp_qctl); - if (rc < 0) { - fprintf(stderr, "error: setquota failed while retrieving" - " current quota settings (%s)\n", - strerror(-rc)); - return rc; - } + rc = llapi_get_data_version(fd, &data_version, data_version_flags); + if (rc < 0) + fprintf(stderr, + "%s data_version: cannot get version for '%s': %s\n", + progname, path, strerror(-rc)); + else + printf("%ju" "\n", (uintmax_t)data_version); - if (!(limit_mask & BHLIMIT)) - dqb->dqb_bhardlimit = tmp_qctl.qc_dqblk.dqb_bhardlimit; - if (!(limit_mask & BSLIMIT)) - dqb->dqb_bsoftlimit = tmp_qctl.qc_dqblk.dqb_bsoftlimit; - if (!(limit_mask & IHLIMIT)) - dqb->dqb_ihardlimit = tmp_qctl.qc_dqblk.dqb_ihardlimit; - if (!(limit_mask & ISLIMIT)) - dqb->dqb_isoftlimit = tmp_qctl.qc_dqblk.dqb_isoftlimit; - - /* Keep grace times if we have got no softlimit arguments */ - if ((limit_mask & BHLIMIT) && !(limit_mask & BSLIMIT)) { - dqb->dqb_valid |= QIF_BTIME; - dqb->dqb_btime = tmp_qctl.qc_dqblk.dqb_btime; - } + close(fd); + return rc; +} - if ((limit_mask & IHLIMIT) && !(limit_mask & ISLIMIT)) { - dqb->dqb_valid |= QIF_ITIME; - dqb->dqb_itime = tmp_qctl.qc_dqblk.dqb_itime; - } - } +static int lfs_hsm_state(int argc, char **argv) +{ + int rc; + int i = 1; + char *path; + struct hsm_user_state hus; - dqb->dqb_valid |= (limit_mask & (BHLIMIT | BSLIMIT)) ? QIF_BLIMITS : 0; - dqb->dqb_valid |= (limit_mask & (IHLIMIT | ISLIMIT)) ? QIF_ILIMITS : 0; + if (argc < 2) + return CMD_HELP; - rc = llapi_quotactl(mnt, &qctl); - if (rc) { - if (*obd_type) - fprintf(stderr, "%s %s ", obd_type, - obd_uuid2str(&qctl.obd_uuid)); - fprintf(stderr, "setquota failed: %s\n", strerror(-rc)); - return rc; - } + do { + path = argv[i]; - return 0; -} + rc = llapi_hsm_state_get(path, &hus); + if (rc) { + fprintf(stderr, "can't get hsm state for %s: %s\n", + path, strerror(errno = -rc)); + return rc; + } -/* Converts seconds value into format string - * result is returned in buf - * Notes: - * 1. result is in descenting order: 1w2d3h4m5s - * 2. zero fields are not filled (except for p. 3): 5d1s - * 3. zero seconds value is presented as "0s" - */ -static char * __sec2str(time_t seconds, char *buf) -{ - const char spec[] = "smhdw"; - const unsigned long mult[] = {1, 60, 60*60, 24*60*60, 7*24*60*60}; - unsigned long c; - char *tail = buf; - int i; + /* Display path name and status flags */ + printf("%s: (0x%08x)", path, hus.hus_states); - for (i = sizeof(mult) / sizeof(mult[0]) - 1 ; i >= 0; i--) { - c = seconds / mult[i]; + if (hus.hus_states & HS_RELEASED) + printf(" released"); + if (hus.hus_states & HS_EXISTS) + printf(" exists"); + if (hus.hus_states & HS_DIRTY) + printf(" dirty"); + if (hus.hus_states & HS_ARCHIVED) + printf(" archived"); + /* Display user-settable flags */ + if (hus.hus_states & HS_NORELEASE) + printf(" never_release"); + if (hus.hus_states & HS_NOARCHIVE) + printf(" never_archive"); + if (hus.hus_states & HS_LOST) + printf(" lost_from_hsm"); - if (c > 0 || (i == 0 && buf == tail)) - tail += snprintf(tail, 40-(tail-buf), "%lu%c", c, spec[i]); + if (hus.hus_archive_id != 0) + printf(", archive_id:%d", hus.hus_archive_id); + printf("\n"); - seconds %= mult[i]; - } + } while (++i < argc); - return tail; + return 0; } -static void sec2str(time_t seconds, char *buf, int rc) -{ - char *tail = buf; +#define LFS_HSM_SET 0 +#define LFS_HSM_CLEAR 1 - if (rc) - *tail++ = '['; +/** + * Generic function to set or clear HSM flags. + * Used by hsm_set and hsm_clear. + * + * @mode if LFS_HSM_SET, set the flags, if LFS_HSM_CLEAR, clear the flags. + */ +static int lfs_hsm_change_flags(int argc, char **argv, int mode) +{ + struct option long_opts[] = { + { .val = 'A', .name = "archived", .has_arg = no_argument }, + { .val = 'a', .name = "noarchive", .has_arg = no_argument }, + { .val = 'd', .name = "dirty", .has_arg = no_argument }, + { .val = 'e', .name = "exists", .has_arg = no_argument }, + { .val = 'l', .name = "lost", .has_arg = no_argument }, + { .val = 'r', .name = "norelease", .has_arg = no_argument }, + { .val = 'i', .name = "archive-id", .has_arg = required_argument }, + { .name = NULL } }; + char short_opts[] = "lraAdei:"; + __u64 mask = 0; + int c, rc; + char *path; + __u32 archive_id = 0; + char *end = NULL; - tail = __sec2str(seconds, tail); + if (argc < 3) + return CMD_HELP; - if (rc && tail - buf < 39) { - *tail++ = ']'; - *tail++ = 0; - } -} + while ((c = getopt_long(argc, argv, short_opts, + long_opts, NULL)) != -1) { + switch (c) { + case 'l': + mask |= HS_LOST; + break; + case 'a': + mask |= HS_NOARCHIVE; + break; + case 'A': + mask |= HS_ARCHIVED; + break; + case 'r': + mask |= HS_NORELEASE; + break; + case 'd': + mask |= HS_DIRTY; + break; + case 'e': + mask |= HS_EXISTS; + break; + case 'i': + archive_id = strtol(optarg, &end, 10); + if (*end != '\0') { + fprintf(stderr, "invalid archive_id: '%s'\n", + end); + return CMD_HELP; + } + break; + case '?': + return CMD_HELP; + default: + fprintf(stderr, "error: %s: option '%s' unrecognized\n", + argv[0], argv[optind - 1]); + return CMD_HELP; + } + } -static void diff2str(time_t seconds, char *buf, time_t now) -{ + /* User should have specified a flag */ + if (mask == 0) + return CMD_HELP; - buf[0] = 0; - if (!seconds) - return; - if (seconds <= now) { - strcpy(buf, "none"); - return; - } - __sec2str(seconds - now, buf); -} + while (optind < argc) { -static void print_quota_title(char *name, struct if_quotactl *qctl, - bool human_readable) -{ - printf("Disk quotas for %s %s (%cid %u):\n", - qtype_name(qctl->qc_type), name, - *qtype_name(qctl->qc_type), qctl->qc_id); - printf("%15s%8s %7s%8s%8s%8s %7s%8s%8s\n", - "Filesystem", human_readable ? "used" : "kbytes", - "quota", "limit", "grace", - "files", "quota", "limit", "grace"); -} + path = argv[optind]; -static void kbytes2str(__u64 num, char *buf, int buflen, bool h) -{ - if (!h) { - snprintf(buf, buflen, "%ju", (uintmax_t)num); - } else { - if (num >> 40) - snprintf(buf, buflen, "%5.4gP", - (double)num / ((__u64)1 << 40)); - else if (num >> 30) - snprintf(buf, buflen, "%5.4gT", - (double)num / (1 << 30)); - else if (num >> 20) - snprintf(buf, buflen, "%5.4gG", - (double)num / (1 << 20)); - else if (num >> 10) - snprintf(buf, buflen, "%5.4gM", - (double)num / (1 << 10)); + /* If mode == 0, this means we apply the mask. */ + if (mode == LFS_HSM_SET) + rc = llapi_hsm_state_set(path, mask, 0, archive_id); else - snprintf(buf, buflen, "%ju%s", (uintmax_t)num, "k"); + rc = llapi_hsm_state_set(path, 0, mask, 0); + + if (rc != 0) { + fprintf(stderr, "Can't change hsm flags for %s: %s\n", + path, strerror(errno = -rc)); + return rc; + } + optind++; } + + return 0; } -#define STRBUF_LEN 32 -static void print_quota(char *mnt, struct if_quotactl *qctl, int type, - int rc, bool h) +static int lfs_hsm_action(int argc, char **argv) { - time_t now; - - time(&now); - - if (qctl->qc_cmd == LUSTRE_Q_GETQUOTA || qctl->qc_cmd == Q_GETOQUOTA) { - int bover = 0, iover = 0; - struct obd_dqblk *dqb = &qctl->qc_dqblk; - char numbuf[3][STRBUF_LEN]; - char timebuf[40]; - char strbuf[STRBUF_LEN]; + int rc; + int i = 1; + char *path; + struct hsm_current_action hca; + struct hsm_extent he; + enum hsm_user_action hua; + enum hsm_progress_states hps; - if (dqb->dqb_bhardlimit && - lustre_stoqb(dqb->dqb_curspace) >= dqb->dqb_bhardlimit) { - bover = 1; - } else if (dqb->dqb_bsoftlimit && dqb->dqb_btime) { - if (dqb->dqb_btime > now) { - bover = 2; - } else { - bover = 3; - } - } + if (argc < 2) + return CMD_HELP; - if (dqb->dqb_ihardlimit && - dqb->dqb_curinodes >= dqb->dqb_ihardlimit) { - iover = 1; - } else if (dqb->dqb_isoftlimit && dqb->dqb_itime) { - if (dqb->dqb_itime > now) { - iover = 2; - } else { - iover = 3; - } - } + do { + path = argv[i]; + rc = llapi_hsm_current_action(path, &hca); + if (rc) { + fprintf(stderr, "can't get hsm action for %s: %s\n", + path, strerror(errno = -rc)); + return rc; + } + he = hca.hca_location; + hua = hca.hca_action; + hps = hca.hca_state; - if (strlen(mnt) > 15) - printf("%s\n%15s", mnt, ""); - else - printf("%15s", mnt); + printf("%s: %s", path, hsm_user_action2name(hua)); - if (bover) - diff2str(dqb->dqb_btime, timebuf, now); + /* Skip file without action */ + if (hca.hca_action == HUA_NONE) { + printf("\n"); + continue; + } - kbytes2str(lustre_stoqb(dqb->dqb_curspace), - strbuf, sizeof(strbuf), h); - if (rc == -EREMOTEIO) - sprintf(numbuf[0], "%s*", strbuf); - else - sprintf(numbuf[0], (dqb->dqb_valid & QIF_SPACE) ? - "%s" : "[%s]", strbuf); + printf(" %s ", hsm_progress_state2name(hps)); - kbytes2str(dqb->dqb_bsoftlimit, strbuf, sizeof(strbuf), h); - if (type == QC_GENERAL) - sprintf(numbuf[1], (dqb->dqb_valid & QIF_BLIMITS) ? - "%s" : "[%s]", strbuf); + if ((hps == HPS_RUNNING) && + (hua == HUA_ARCHIVE || hua == HUA_RESTORE)) + printf("(%llu bytes moved)\n", + (unsigned long long)he.length); + else if ((he.offset + he.length) == LUSTRE_EOF) + printf("(from %llu to EOF)\n", + (unsigned long long)he.offset); else - sprintf(numbuf[1], "%s", "-"); - - kbytes2str(dqb->dqb_bhardlimit, strbuf, sizeof(strbuf), h); - sprintf(numbuf[2], (dqb->dqb_valid & QIF_BLIMITS) ? - "%s" : "[%s]", strbuf); - - printf(" %7s%c %6s %7s %7s", - numbuf[0], bover ? '*' : ' ', numbuf[1], - numbuf[2], bover > 1 ? timebuf : "-"); + printf("(from %llu to %llu)\n", + (unsigned long long)he.offset, + (unsigned long long)(he.offset + he.length)); - if (iover) - diff2str(dqb->dqb_itime, timebuf, now); + } while (++i < argc); - sprintf(numbuf[0], (dqb->dqb_valid & QIF_INODES) ? - "%ju" : "[%ju]", (uintmax_t)dqb->dqb_curinodes); + return 0; +} - if (type == QC_GENERAL) - sprintf(numbuf[1], (dqb->dqb_valid & QIF_ILIMITS) ? - "%ju" : "[%ju]", - (uintmax_t)dqb->dqb_isoftlimit); - else - sprintf(numbuf[1], "%s", "-"); +static int lfs_hsm_set(int argc, char **argv) +{ + return lfs_hsm_change_flags(argc, argv, LFS_HSM_SET); +} - sprintf(numbuf[2], (dqb->dqb_valid & QIF_ILIMITS) ? - "%ju" : "[%ju]", (uintmax_t)dqb->dqb_ihardlimit); +static int lfs_hsm_clear(int argc, char **argv) +{ + return lfs_hsm_change_flags(argc, argv, LFS_HSM_CLEAR); +} - if (type != QC_OSTIDX) - printf(" %7s%c %6s %7s %7s", - numbuf[0], iover ? '*' : ' ', numbuf[1], - numbuf[2], iover > 1 ? timebuf : "-"); - else - printf(" %7s %7s %7s %7s", "-", "-", "-", "-"); - printf("\n"); +/** + * Check file state and return its fid, to be used by lfs_hsm_request(). + * + * \param[in] file Path to file to check + * \param[in,out] fid Pointer to allocated lu_fid struct. + * \param[in,out] last_dev Pointer to last device id used. + * + * \return 0 on success. + */ +static int lfs_hsm_prepare_file(const char *file, struct lu_fid *fid, + dev_t *last_dev) +{ + struct stat st; + int rc; - } else if (qctl->qc_cmd == LUSTRE_Q_GETINFO || - qctl->qc_cmd == Q_GETOINFO) { - char bgtimebuf[40]; - char igtimebuf[40]; + rc = lstat(file, &st); + if (rc) { + fprintf(stderr, "Cannot stat %s: %s\n", file, strerror(errno)); + return -errno; + } + /* Checking for regular file as archiving as posix copytool + * rejects archiving files other than regular files + */ + if (!S_ISREG(st.st_mode)) { + fprintf(stderr, "error: \"%s\" is not a regular file\n", file); + return CMD_HELP; + } + /* A request should be ... */ + if (*last_dev != st.st_dev && *last_dev != 0) { + fprintf(stderr, "All files should be " + "on the same filesystem: %s\n", file); + return -EINVAL; + } + *last_dev = st.st_dev; - sec2str(qctl->qc_dqinfo.dqi_bgrace, bgtimebuf, rc); - sec2str(qctl->qc_dqinfo.dqi_igrace, igtimebuf, rc); - printf("Block grace time: %s; Inode grace time: %s\n", - bgtimebuf, igtimebuf); - } + rc = llapi_path2fid(file, fid); + if (rc) { + fprintf(stderr, "Cannot read FID of %s: %s\n", + file, strerror(-rc)); + return rc; + } + return 0; } -static int print_obd_quota(char *mnt, struct if_quotactl *qctl, int is_mdt, - bool h, __u64 *total) -{ - int rc = 0, rc1 = 0, count = 0; - __u32 valid = qctl->qc_valid; +/* Fill an HSM HUR item with a given file name. + * + * If mntpath is set, then the filename is actually a FID, and no + * lookup on the filesystem will be performed. + * + * \param[in] hur the user request to fill + * \param[in] idx index of the item inside the HUR to fill + * \param[in] mntpath mountpoint of Lustre + * \param[in] fname filename (if mtnpath is NULL) + * or FID (if mntpath is set) + * \param[in] last_dev pointer to last device id used + * + * \retval 0 on success + * \retval CMD_HELP or a negative errno on error + */ +static int fill_hur_item(struct hsm_user_request *hur, unsigned int idx, + const char *mntpath, const char *fname, + dev_t *last_dev) +{ + struct hsm_user_item *hui = &hur->hur_user_item[idx]; + int rc; - rc = llapi_get_obd_count(mnt, &count, is_mdt); - if (rc) { - fprintf(stderr, "can not get %s count: %s\n", - is_mdt ? "mdt": "ost", strerror(-rc)); - return rc; - } + hui->hui_extent.length = -1; - for (qctl->qc_idx = 0; qctl->qc_idx < count; qctl->qc_idx++) { - qctl->qc_valid = is_mdt ? QC_MDTIDX : QC_OSTIDX; - rc = llapi_quotactl(mnt, qctl); - if (rc) { - /* It is remote client case. */ - if (rc == -EOPNOTSUPP) { - rc = 0; - goto out; - } + if (mntpath != NULL) { + if (*fname == '[') + fname++; + rc = sscanf(fname, SFID, RFID(&hui->hui_fid)); + if (rc == 3) { + rc = 0; + } else { + fprintf(stderr, "hsm: '%s' is not a valid FID\n", + fname); + rc = -EINVAL; + } + } else { + rc = lfs_hsm_prepare_file(fname, &hui->hui_fid, last_dev); + } - if (!rc1) - rc1 = rc; - fprintf(stderr, "quotactl %s%d failed.\n", - is_mdt ? "mdt": "ost", qctl->qc_idx); - continue; - } + if (rc == 0) + hur->hur_request.hr_itemcount++; - print_quota(obd_uuid2str(&qctl->obd_uuid), qctl, - qctl->qc_valid, 0, h); - *total += is_mdt ? qctl->qc_dqblk.dqb_ihardlimit : - qctl->qc_dqblk.dqb_bhardlimit; - } -out: - qctl->qc_valid = valid; - return rc ? : rc1; + return rc; } -static int lfs_quota(int argc, char **argv) +static int lfs_hsm_request(int argc, char **argv, int action) { - int c; - char *mnt, *name = NULL; - struct if_quotactl qctl = { .qc_cmd = LUSTRE_Q_GETQUOTA, - .qc_type = ALLQUOTA }; - char *obd_type = (char *)qctl.obd_type; - char *obd_uuid = (char *)qctl.obd_uuid.uuid; - int rc = 0, rc1 = 0, rc2 = 0, rc3 = 0, - verbose = 0, pass = 0, quiet = 0, inacc; - char *endptr; - __u32 valid = QC_GENERAL, idx = 0; - __u64 total_ialloc = 0, total_balloc = 0; - bool human_readable = false; - int qtype; + struct option long_opts[] = { + { .val = 'a', .name = "archive", .has_arg = required_argument }, + { .val = 'D', .name = "data", .has_arg = required_argument }, + { .val = 'l', .name = "filelist", .has_arg = required_argument }, + { .val = 'm', .name = "mntpath", .has_arg = required_argument }, + { .name = NULL } }; + dev_t last_dev = 0; + char short_opts[] = "l:D:a:m:"; + struct hsm_user_request *hur, *oldhur; + int c, i; + size_t len; + int nbfile; + char *line = NULL; + char *filelist = NULL; + char fullpath[PATH_MAX]; + char *opaque = NULL; + int opaque_len = 0; + int archive_id = 0; + FILE *fp; + int nbfile_alloc = 0; + char *some_file = NULL; + char *mntpath = NULL; + int rc; - while ((c = getopt(argc, argv, "gi:I:o:pqtuvh")) != -1) { + if (argc < 2) + return CMD_HELP; + + while ((c = getopt_long(argc, argv, short_opts, + long_opts, NULL)) != -1) { switch (c) { - case 'u': - qtype = USRQUOTA; - goto quota_type; - case 'g': - qtype = GRPQUOTA; - goto quota_type; - case 'p': - qtype = PRJQUOTA; -quota_type: - if (qctl.qc_type != ALLQUOTA) { - fprintf(stderr, "error: use either -u or -g\n"); - return CMD_HELP; - } - qctl.qc_type = qtype; + case 'l': + filelist = optarg; break; - case 't': - qctl.qc_cmd = LUSTRE_Q_GETINFO; - break; - case 'o': - valid = qctl.qc_valid = QC_UUID; - strlcpy(obd_uuid, optarg, sizeof(qctl.obd_uuid)); - break; - case 'i': - valid = qctl.qc_valid = QC_MDTIDX; - idx = qctl.qc_idx = atoi(optarg); - break; - case 'I': - valid = qctl.qc_valid = QC_OSTIDX; - idx = qctl.qc_idx = atoi(optarg); - break; - case 'v': - verbose = 1; - break; - case 'q': - quiet = 1; - break; - case 'h': - human_readable = true; + case 'D': + opaque = optarg; break; - default: - fprintf(stderr, "error: %s: option '-%c' " - "unrecognized\n", argv[0], c); - return CMD_HELP; - } - } - - /* current uid/gid info for "lfs quota /path/to/lustre/mount" */ - if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA && qctl.qc_type == ALLQUOTA && - optind == argc - 1) { -all_output: - memset(&qctl, 0, sizeof(qctl)); /* spoiled by print_*_quota */ - qctl.qc_cmd = LUSTRE_Q_GETQUOTA; - qctl.qc_valid = valid; - qctl.qc_idx = idx; - qctl.qc_type = pass; - switch (qctl.qc_type) { - case USRQUOTA: - qctl.qc_id = geteuid(); - rc = uid2name(&name, qctl.qc_id); + case 'a': + if (action != HUA_ARCHIVE && + action != HUA_REMOVE) { + fprintf(stderr, + "error: -a is supported only " + "when archiving or removing\n"); + return CMD_HELP; + } + archive_id = atoi(optarg); break; - case GRPQUOTA: - qctl.qc_id = getegid(); - rc = gid2name(&name, qctl.qc_id); + case 'm': + if (some_file == NULL) { + mntpath = optarg; + some_file = strdup(optarg); + } break; + case '?': + return CMD_HELP; default: - rc = -ENOTSUP; - break; - } - if (rc) - name = ""; - pass++; - /* lfs quota -u username /path/to/lustre/mount */ - } else if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA) { - /* options should be followed by u/g-name and mntpoint */ - if (optind + 2 != argc || qctl.qc_type == ALLQUOTA) { - fprintf(stderr, "error: missing quota argument(s)\n"); + fprintf(stderr, "error: %s: option '%s' unrecognized\n", + argv[0], argv[optind - 1]); return CMD_HELP; } + } - name = argv[optind++]; - switch (qctl.qc_type) { - case USRQUOTA: - rc = name2uid(&qctl.qc_id, name); - break; - case GRPQUOTA: - rc = name2gid(&qctl.qc_id, name); - break; - case PRJQUOTA: - rc = name2projid(&qctl.qc_id, name); - break; - default: - rc = -ENOTSUP; - break; + /* All remaining args are files, so we have at least nbfile */ + nbfile = argc - optind; + + if ((nbfile == 0) && (filelist == NULL)) + return CMD_HELP; + + if (opaque != NULL) + opaque_len = strlen(opaque); + + /* Alloc the request structure with enough place to store all files + * from command line. */ + hur = llapi_hsm_user_request_alloc(nbfile, opaque_len); + if (hur == NULL) { + fprintf(stderr, "Cannot create the request: %s\n", + strerror(errno)); + return errno; + } + nbfile_alloc = nbfile; + + hur->hur_request.hr_action = action; + hur->hur_request.hr_archive_id = archive_id; + hur->hur_request.hr_flags = 0; + + /* All remaining args are files, add them */ + if (nbfile != 0 && some_file == NULL) + some_file = strdup(argv[optind]); + + for (i = 0; i < nbfile; i++) { + rc = fill_hur_item(hur, i, mntpath, argv[optind + i], + &last_dev); + if (rc) + goto out_free; + } + + /* from here stop using nb_file, use hur->hur_request.hr_itemcount */ + + /* If a filelist was specified, read the filelist from it. */ + if (filelist != NULL) { + fp = fopen(filelist, "r"); + if (fp == NULL) { + fprintf(stderr, "Cannot read the file list %s: %s\n", + filelist, strerror(errno)); + rc = -errno; + goto out_free; } - if (rc) { - qctl.qc_id = strtoul(name, &endptr, 10); - if (*endptr != '\0') { - fprintf(stderr, "error: can't find id for name: %s\n", - name); - return CMD_HELP; + + while ((rc = getline(&line, &len, fp)) != -1) { + /* If allocated buffer was too small, get something + * larger */ + if (nbfile_alloc <= hur->hur_request.hr_itemcount) { + ssize_t size; + + nbfile_alloc = nbfile_alloc * 2 + 1; + oldhur = hur; + hur = llapi_hsm_user_request_alloc(nbfile_alloc, + opaque_len); + if (hur == NULL) { + fprintf(stderr, "hsm: cannot allocate " + "the request: %s\n", + strerror(errno)); + hur = oldhur; + rc = -errno; + fclose(fp); + goto out_free; + } + size = hur_len(oldhur); + if (size < 0) { + fprintf(stderr, "hsm: cannot allocate " + "%u files + %u bytes data\n", + oldhur->hur_request.hr_itemcount, + oldhur->hur_request.hr_data_len); + free(hur); + hur = oldhur; + rc = -E2BIG; + fclose(fp); + goto out_free; + } + memcpy(hur, oldhur, size); + free(oldhur); + } + + /* Chop CR */ + if (line[strlen(line) - 1] == '\n') + line[strlen(line) - 1] = '\0'; + + rc = fill_hur_item(hur, hur->hur_request.hr_itemcount, + mntpath, line, &last_dev); + if (rc) { + fclose(fp); + goto out_free; } - } - } else if (optind + 1 != argc || qctl.qc_type == ALLQUOTA) { - fprintf(stderr, "error: missing quota info argument(s)\n"); - return CMD_HELP; - } - mnt = argv[optind]; - rc1 = llapi_quotactl(mnt, &qctl); - if (rc1 < 0) { - switch (rc1) { - case -ESRCH: - fprintf(stderr, "%s quotas are not enabled.\n", - qtype_name(qctl.qc_type)); - goto out; - case -EPERM: - fprintf(stderr, "Permission denied.\n"); - case -ENODEV: - case -ENOENT: - /* We already got error message. */ - goto out; - default: - fprintf(stderr, "Unexpected quotactl error: %s\n", - strerror(-rc1)); + if (some_file == NULL) { + some_file = line; + line = NULL; + } } + + rc = fclose(fp); + free(line); } - if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA && !quiet) - print_quota_title(name, &qctl, human_readable); + /* If a --data was used, add it to the request */ + hur->hur_request.hr_data_len = opaque_len; + if (opaque != NULL) + memcpy(hur_data(hur), opaque, opaque_len); - if (rc1 && *obd_type) - fprintf(stderr, "%s %s ", obd_type, obd_uuid); + /* Send the HSM request */ + if (realpath(some_file, fullpath) == NULL) { + fprintf(stderr, "Could not find path '%s': %s\n", + some_file, strerror(errno)); + } + rc = llapi_hsm_request(fullpath, hur); + if (rc) { + fprintf(stderr, "Cannot send HSM request (use of %s): %s\n", + some_file, strerror(-rc)); + goto out_free; + } - if (qctl.qc_valid != QC_GENERAL) - mnt = ""; +out_free: + free(some_file); + free(hur); + return rc; +} - inacc = (qctl.qc_cmd == LUSTRE_Q_GETQUOTA) && - ((qctl.qc_dqblk.dqb_valid & (QIF_LIMITS|QIF_USAGE)) != - (QIF_LIMITS|QIF_USAGE)); +static int lfs_hsm_archive(int argc, char **argv) +{ + return lfs_hsm_request(argc, argv, HUA_ARCHIVE); +} - print_quota(mnt, &qctl, QC_GENERAL, rc1, human_readable); +static int lfs_hsm_restore(int argc, char **argv) +{ + return lfs_hsm_request(argc, argv, HUA_RESTORE); +} - if (qctl.qc_valid == QC_GENERAL && qctl.qc_cmd != LUSTRE_Q_GETINFO && - verbose) { - char strbuf[STRBUF_LEN]; +static int lfs_hsm_release(int argc, char **argv) +{ + return lfs_hsm_request(argc, argv, HUA_RELEASE); +} - rc2 = print_obd_quota(mnt, &qctl, 1, human_readable, - &total_ialloc); - rc3 = print_obd_quota(mnt, &qctl, 0, human_readable, - &total_balloc); - kbytes2str(total_balloc, strbuf, sizeof(strbuf), - human_readable); - printf("Total allocated inode limit: %ju, total " - "allocated block limit: %s\n", (uintmax_t)total_ialloc, - strbuf); - } +static int lfs_hsm_remove(int argc, char **argv) +{ + return lfs_hsm_request(argc, argv, HUA_REMOVE); +} - if (rc1 || rc2 || rc3 || inacc) - printf("Some errors happened when getting quota info. " - "Some devices may be not working or deactivated. " - "The data in \"[]\" is inaccurate.\n"); +static int lfs_hsm_cancel(int argc, char **argv) +{ + return lfs_hsm_request(argc, argv, HUA_CANCEL); +} -out: - if (pass > 0 && pass < LL_MAXQUOTAS) - goto all_output; +static int lfs_swap_layouts(int argc, char **argv) +{ + if (argc != 3) + return CMD_HELP; - return rc1; + return llapi_swap_layouts(argv[1], argv[2], 0, 0, + SWAP_LAYOUTS_KEEP_MTIME | + SWAP_LAYOUTS_KEEP_ATIME); } -#endif /* HAVE_SYS_QUOTA_H! */ -static int flushctx_ioctl(char *mp) -{ - int fd, rc; +static const char *const ladvise_names[] = LU_LADVISE_NAMES; - fd = open(mp, O_RDONLY); - if (fd == -1) { - fprintf(stderr, "flushctx: error open %s: %s\n", - mp, strerror(errno)); - return -1; - } +static const char *const lock_mode_names[] = LOCK_MODE_NAMES; - rc = ioctl(fd, LL_IOC_FLUSHCTX); - if (rc == -1) - fprintf(stderr, "flushctx: error ioctl %s: %s\n", - mp, strerror(errno)); +int lfs_get_mode(const char *string) +{ + enum lock_mode_user mode; - close(fd); - return rc; + for (mode = 0; mode < ARRAY_SIZE(lock_mode_names); mode++) { + if (lock_mode_names[mode] == NULL) + continue; + if (strcmp(string, lock_mode_names[mode]) == 0) + return mode; + } + + return -EINVAL; } -static int lfs_flushctx(int argc, char **argv) +static enum lu_ladvise_type lfs_get_ladvice(const char *string) { - int kdestroy = 0, c; - char mntdir[PATH_MAX] = {'\0'}; - int index = 0; - int rc = 0; + enum lu_ladvise_type advice; - while ((c = getopt(argc, argv, "k")) != -1) { - switch (c) { - case 'k': - kdestroy = 1; - break; - default: - fprintf(stderr, "error: %s: option '-%c' " - "unrecognized\n", argv[0], c); - return CMD_HELP; - } - } + for (advice = 0; + advice < ARRAY_SIZE(ladvise_names); advice++) { + if (ladvise_names[advice] == NULL) + continue; + if (strcmp(string, ladvise_names[advice]) == 0) + return advice; + } - if (kdestroy) { - if ((rc = system("kdestroy > /dev/null")) != 0) { - rc = WEXITSTATUS(rc); - fprintf(stderr, "error destroying tickets: %d, continuing\n", rc); - } - } + return LU_LADVISE_INVALID; +} - if (optind >= argc) { - /* flush for all mounted lustre fs. */ - while (!llapi_search_mounts(NULL, index++, mntdir, NULL)) { - /* Check if we have a mount point */ - if (mntdir[0] == '\0') - continue; +static int lfs_ladvise(int argc, char **argv) +{ + struct option long_opts[] = { + { .val = 'a', .name = "advice", .has_arg = required_argument }, + { .val = 'b', .name = "background", .has_arg = no_argument }, + { .val = 'e', .name = "end", .has_arg = required_argument }, + { .val = 'l', .name = "length", .has_arg = required_argument }, + { .val = 'm', .name = "mode", .has_arg = required_argument }, + { .val = 's', .name = "start", .has_arg = required_argument }, + { .val = 'u', .name = "unset", .has_arg = no_argument }, + { .name = NULL } }; + char short_opts[] = "a:be:l:m:s:u"; + int c; + int rc = 0; + const char *path; + int fd; + struct llapi_lu_ladvise advice; + enum lu_ladvise_type advice_type = LU_LADVISE_INVALID; + unsigned long long start = 0; + unsigned long long end = LUSTRE_EOF; + unsigned long long length = 0; + unsigned long long size_units; + unsigned long long flags = 0; + int mode = 0; - if (flushctx_ioctl(mntdir)) - rc = -1; + optind = 0; + while ((c = getopt_long(argc, argv, short_opts, + long_opts, NULL)) != -1) { + switch (c) { + case 'a': + advice_type = lfs_get_ladvice(optarg); + if (advice_type == LU_LADVISE_INVALID) { + fprintf(stderr, "%s: invalid advice type " + "'%s'\n", argv[0], optarg); + fprintf(stderr, "Valid types:"); - mntdir[0] = '\0'; /* avoid matching in next loop */ + for (advice_type = 0; + advice_type < ARRAY_SIZE(ladvise_names); + advice_type++) { + if (ladvise_names[advice_type] == NULL) + continue; + fprintf(stderr, " %s", + ladvise_names[advice_type]); + } + fprintf(stderr, "\n"); + + return CMD_HELP; + } + break; + case 'b': + flags |= LF_ASYNC; + break; + case 'u': + flags |= LF_UNSET; + break; + case 'e': + size_units = 1; + rc = llapi_parse_size(optarg, &end, + &size_units, 0); + if (rc) { + fprintf(stderr, "%s: bad end offset '%s'\n", + argv[0], optarg); + return CMD_HELP; + } + break; + case 's': + size_units = 1; + rc = llapi_parse_size(optarg, &start, + &size_units, 0); + if (rc) { + fprintf(stderr, "%s: bad start offset " + "'%s'\n", argv[0], optarg); + return CMD_HELP; + } + break; + case 'l': + size_units = 1; + rc = llapi_parse_size(optarg, &length, + &size_units, 0); + if (rc) { + fprintf(stderr, "%s: bad length '%s'\n", + argv[0], optarg); + return CMD_HELP; + } + break; + case 'm': + mode = lfs_get_mode(optarg); + if (mode < 0) { + fprintf(stderr, "%s: bad mode '%s', valid " + "modes are READ or WRITE\n", + argv[0], optarg); + return CMD_HELP; + } + break; + case '?': + return CMD_HELP; + default: + fprintf(stderr, "%s: option '%s' unrecognized\n", + argv[0], argv[optind - 1]); + return CMD_HELP; } - } else { - /* flush fs as specified */ - while (optind < argc) { - if (flushctx_ioctl(argv[optind++])) - rc = -1; - } - } - return rc; -} + } -static int lfs_cp(int argc, char **argv) -{ - fprintf(stderr, "remote client copy file(s).\n" - "obsolete, does not support it anymore.\n"); - return 0; -} + if (advice_type == LU_LADVISE_INVALID) { + fprintf(stderr, "%s: please give an advice type\n", argv[0]); + fprintf(stderr, "Valid types:"); + for (advice_type = 0; advice_type < ARRAY_SIZE(ladvise_names); + advice_type++) { + if (ladvise_names[advice_type] == NULL) + continue; + fprintf(stderr, " %s", ladvise_names[advice_type]); + } + fprintf(stderr, "\n"); + return CMD_HELP; + } -static int lfs_ls(int argc, char **argv) -{ - fprintf(stderr, "remote client lists directory contents.\n" - "obsolete, does not support it anymore.\n"); - return 0; -} + if (advice_type == LU_LADVISE_LOCKNOEXPAND) { + fprintf(stderr, "%s: Lock no expand advice is a per file " + "descriptor advice, so when called from lfs, " + "it does nothing.\n", argv[0]); + return CMD_HELP; + } -static int lfs_changelog(int argc, char **argv) -{ - void *changelog_priv; - struct changelog_rec *rec; - long long startrec = 0, endrec = 0; - char *mdd; - struct option long_opts[] = { - { .val = 'f', .name = "follow", .has_arg = no_argument }, - { .name = NULL } }; - char short_opts[] = "f"; - int rc, follow = 0; + if (argc <= optind) { + fprintf(stderr, "%s: please give one or more file names\n", + argv[0]); + return CMD_HELP; + } - while ((rc = getopt_long(argc, argv, short_opts, - long_opts, NULL)) != -1) { - switch (rc) { - case 'f': - follow++; - break; - case '?': - return CMD_HELP; - default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } - } - if (optind >= argc) - return CMD_HELP; + if (end != LUSTRE_EOF && length != 0 && end != start + length) { + fprintf(stderr, "%s: conflicting arguments of -l and -e\n", + argv[0]); + return CMD_HELP; + } - mdd = argv[optind++]; - if (argc > optind) - startrec = strtoll(argv[optind++], NULL, 10); - if (argc > optind) - endrec = strtoll(argv[optind++], NULL, 10); + if (end == LUSTRE_EOF && length != 0) + end = start + length; - rc = llapi_changelog_start(&changelog_priv, - CHANGELOG_FLAG_BLOCK | - CHANGELOG_FLAG_JOBID | - (follow ? CHANGELOG_FLAG_FOLLOW : 0), - mdd, startrec); - if (rc < 0) { - fprintf(stderr, "Can't start changelog: %s\n", - strerror(errno = -rc)); - return rc; + if (end <= start) { + fprintf(stderr, "%s: range [%llu, %llu] is invalid\n", + argv[0], start, end); + return CMD_HELP; } - while ((rc = llapi_changelog_recv(changelog_priv, &rec)) == 0) { - time_t secs; - struct tm ts; + if (advice_type != LU_LADVISE_LOCKAHEAD && mode != 0) { + fprintf(stderr, "%s: mode is only valid with lockahead\n", + argv[0]); + return CMD_HELP; + } - if (endrec && rec->cr_index > endrec) { - llapi_changelog_free(&rec); - break; - } - if (rec->cr_index < startrec) { - llapi_changelog_free(&rec); - continue; - } + if (advice_type == LU_LADVISE_LOCKAHEAD && mode == 0) { + fprintf(stderr, "%s: mode is required with lockahead\n", + argv[0]); + return CMD_HELP; + } - secs = rec->cr_time >> 30; - gmtime_r(&secs, &ts); - printf("%ju %02d%-5s %02d:%02d:%02d.%09d %04d.%02d.%02d " - "0x%x t="DFID, (uintmax_t)rec->cr_index, rec->cr_type, - changelog_type2str(rec->cr_type), - ts.tm_hour, ts.tm_min, ts.tm_sec, - (int)(rec->cr_time & ((1 << 30) - 1)), - ts.tm_year + 1900, ts.tm_mon + 1, ts.tm_mday, - rec->cr_flags & CLF_FLAGMASK, PFID(&rec->cr_tfid)); + while (optind < argc) { + int rc2; - if (rec->cr_flags & CLF_JOBID) { - struct changelog_ext_jobid *jid = - changelog_rec_jobid(rec); + path = argv[optind++]; - if (jid->cr_jobid[0] != '\0') - printf(" j=%s", jid->cr_jobid); + fd = open(path, O_RDONLY); + if (fd < 0) { + fprintf(stderr, "%s: cannot open file '%s': %s\n", + argv[0], path, strerror(errno)); + rc2 = -errno; + goto next; } - if (rec->cr_namelen) - printf(" p="DFID" %.*s", PFID(&rec->cr_pfid), - rec->cr_namelen, changelog_rec_name(rec)); - - if (rec->cr_flags & CLF_RENAME) { - struct changelog_ext_rename *rnm = - changelog_rec_rename(rec); - - if (!fid_is_zero(&rnm->cr_sfid)) - printf(" s="DFID" sp="DFID" %.*s", - PFID(&rnm->cr_sfid), - PFID(&rnm->cr_spfid), - (int)changelog_rec_snamelen(rec), - changelog_rec_sname(rec)); + advice.lla_start = start; + advice.lla_end = end; + advice.lla_advice = advice_type; + advice.lla_value1 = 0; + advice.lla_value2 = 0; + advice.lla_value3 = 0; + advice.lla_value4 = 0; + if (advice_type == LU_LADVISE_LOCKAHEAD) { + advice.lla_lockahead_mode = mode; + advice.lla_peradvice_flags = flags; } - printf("\n"); - llapi_changelog_free(&rec); - } - - llapi_changelog_fini(&changelog_priv); + rc2 = llapi_ladvise(fd, flags, 1, &advice); + close(fd); + if (rc2 < 0) { + fprintf(stderr, "%s: cannot give advice '%s' to file " + "'%s': %s\n", argv[0], + ladvise_names[advice_type], + path, strerror(errno)); - if (rc < 0) - fprintf(stderr, "Changelog: %s\n", strerror(errno = -rc)); + goto next; + } - return (rc == 1 ? 0 : rc); +next: + if (rc == 0 && rc2 < 0) + rc = rc2; + } + return rc; } -static int lfs_changelog_clear(int argc, char **argv) +/** The input string contains a comma delimited list of component ids and + * ranges, for example "1,2-4,7". + */ +static int parse_mirror_ids(__u16 *ids, int size, char *arg) { - long long endrec; + bool end_of_loop = false; + char *ptr = NULL; + int nr = 0; int rc; - if (argc != 4) - return CMD_HELP; - - endrec = strtoll(argv[3], NULL, 10); + if (arg == NULL) + return -EINVAL; - rc = llapi_changelog_clear(argv[1], argv[2], endrec); + while (!end_of_loop) { + int start_index; + int end_index; + int i; + char *endptr = NULL; - if (rc == -EINVAL) - fprintf(stderr, "%s: record out of range: %llu\n", - argv[0], endrec); - else if (rc == -ENOENT) - fprintf(stderr, "%s: no changelog user: %s\n", - argv[0], argv[2]); - else if (rc) - fprintf(stderr, "%s error: %s\n", argv[0], - strerror(-rc)); + rc = -EINVAL; + ptr = strchrnul(arg, ','); + end_of_loop = *ptr == '\0'; + *ptr = '\0'; - if (rc) - errno = -rc; + start_index = strtol(arg, &endptr, 0); + if (endptr == arg) /* no data at all */ + break; + if (*endptr != '-' && *endptr != '\0') /* has invalid data */ + break; + if (start_index < 0) + break; - return rc; -} + end_index = start_index; + if (*endptr == '-') { + end_index = strtol(endptr + 1, &endptr, 0); + if (*endptr != '\0') + break; + if (end_index < start_index) + break; + } -static int lfs_fid2path(int argc, char **argv) -{ - struct option long_opts[] = { - { .val = 'c', .name = "cur", .has_arg = no_argument }, - { .val = 'l', .name = "link", .has_arg = required_argument }, - { .val = 'r', .name = "rec", .has_arg = required_argument }, - { .name = NULL } }; - char short_opts[] = "cl:r:"; - char *device, *fid, *path; - long long recno = -1; - int linkno = -1; - int lnktmp; - int printcur = 0; - int rc = 0; + for (i = start_index; i <= end_index && size > 0; i++) { + int j; - while ((rc = getopt_long(argc, argv, short_opts, - long_opts, NULL)) != -1) { - switch (rc) { - case 'c': - printcur++; - break; - case 'l': - linkno = strtol(optarg, NULL, 10); - break; - case 'r': - recno = strtoll(optarg, NULL, 10); - break; - case '?': - return CMD_HELP; - default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } - } + /* remove duplicate */ + for (j = 0; j < nr; j++) { + if (ids[j] == i) + break; + } + if (j == nr) { /* no duplicate */ + ids[nr++] = i; + --size; + } + } - if (argc < 3) - return CMD_HELP; + if (size == 0 && i < end_index) + break; - device = argv[optind++]; - path = calloc(1, PATH_MAX); - if (path == NULL) { - fprintf(stderr, "error: Not enough memory\n"); - return -errno; + *ptr = ','; + arg = ++ptr; + rc = 0; } + if (!end_of_loop && ptr != NULL) + *ptr = ','; - rc = 0; - while (optind < argc) { - fid = argv[optind++]; + return rc < 0 ? rc : nr; +} - lnktmp = (linkno >= 0) ? linkno : 0; - while (1) { - int oldtmp = lnktmp; - long long rectmp = recno; - int rc2; - rc2 = llapi_fid2path(device, fid, path, PATH_MAX, - &rectmp, &lnktmp); - if (rc2 < 0) { - fprintf(stderr, "%s: error on FID %s: %s\n", - argv[0], fid, strerror(errno = -rc2)); - if (rc == 0) - rc = rc2; - break; - } +/** + * struct verify_mirror_id - Mirror id to be verified. + * @mirror_id: A specified mirror id. + * @is_valid_id: @mirror_id is valid or not in the mirrored file. + */ +struct verify_mirror_id { + __u16 mirror_id; + bool is_valid_id; +}; - if (printcur) - fprintf(stdout, "%lld ", rectmp); - if (device[0] == '/') { - fprintf(stdout, "%s", device); - if (device[strlen(device) - 1] != '/') - fprintf(stdout, "/"); - } else if (path[0] == '\0') { - fprintf(stdout, "/"); - } - fprintf(stdout, "%s\n", path); +/** + * compare_mirror_ids() - Compare mirror ids. + * @layout: Mirror component list. + * @cbdata: Callback data in verify_mirror_id structure. + * + * This is a callback function called by llapi_layout_comp_iterate() + * to compare the specified mirror id with the one in the current + * component of @layout. If they are the same, then the specified + * mirror id is valid. + * + * Return: a negative error code on failure or + * LLAPI_LAYOUT_ITER_CONT: Proceed iteration + * LLAPI_LAYOUT_ITER_STOP: Stop iteration + */ +static inline +int compare_mirror_ids(struct llapi_layout *layout, void *cbdata) +{ + struct verify_mirror_id *mirror_id_cbdata = + (struct verify_mirror_id *)cbdata; + uint32_t mirror_id; + int rc = 0; - if (linkno >= 0) - /* specified linkno */ - break; - if (oldtmp == lnktmp) - /* no more links */ - break; - } + rc = llapi_layout_mirror_id_get(layout, &mirror_id); + if (rc < 0) { + rc = -errno; + fprintf(stderr, + "%s: llapi_layout_mirror_id_get failed: %s.\n", + progname, strerror(errno)); + return rc; } - free(path); - return rc; + if (mirror_id_cbdata->mirror_id == mirror_id) { + mirror_id_cbdata->is_valid_id = true; + return LLAPI_LAYOUT_ITER_STOP; + } + + return LLAPI_LAYOUT_ITER_CONT; } -static int lfs_path2fid(int argc, char **argv) +/** + * verify_mirror_ids() - Verify specified mirror ids. + * @fname: Mirrored file name. + * @mirror_ids: Specified mirror ids to be verified. + * @ids_nr: Number of specified mirror ids. + * + * This function verifies that specified @mirror_ids are valid + * in the mirrored file @fname. + * + * Return: 0 on success or a negative error code on failure. + */ +static inline +int verify_mirror_ids(const char *fname, __u16 *mirror_ids, int ids_nr) { - struct option long_opts[] = { - { .val = 'p', .name = "parents", .has_arg = no_argument }, - { .name = NULL } }; - char **path; - const char short_opts[] = "p"; - const char *sep = ""; - lustre_fid fid; - int rc = 0; - bool show_parents = false; + struct llapi_layout *layout = NULL; + struct verify_mirror_id mirror_id_cbdata = { 0 }; + struct stat stbuf; + uint32_t flr_state; + int i; + int fd; + int rc = 0; + int rc2 = 0; - while ((rc = getopt_long(argc, argv, short_opts, - long_opts, NULL)) != -1) { - switch (rc) { - case 'p': - show_parents = true; - break; - default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } + if (ids_nr <= 0) + return -EINVAL; + + if (stat(fname, &stbuf) < 0) { + fprintf(stderr, "%s: cannot stat file '%s': %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto error; } - if (optind > argc - 1) - return CMD_HELP; - else if (optind < argc - 1) - sep = ": "; + if (!S_ISREG(stbuf.st_mode)) { + fprintf(stderr, "%s: '%s' is not a regular file.\n", + progname, fname); + rc = -EINVAL; + goto error; + } - rc = 0; - for (path = argv + optind; *path != NULL; path++) { - int err = 0; - if (!show_parents) { - err = llapi_path2fid(*path, &fid); - if (!err) - printf("%s%s"DFID"\n", - *sep != '\0' ? *path : "", sep, - PFID(&fid)); - } else { - char name[NAME_MAX + 1]; - unsigned int linkno = 0; + fd = open(fname, O_DIRECT | O_RDONLY); + if (fd < 0) { + fprintf(stderr, "%s: cannot open '%s': %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto error; + } - while ((err = llapi_path2parent(*path, linkno, &fid, - name, sizeof(name))) == 0) { - if (*sep != '\0' && linkno == 0) - printf("%s%s", *path, sep); + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); + if (rc < 0) { + fprintf(stderr, "%s: '%s' llapi_lease_acquire failed: %s.\n", + progname, fname, strerror(errno)); + goto close_fd; + } - printf("%s"DFID"/%s", linkno != 0 ? "\t" : "", - PFID(&fid), name); - linkno++; - } + layout = llapi_layout_get_by_fd(fd, 0); + if (layout == NULL) { + fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + llapi_lease_release(fd); + goto close_fd; + } - /* err == -ENODATA is end-of-loop */ - if (linkno > 0 && err == -ENODATA) { - printf("\n"); - err = 0; - } + rc = llapi_layout_flags_get(layout, &flr_state); + if (rc < 0) { + fprintf(stderr, "%s: '%s' llapi_layout_flags_get failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto free_layout; + } + + flr_state &= LCM_FL_FLR_MASK; + switch (flr_state) { + case LCM_FL_NONE: + rc = -EINVAL; + fprintf(stderr, "%s: '%s' file state error: %s.\n", + progname, fname, llapi_layout_flags_string(flr_state)); + goto free_layout; + default: + break; + } + + rc2 = 0; + for (i = 0; i < ids_nr; i++) { + mirror_id_cbdata.mirror_id = mirror_ids[i]; + mirror_id_cbdata.is_valid_id = false; + + rc = llapi_layout_comp_iterate(layout, compare_mirror_ids, + &mirror_id_cbdata); + if (rc < 0) { + rc = -errno; + fprintf(stderr, + "%s: '%s' failed to verify mirror id: %u.\n", + progname, fname, mirror_ids[i]); + goto free_layout; } - if (err) { - fprintf(stderr, "%s: can't get %sfid for %s: %s\n", - argv[0], show_parents ? "parent " : "", *path, - strerror(-err)); - if (rc == 0) { - rc = err; - errno = -err; - } + if (!mirror_id_cbdata.is_valid_id) { + rc2 = -EINVAL; + fprintf(stderr, + "%s: '%s' invalid specified mirror id: %u.\n", + progname, fname, mirror_ids[i]); } } + rc = rc2; +free_layout: + llapi_layout_free(layout); + llapi_lease_release(fd); +close_fd: + close(fd); +error: return rc; } -static int lfs_data_version(int argc, char **argv) +static inline +int lfs_mirror_resync_file(const char *fname, struct ll_ioc_lease *ioc, + __u16 *mirror_ids, int ids_nr) { - char *path; - __u64 data_version; + struct llapi_resync_comp comp_array[1024] = { { 0 } }; + struct llapi_layout *layout; + struct stat stbuf; + uint32_t flr_state; + int comp_size = 0; + int idx; int fd; int rc; - int c; - int data_version_flags = LL_DV_RD_FLUSH; /* Read by default */ - if (argc < 2) - return CMD_HELP; + if (stat(fname, &stbuf) < 0) { + fprintf(stderr, "%s: cannot stat file '%s': %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto error; + } + if (!S_ISREG(stbuf.st_mode)) { + fprintf(stderr, "%s: '%s' is not a regular file.\n", + progname, fname); + rc = -EINVAL; + goto error; + } - while ((c = getopt(argc, argv, "nrw")) != -1) { - switch (c) { - case 'n': - data_version_flags = 0; - break; - case 'r': - data_version_flags |= LL_DV_RD_FLUSH; - break; - case 'w': - data_version_flags |= LL_DV_WR_FLUSH; - break; - default: - return CMD_HELP; - } + fd = open(fname, O_DIRECT | O_RDWR); + if (fd < 0) { + fprintf(stderr, "%s: cannot open '%s': %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto error; } - if (optind == argc) - return CMD_HELP; - path = argv[optind]; - fd = open(path, O_RDONLY); - if (fd < 0) - err(errno, "cannot open file %s", path); + layout = llapi_layout_get_by_fd(fd, 0); + if (layout == NULL) { + fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto close_fd; + } - rc = llapi_get_data_version(fd, &data_version, data_version_flags); - if (rc < 0) - err(errno, "cannot get version for %s", path); - else - printf("%ju" "\n", (uintmax_t)data_version); + rc = llapi_layout_flags_get(layout, &flr_state); + if (rc) { + fprintf(stderr, "%s: '%s' llapi_layout_flags_get failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto free_layout; + } - close(fd); - return rc; -} + flr_state &= LCM_FL_FLR_MASK; + if (flr_state == LCM_FL_NONE) { + rc = -EINVAL; + fprintf(stderr, "%s: '%s' is not a FLR file.\n", + progname, fname); + goto free_layout; + } -static int lfs_hsm_state(int argc, char **argv) -{ - int rc; - int i = 1; - char *path; - struct hsm_user_state hus; + /* get stale component info */ + comp_size = llapi_mirror_find_stale(layout, comp_array, + ARRAY_SIZE(comp_array), + mirror_ids, ids_nr); + if (comp_size <= 0) { + rc = comp_size; + goto free_layout; + } - if (argc < 2) - return CMD_HELP; + ioc->lil_mode = LL_LEASE_WRLCK; + ioc->lil_flags = LL_LEASE_RESYNC; + rc = llapi_lease_set(fd, ioc); + if (rc < 0) { + if (rc == -EALREADY) + rc = 0; + else + fprintf(stderr, + "%s: '%s' llapi_lease_get_ext resync failed: %s.\n", + progname, fname, strerror(errno)); + goto free_layout; + } - do { - path = argv[i]; + idx = 0; + while (idx < comp_size) { + ssize_t result; + uint64_t end; + __u16 mirror_id; + int i; - rc = llapi_hsm_state_get(path, &hus); - if (rc) { - fprintf(stderr, "can't get hsm state for %s: %s\n", - path, strerror(errno = -rc)); - return rc; + rc = llapi_lease_check(fd); + if (rc != LL_LEASE_WRLCK) { + fprintf(stderr, "%s: '%s' lost lease lock.\n", + progname, fname); + goto free_layout; } - /* Display path name and status flags */ - printf("%s: (0x%08x)", path, hus.hus_states); + mirror_id = comp_array[idx].lrc_mirror_id; + end = comp_array[idx].lrc_end; - if (hus.hus_states & HS_RELEASED) - printf(" released"); - if (hus.hus_states & HS_EXISTS) - printf(" exists"); - if (hus.hus_states & HS_DIRTY) - printf(" dirty"); - if (hus.hus_states & HS_ARCHIVED) - printf(" archived"); - /* Display user-settable flags */ - if (hus.hus_states & HS_NORELEASE) - printf(" never_release"); - if (hus.hus_states & HS_NOARCHIVE) - printf(" never_archive"); - if (hus.hus_states & HS_LOST) - printf(" lost_from_hsm"); + /* try to combine adjacent component */ + for (i = idx + 1; i < comp_size; i++) { + if (mirror_id != comp_array[i].lrc_mirror_id || + end != comp_array[i].lrc_start) + break; + end = comp_array[i].lrc_end; + } + + result = llapi_mirror_resync_one(fd, layout, mirror_id, + comp_array[idx].lrc_start, + end); + if (result < 0) { + fprintf(stderr, "%s: '%s' llapi_mirror_resync_one: " + "%ld.\n", progname, fname, result); + rc = result; + goto unlock; + } else if (result > 0) { + int j; + + /* mark synced components */ + for (j = idx; j < i; j++) + comp_array[j].lrc_synced = true; + } + + idx = i; + } - if (hus.hus_archive_id != 0) - printf(", archive_id:%d", hus.hus_archive_id); - printf("\n"); +unlock: + /* prepare ioc for lease put */ + ioc->lil_mode = LL_LEASE_UNLCK; + ioc->lil_flags = LL_LEASE_RESYNC_DONE; + ioc->lil_count = 0; + for (idx = 0; idx < comp_size; idx++) { + if (comp_array[idx].lrc_synced) { + ioc->lil_ids[ioc->lil_count] = comp_array[idx].lrc_id; + ioc->lil_count++; + } + } - } while (++i < argc); + rc = llapi_lease_set(fd, ioc); + if (rc <= 0) { + if (rc == 0) /* lost lease lock */ + rc = -EBUSY; + fprintf(stderr, "%s: resync file '%s' failed: %s.\n", + progname, fname, strerror(errno)); + goto free_layout; + } + /** + * llapi_lease_set returns lease mode when it request to unlock + * the lease lock + */ + rc = 0; - return 0; +free_layout: + llapi_layout_free(layout); +close_fd: + close(fd); +error: + return rc; } -#define LFS_HSM_SET 0 -#define LFS_HSM_CLEAR 1 - -/** - * Generic function to set or clear HSM flags. - * Used by hsm_set and hsm_clear. - * - * @mode if LFS_HSM_SET, set the flags, if LFS_HSM_CLEAR, clear the flags. - */ -static int lfs_hsm_change_flags(int argc, char **argv, int mode) +static inline int lfs_mirror_resync(int argc, char **argv) { + struct ll_ioc_lease *ioc = NULL; + __u16 mirror_ids[128] = { 0 }; + int ids_nr = 0; + int c; + int rc = 0; + struct option long_opts[] = { - { .val = 'A', .name = "archived", .has_arg = no_argument }, - { .val = 'a', .name = "noarchive", .has_arg = no_argument }, - { .val = 'd', .name = "dirty", .has_arg = no_argument }, - { .val = 'e', .name = "exists", .has_arg = no_argument }, - { .val = 'l', .name = "lost", .has_arg = no_argument }, - { .val = 'r', .name = "norelease", .has_arg = no_argument }, + { .val = 'o', .name = "only", .has_arg = required_argument }, { .name = NULL } }; - char short_opts[] = "lraAde"; - __u64 mask = 0; - int c, rc; - char *path; - - if (argc < 3) - return CMD_HELP; - while ((c = getopt_long(argc, argv, short_opts, - long_opts, NULL)) != -1) { + while ((c = getopt_long(argc, argv, "o:", long_opts, NULL)) >= 0) { switch (c) { - case 'l': - mask |= HS_LOST; - break; - case 'a': - mask |= HS_NOARCHIVE; - break; - case 'A': - mask |= HS_ARCHIVED; - break; - case 'r': - mask |= HS_NORELEASE; - break; - case 'd': - mask |= HS_DIRTY; - break; - case 'e': - mask |= HS_EXISTS; + case 'o': + rc = parse_mirror_ids(mirror_ids, + sizeof(mirror_ids) / sizeof(__u16), + optarg); + if (rc < 0) { + fprintf(stderr, + "%s: bad mirror ids '%s'.\n", + argv[0], optarg); + goto error; + } + ids_nr = rc; break; - case '?': - return CMD_HELP; default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", + fprintf(stderr, "%s: options '%s' unrecognized.\n", argv[0], argv[optind - 1]); - return CMD_HELP; + rc = -EINVAL; + goto error; } } - /* User should have specified a flag */ - if (mask == 0) - return CMD_HELP; - - while (optind < argc) { - - path = argv[optind]; + if (argc == optind) { + fprintf(stderr, "%s: no file name given.\n", argv[0]); + rc = CMD_HELP; + goto error; + } - /* If mode == 0, this means we apply the mask. */ - if (mode == LFS_HSM_SET) - rc = llapi_hsm_state_set(path, mask, 0, 0); - else - rc = llapi_hsm_state_set(path, 0, mask, 0); + if (ids_nr > 0 && argc > optind + 1) { + fprintf(stderr, + "%s: option '--only' cannot be used upon multiple files.\n", + argv[0]); + rc = CMD_HELP; + goto error; - if (rc != 0) { - fprintf(stderr, "Can't change hsm flags for %s: %s\n", - path, strerror(errno = -rc)); - return rc; - } - optind++; } - return 0; -} + if (ids_nr > 0) { + rc = verify_mirror_ids(argv[optind], mirror_ids, ids_nr); + if (rc < 0) + goto error; + } -static int lfs_hsm_action(int argc, char **argv) -{ - int rc; - int i = 1; - char *path; - struct hsm_current_action hca; - struct hsm_extent he; - enum hsm_user_action hua; - enum hsm_progress_states hps; + /* set the lease on the file */ + ioc = calloc(sizeof(*ioc) + sizeof(__u32) * 4096, 1); + if (ioc == NULL) { + fprintf(stderr, "%s: cannot alloc id array for ioc: %s.\n", + argv[0], strerror(errno)); + rc = -errno; + goto error; + } - if (argc < 2) - return CMD_HELP; + for (; optind < argc; optind++) { + rc = lfs_mirror_resync_file(argv[optind], ioc, + mirror_ids, ids_nr); + /* ignore previous file's error, continue with next file */ - do { - path = argv[i]; + /* reset ioc */ + memset(ioc, 0, sizeof(__u32) * 4096); + } - rc = llapi_hsm_current_action(path, &hca); - if (rc) { - fprintf(stderr, "can't get hsm action for %s: %s\n", - path, strerror(errno = -rc)); - return rc; - } - he = hca.hca_location; - hua = hca.hca_action; - hps = hca.hca_state; + free(ioc); +error: + return rc; +} - printf("%s: %s", path, hsm_user_action2name(hua)); +/** + * struct verify_chunk - Mirror chunk to be verified. + * @chunk: [start, end) of the chunk. + * @mirror_count: Number of mirror ids in @mirror_id array. + * @mirror_id: Array of valid mirror ids that cover the chunk. + */ +struct verify_chunk { + struct lu_extent chunk; + unsigned int mirror_count; + __u16 mirror_id[LUSTRE_MIRROR_COUNT_MAX]; +}; - /* Skip file without action */ - if (hca.hca_action == HUA_NONE) { - printf("\n"); - continue; +/** + * print_chunks() - Print chunk information. + * @fname: Mirrored file name. + * @chunks: Array of chunks. + * @chunk_count: Number of chunks in @chunks array. + * + * This function prints [start, end) of each chunk in @chunks + * for mirrored file @fname, and also prints the valid mirror ids + * that cover the chunk. + * + * Return: void. + */ +static inline +void print_chunks(const char *fname, struct verify_chunk *chunks, + int chunk_count) +{ + int i; + int j; + + fprintf(stdout, "Chunks to be verified in %s:\n", fname); + for (i = 0; i < chunk_count; i++) { + fprintf(stdout, DEXT, PEXT(&chunks[i].chunk)); + + if (chunks[i].mirror_count == 0) + fprintf(stdout, "\t["); + else { + fprintf(stdout, "\t[%u", chunks[i].mirror_id[0]); + for (j = 1; j < chunks[i].mirror_count; j++) + fprintf(stdout, ", %u", chunks[i].mirror_id[j]); } - - printf(" %s ", hsm_progress_state2name(hps)); - - if ((hps == HPS_RUNNING) && - (hua == HUA_ARCHIVE || hua == HUA_RESTORE)) - printf("(%llu bytes moved)\n", - (unsigned long long)he.length); - else if ((he.offset + he.length) == LUSTRE_EOF) - printf("(from %llu to EOF)\n", - (unsigned long long)he.offset); - else - printf("(from %llu to %llu)\n", - (unsigned long long)he.offset, - (unsigned long long)(he.offset + he.length)); - - } while (++i < argc); - - return 0; + fprintf(stdout, "]\t%u\n", chunks[i].mirror_count); + } + fprintf(stdout, "\n"); } -static int lfs_hsm_set(int argc, char **argv) +/** + * print_checksums() - Print CRC-32 checksum values. + * @chunk: A chunk and its corresponding valid mirror ids. + * @crc: CRC-32 checksum values on the chunk for each valid mirror. + * + * This function prints CRC-32 checksum values on @chunk for + * each valid mirror that covers it. + * + * Return: void. + */ +static inline +void print_checksums(struct verify_chunk *chunk, unsigned long *crc) { - return lfs_hsm_change_flags(argc, argv, LFS_HSM_SET); -} + int i; -static int lfs_hsm_clear(int argc, char **argv) -{ - return lfs_hsm_change_flags(argc, argv, LFS_HSM_CLEAR); + fprintf(stdout, + "CRC-32 checksum value for chunk "DEXT":\n", + PEXT(&chunk->chunk)); + for (i = 0; i < chunk->mirror_count; i++) + fprintf(stdout, "Mirror %u:\t%#lx\n", + chunk->mirror_id[i], crc[i]); + fprintf(stdout, "\n"); } /** - * Check file state and return its fid, to be used by lfs_hsm_request(). + * filter_mirror_id() - Filter specified mirror ids. + * @chunks: Array of chunks. + * @chunk_count: Number of chunks in @chunks array. + * @mirror_ids: Specified mirror ids to be verified. + * @ids_nr: Number of specified mirror ids. * - * \param[in] file Path to file to check - * \param[in,out] fid Pointer to allocated lu_fid struct. - * \param[in,out] last_dev Pointer to last device id used. + * This function scans valid mirror ids that cover each chunk in @chunks + * and filters specified mirror ids. * - * \return 0 on success. + * Return: void. */ -static int lfs_hsm_prepare_file(const char *file, struct lu_fid *fid, - dev_t *last_dev) +static inline +void filter_mirror_id(struct verify_chunk *chunks, int chunk_count, + __u16 *mirror_ids, int ids_nr) { - struct stat st; - int rc; + int i; + int j; + int k; + __u16 valid_id[LUSTRE_MIRROR_COUNT_MAX] = { 0 }; + unsigned int valid_count = 0; - rc = lstat(file, &st); - if (rc) { - fprintf(stderr, "Cannot stat %s: %s\n", file, strerror(errno)); - return -errno; - } - /* Checking for regular file as archiving as posix copytool - * rejects archiving files other than regular files - */ - if (!S_ISREG(st.st_mode)) { - fprintf(stderr, "error: \"%s\" is not a regular file\n", file); - return CMD_HELP; - } - /* A request should be ... */ - if (*last_dev != st.st_dev && *last_dev != 0) { - fprintf(stderr, "All files should be " - "on the same filesystem: %s\n", file); - return -EINVAL; - } - *last_dev = st.st_dev; + for (i = 0; i < chunk_count; i++) { + if (chunks[i].mirror_count == 0) + continue; - rc = llapi_path2fid(file, fid); - if (rc) { - fprintf(stderr, "Cannot read FID of %s: %s\n", - file, strerror(-rc)); - return rc; + valid_count = 0; + for (j = 0; j < ids_nr; j++) { + for (k = 0; k < chunks[i].mirror_count; k++) { + if (chunks[i].mirror_id[k] == mirror_ids[j]) { + valid_id[valid_count] = mirror_ids[j]; + valid_count++; + break; + } + } + } + + memcpy(chunks[i].mirror_id, valid_id, + sizeof(__u16) * valid_count); + chunks[i].mirror_count = valid_count; } - return 0; } -/* Fill an HSM HUR item with a given file name. +/** + * lfs_mirror_prepare_chunk() - Find mirror chunks to be verified. + * @layout: Mirror component list. + * @chunks: Array of chunks. + * @chunks_size: Array size of @chunks. * - * If mntpath is set, then the filename is actually a FID, and no - * lookup on the filesystem will be performed. + * This function scans the components in @layout from offset 0 to LUSTRE_EOF + * to find out chunk segments and store them in @chunks array. * - * \param[in] hur the user request to fill - * \param[in] idx index of the item inside the HUR to fill - * \param[in] mntpath mountpoint of Lustre - * \param[in] fname filename (if mtnpath is NULL) - * or FID (if mntpath is set) - * \param[in] last_dev pointer to last device id used + * The @mirror_id array in each element of @chunks will store the valid + * mirror ids that cover the chunk. If a mirror component covering the + * chunk has LCME_FL_STALE or LCME_FL_OFFLINE flag, then the mirror id + * will not be stored into the @mirror_id array, and the chunk for that + * mirror will not be verified. * - * \retval 0 on success - * \retval CMD_HELP or a negative errno on error + * The @mirror_count in each element of @chunks will store the number of + * mirror ids in @mirror_id array. If @mirror_count is 0, it indicates the + * chunk is invalid in all of the mirrors. And if @mirror_count is 1, it + * indicates the chunk is valid in only one mirror. In both cases, the + * chunk will not be verified. + * + * Here is an example: + * + * 0 1M 2M 3M 4M EOF + * +------+-------------+--------------------+ + * | | | S | mirror1 + * +------+------+------+------+-------------+ + * | | S | S | | mirror2 + * +-------------+------+------+-------------+ + * + * prepared @chunks array will contain 5 elements: + * (([0, 1M), [1, 2], 2), + * ([1M, 2M), [1, 2], 2), + * ([2M, 3M), [1], 1), + * ([3M, 4M], [], 0), + * ([4M, EOF), [2], 1)) + * + * Return: the actual array size of @chunks on success + * or a negative error code on failure. */ -static int fill_hur_item(struct hsm_user_request *hur, unsigned int idx, - const char *mntpath, const char *fname, - dev_t *last_dev) +static inline +int lfs_mirror_prepare_chunk(struct llapi_layout *layout, + struct verify_chunk *chunks, + size_t chunks_size) { - struct hsm_user_item *hui = &hur->hur_user_item[idx]; - int rc; + uint64_t start; + uint64_t end; + uint32_t mirror_id; + uint32_t flags; + int idx = 0; + int i = 0; + int rc = 0; - hui->hui_extent.length = -1; + memset(chunks, 0, sizeof(*chunks) * chunks_size); - if (mntpath != NULL) { - if (*fname == '[') - fname++; - rc = sscanf(fname, SFID, RFID(&hui->hui_fid)); - if (rc == 3) { - rc = 0; - } else { - fprintf(stderr, "hsm: '%s' is not a valid FID\n", - fname); - rc = -EINVAL; + while (1) { + rc = llapi_layout_comp_use(layout, LLAPI_LAYOUT_COMP_USE_FIRST); + if (rc < 0) { + fprintf(stderr, + "%s: move to the first layout component: %s.\n", + progname, strerror(errno)); + goto error; } - } else { - rc = lfs_hsm_prepare_file(fname, &hui->hui_fid, last_dev); - } - if (rc == 0) - hur->hur_request.hr_itemcount++; + i = 0; + rc = 0; + chunks[idx].chunk.e_end = LUSTRE_EOF; + while (rc == 0) { + rc = llapi_layout_comp_extent_get(layout, &start, &end); + if (rc < 0) { + fprintf(stderr, + "%s: llapi_layout_comp_extent_get failed: %s.\n", + progname, strerror(errno)); + goto error; + } + + if (start > chunks[idx].chunk.e_start || + end <= chunks[idx].chunk.e_start) + goto next; + + if (end < chunks[idx].chunk.e_end) + chunks[idx].chunk.e_end = end; - return rc; -} + rc = llapi_layout_comp_flags_get(layout, &flags); + if (rc < 0) { + fprintf(stderr, + "%s: llapi_layout_comp_flags_get failed: %s.\n", + progname, strerror(errno)); + goto error; + } -static int lfs_hsm_request(int argc, char **argv, int action) -{ - struct option long_opts[] = { - { .val = 'a', .name = "archive", .has_arg = required_argument }, - { .val = 'D', .name = "data", .has_arg = required_argument }, - { .val = 'l', .name = "filelist", .has_arg = required_argument }, - { .val = 'm', .name = "mntpath", .has_arg = required_argument }, - { .name = NULL } }; - dev_t last_dev = 0; - char short_opts[] = "l:D:a:m:"; - struct hsm_user_request *hur, *oldhur; - int c, i; - size_t len; - int nbfile; - char *line = NULL; - char *filelist = NULL; - char fullpath[PATH_MAX]; - char *opaque = NULL; - int opaque_len = 0; - int archive_id = 0; - FILE *fp; - int nbfile_alloc = 0; - char *some_file = NULL; - char *mntpath = NULL; - int rc; + if (flags & LCME_FL_STALE || flags & LCME_FL_OFFLINE) + goto next; - if (argc < 2) - return CMD_HELP; + rc = llapi_layout_mirror_id_get(layout, &mirror_id); + if (rc < 0) { + fprintf(stderr, + "%s: llapi_layout_mirror_id_get failed: %s.\n", + progname, strerror(errno)); + goto error; + } - while ((c = getopt_long(argc, argv, short_opts, - long_opts, NULL)) != -1) { - switch (c) { - case 'l': - filelist = optarg; - break; - case 'D': - opaque = optarg; - break; - case 'a': - if (action != HUA_ARCHIVE && - action != HUA_REMOVE) { + chunks[idx].mirror_id[i] = mirror_id; + i++; + if (i >= ARRAY_SIZE(chunks[idx].mirror_id)) { fprintf(stderr, - "error: -a is supported only " - "when archiving or removing\n"); - return CMD_HELP; + "%s: mirror_id array is too small.\n", + progname); + rc = -EINVAL; + goto error; } - archive_id = atoi(optarg); - break; - case 'm': - if (some_file == NULL) { - mntpath = optarg; - some_file = strdup(optarg); + + next: + rc = llapi_layout_comp_use(layout, + LLAPI_LAYOUT_COMP_USE_NEXT); + if (rc < 0) { + fprintf(stderr, + "%s: move to the next layout component: %s.\n", + progname, strerror(errno)); + goto error; } - break; - case '?': - return CMD_HELP; - default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } - } + } /* loop through all components */ - /* All remaining args are files, so we have at least nbfile */ - nbfile = argc - optind; + chunks[idx].mirror_count = i; - if ((nbfile == 0) && (filelist == NULL)) - return CMD_HELP; + if (chunks[idx].chunk.e_end == LUSTRE_EOF) + break; - if (opaque != NULL) - opaque_len = strlen(opaque); + idx++; + if (idx >= chunks_size) { + fprintf(stderr, "%s: chunks array is too small.\n", + progname); + rc = -EINVAL; + goto error; + } - /* Alloc the request structure with enough place to store all files - * from command line. */ - hur = llapi_hsm_user_request_alloc(nbfile, opaque_len); - if (hur == NULL) { - fprintf(stderr, "Cannot create the request: %s\n", - strerror(errno)); - return errno; + chunks[idx].chunk.e_start = chunks[idx - 1].chunk.e_end; } - nbfile_alloc = nbfile; - - hur->hur_request.hr_action = action; - hur->hur_request.hr_archive_id = archive_id; - hur->hur_request.hr_flags = 0; - /* All remaining args are files, add them */ - if (nbfile != 0 && some_file == NULL) - some_file = strdup(argv[optind]); +error: + return rc < 0 ? rc : idx + 1; +} - for (i = 0; i < nbfile; i++) { - rc = fill_hur_item(hur, i, mntpath, argv[optind + i], - &last_dev); - if (rc) - goto out_free; - } +/** + * lfs_mirror_verify_chunk() - Verify a chunk. + * @fd: File descriptor of the mirrored file. + * @file_size: Size of the mirrored file. + * @chunk: A chunk and its corresponding valid mirror ids. + * @verbose: Verbose mode. + * + * This function verifies a @chunk contains exactly the same data + * ammong the mirrors that cover it. + * + * If @verbose is specified, then the function will print where the + * differences are if the data do not match. Otherwise, it will + * just return an error in that case. + * + * Return: 0 on success or a negative error code on failure. + */ +static inline +int lfs_mirror_verify_chunk(int fd, size_t file_size, + struct verify_chunk *chunk, int verbose) +{ + const size_t buflen = 4 * 1024 * 1024; /* 4M */ + void *buf; + size_t page_size = sysconf(_SC_PAGESIZE); + ssize_t bytes_read; + ssize_t bytes_done; + size_t count; + off_t pos; + unsigned long crc; + unsigned long crc_array[LUSTRE_MIRROR_COUNT_MAX] = { 0 }; + int i; + int rc = 0; - /* from here stop using nb_file, use hur->hur_request.hr_itemcount */ + if (file_size == 0) + return 0; - /* If a filelist was specified, read the filelist from it. */ - if (filelist != NULL) { - fp = fopen(filelist, "r"); - if (fp == NULL) { - fprintf(stderr, "Cannot read the file list %s: %s\n", - filelist, strerror(errno)); - rc = -errno; - goto out_free; - } + rc = posix_memalign(&buf, page_size, buflen); + if (rc) /* error code is returned directly */ + return -rc; - while ((rc = getline(&line, &len, fp)) != -1) { - /* If allocated buffer was too small, get something - * larger */ - if (nbfile_alloc <= hur->hur_request.hr_itemcount) { - ssize_t size; + if (verbose > 1) { + fprintf(stdout, "Verifying chunk "DEXT" on mirror:", + PEXT(&chunk->chunk)); + for (i = 0; i < chunk->mirror_count; i++) + fprintf(stdout, " %u", chunk->mirror_id[i]); + fprintf(stdout, "\n"); + } - nbfile_alloc = nbfile_alloc * 2 + 1; - oldhur = hur; - hur = llapi_hsm_user_request_alloc(nbfile_alloc, - opaque_len); - if (hur == NULL) { - fprintf(stderr, "hsm: cannot allocate " - "the request: %s\n", - strerror(errno)); - hur = oldhur; - rc = -errno; - fclose(fp); - goto out_free; - } - size = hur_len(oldhur); - if (size < 0) { - fprintf(stderr, "hsm: cannot allocate " - "%u files + %u bytes data\n", - oldhur->hur_request.hr_itemcount, - oldhur->hur_request.hr_data_len); - free(hur); - hur = oldhur; - rc = -E2BIG; - fclose(fp); - goto out_free; - } - memcpy(hur, oldhur, size); - free(oldhur); + bytes_done = 0; + count = MIN(chunk->chunk.e_end, file_size) - chunk->chunk.e_start; + pos = chunk->chunk.e_start; + while (bytes_done < count) { + /* compute initial CRC-32 checksum */ + crc = crc32(0L, Z_NULL, 0); + memset(crc_array, 0, sizeof(crc_array)); + + bytes_read = 0; + for (i = 0; i < chunk->mirror_count; i++) { + bytes_read = llapi_mirror_read(fd, chunk->mirror_id[i], + buf, buflen, pos); + if (bytes_read < 0) { + rc = bytes_read; + fprintf(stderr, + "%s: failed to read data from mirror %u: %s.\n", + progname, chunk->mirror_id[i], + strerror(-rc)); + goto error; } - /* Chop CR */ - if (line[strlen(line) - 1] == '\n') - line[strlen(line) - 1] = '\0'; + /* compute new CRC-32 checksum */ + crc_array[i] = crc32(crc, buf, bytes_read); + } - rc = fill_hur_item(hur, hur->hur_request.hr_itemcount, - mntpath, line, &last_dev); - if (rc) { - fclose(fp); - goto out_free; - } + if (verbose) + print_checksums(chunk, crc_array); - if (some_file == NULL) { - some_file = line; - line = NULL; + /* compare CRC-32 checksum values */ + for (i = 1; i < chunk->mirror_count; i++) { + if (crc_array[i] != crc_array[0]) { + rc = -EINVAL; + if (!verbose) + goto error; + + fprintf(stderr, + "%s: chunk "DEXT" has different checksum value on mirror %u and mirror %u.\n", + progname, PEXT(&chunk->chunk), + chunk->mirror_id[0], + chunk->mirror_id[i]); } } - rc = fclose(fp); - free(line); + pos += bytes_read; + bytes_done += bytes_read; } - /* If a --data was used, add it to the request */ - hur->hur_request.hr_data_len = opaque_len; - if (opaque != NULL) - memcpy(hur_data(hur), opaque, opaque_len); - - /* Send the HSM request */ - if (realpath(some_file, fullpath) == NULL) { - fprintf(stderr, "Could not find path '%s': %s\n", - some_file, strerror(errno)); - } - rc = llapi_hsm_request(fullpath, hur); - if (rc) { - fprintf(stderr, "Cannot send HSM request (use of %s): %s\n", - some_file, strerror(-rc)); - goto out_free; + if (verbose > 1 && rc == 0) { + fprintf(stdout, "Verifying chunk "DEXT" on mirror:", + PEXT(&chunk->chunk)); + for (i = 0; i < chunk->mirror_count; i++) + fprintf(stdout, " %u", chunk->mirror_id[i]); + fprintf(stdout, " PASS\n\n"); } -out_free: - free(some_file); - free(hur); +error: + free(buf); return rc; } -static int lfs_hsm_archive(int argc, char **argv) -{ - return lfs_hsm_request(argc, argv, HUA_ARCHIVE); -} - -static int lfs_hsm_restore(int argc, char **argv) -{ - return lfs_hsm_request(argc, argv, HUA_RESTORE); -} - -static int lfs_hsm_release(int argc, char **argv) +/** + * lfs_mirror_verify_file() - Verify a mirrored file. + * @fname: Mirrored file name. + * @mirror_ids: Specified mirror ids to be verified. + * @ids_nr: Number of specified mirror ids. + * @verbose: Verbose mode. + * + * This function verifies that each SYNC mirror of a mirrored file + * specified by @fname contains exactly the same data. + * + * If @mirror_ids is specified, then the function will verify the + * mirrors specified by @mirror_ids contain exactly the same data. + * + * If @verbose is specified, then the function will print where the + * differences are if the data do not match. Otherwise, it will + * just return an error in that case. + * + * Return: 0 on success or a negative error code on failure. + */ +static inline +int lfs_mirror_verify_file(const char *fname, __u16 *mirror_ids, int ids_nr, + int verbose) { - return lfs_hsm_request(argc, argv, HUA_RELEASE); -} + struct verify_chunk chunks_array[1024] = { }; + struct llapi_layout *layout = NULL; + struct stat stbuf; + uint32_t flr_state; + int fd; + int chunk_count = 0; + int idx = 0; + int rc = 0; + int rc1 = 0; + int rc2 = 0; -static int lfs_hsm_remove(int argc, char **argv) -{ - return lfs_hsm_request(argc, argv, HUA_REMOVE); -} + if (stat(fname, &stbuf) < 0) { + fprintf(stderr, "%s: cannot stat file '%s': %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto error; + } -static int lfs_hsm_cancel(int argc, char **argv) -{ - return lfs_hsm_request(argc, argv, HUA_CANCEL); -} + if (!S_ISREG(stbuf.st_mode)) { + fprintf(stderr, "%s: '%s' is not a regular file.\n", + progname, fname); + rc = -EINVAL; + goto error; + } -static int lfs_swap_layouts(int argc, char **argv) -{ - if (argc != 3) - return CMD_HELP; + if (stbuf.st_size == 0) { + if (verbose) + fprintf(stdout, "%s: '%s' file size is 0.\n", + progname, fname); + rc = 0; + goto error; + } - return llapi_swap_layouts(argv[1], argv[2], 0, 0, - SWAP_LAYOUTS_KEEP_MTIME | - SWAP_LAYOUTS_KEEP_ATIME); -} + fd = open(fname, O_DIRECT | O_RDONLY); + if (fd < 0) { + fprintf(stderr, "%s: cannot open '%s': %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto error; + } -static const char *const ladvise_names[] = LU_LADVISE_NAMES; + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); + if (rc < 0) { + fprintf(stderr, "%s: '%s' llapi_lease_acquire failed: %s.\n", + progname, fname, strerror(errno)); + goto close_fd; + } -static const char *const lock_mode_names[] = LOCK_MODE_NAMES; + layout = llapi_layout_get_by_fd(fd, 0); + if (layout == NULL) { + fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + llapi_lease_release(fd); + goto close_fd; + } -static const char *const lockahead_results[] = { - [LLA_RESULT_SENT] = "Lock request sent", - [LLA_RESULT_DIFFERENT] = "Different matching lock found", - [LLA_RESULT_SAME] = "Matching lock on identical extent found", -}; + rc = llapi_layout_flags_get(layout, &flr_state); + if (rc < 0) { + fprintf(stderr, "%s: '%s' llapi_layout_flags_get failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto free_layout; + } -int lfs_get_mode(const char *string) -{ - enum lock_mode_user mode; + flr_state &= LCM_FL_FLR_MASK; + switch (flr_state) { + case LCM_FL_NONE: + rc = -EINVAL; + fprintf(stderr, "%s: '%s' file state error: %s.\n", + progname, fname, llapi_layout_flags_string(flr_state)); + goto free_layout; + default: + break; + } - for (mode = 0; mode < ARRAY_SIZE(lock_mode_names); mode++) { - if (lock_mode_names[mode] == NULL) - continue; - if (strcmp(string, lock_mode_names[mode]) == 0) - return mode; + /* find out mirror chunks to be verified */ + chunk_count = lfs_mirror_prepare_chunk(layout, chunks_array, + ARRAY_SIZE(chunks_array)); + if (chunk_count < 0) { + rc = chunk_count; + goto free_layout; } - return -EINVAL; -} + if (ids_nr > 0) + /* filter specified mirror ids */ + filter_mirror_id(chunks_array, chunk_count, mirror_ids, ids_nr); + + if (verbose > 2) + print_chunks(fname, chunks_array, chunk_count); + + for (idx = 0; idx < chunk_count; idx++) { + if (chunks_array[idx].chunk.e_start >= stbuf.st_size) { + if (verbose) + fprintf(stdout, + "%s: '%s' chunk "DEXT" exceeds file size %#llx: skipped\n", + progname, fname, + PEXT(&chunks_array[idx].chunk), + (unsigned long long)stbuf.st_size); + break; + } -static enum lu_ladvise_type lfs_get_ladvice(const char *string) -{ - enum lu_ladvise_type advice; + if (chunks_array[idx].mirror_count == 0) { + fprintf(stderr, + "%s: '%s' chunk "DEXT" is invalid in all of the mirrors: ", + progname, fname, + PEXT(&chunks_array[idx].chunk)); + if (verbose) { + fprintf(stderr, "skipped\n"); + continue; + } + rc = -EINVAL; + fprintf(stderr, "failed\n"); + goto free_layout; + } - for (advice = 0; - advice < ARRAY_SIZE(ladvise_names); advice++) { - if (ladvise_names[advice] == NULL) + if (chunks_array[idx].mirror_count == 1) { + if (verbose) + fprintf(stdout, + "%s: '%s' chunk "DEXT" is only valid in mirror %u: skipped\n", + progname, fname, + PEXT(&chunks_array[idx].chunk), + chunks_array[idx].mirror_id[0]); continue; - if (strcmp(string, ladvise_names[advice]) == 0) - return advice; + } + + rc = llapi_lease_check(fd); + if (rc != LL_LEASE_RDLCK) { + fprintf(stderr, "%s: '%s' lost lease lock.\n", + progname, fname); + goto free_layout; + } + + /* verify one chunk */ + rc1 = lfs_mirror_verify_chunk(fd, stbuf.st_size, + &chunks_array[idx], verbose); + if (rc1 < 0) { + rc2 = rc1; + if (!verbose) { + rc = rc1; + goto free_layout; + } + } } - return LU_LADVISE_INVALID; + if (rc2 < 0) + rc = rc2; + +free_layout: + llapi_layout_free(layout); + llapi_lease_release(fd); +close_fd: + close(fd); +error: + return rc; } -static int lfs_ladvise(int argc, char **argv) +/** + * lfs_mirror_verify() - Parse and execute lfs mirror verify command. + * @argc: The count of lfs mirror verify command line arguments. + * @argv: Array of strings for lfs mirror verify command line arguments. + * + * This function parses lfs mirror verify command and verifies the + * specified mirrored file(s). + * + * Return: 0 on success or a negative error code on failure. + */ +static inline int lfs_mirror_verify(int argc, char **argv) { + __u16 mirror_ids[LUSTRE_MIRROR_COUNT_MAX] = { 0 }; + int ids_nr = 0; + int c; + int verbose = 0; + int rc = 0; + int rc1 = 0; + char cmd[PATH_MAX]; + struct option long_opts[] = { - { .val = 'a', .name = "advice", .has_arg = required_argument }, - { .val = 'b', .name = "background", .has_arg = no_argument }, - { .val = 'e', .name = "end", .has_arg = required_argument }, - { .val = 'l', .name = "length", .has_arg = required_argument }, - { .val = 'm', .name = "mode", .has_arg = required_argument }, - { .val = 's', .name = "start", .has_arg = required_argument }, - { .val = 'u', .name = "unset", .has_arg = no_argument }, + { .val = 'o', .name = "only", .has_arg = required_argument }, + { .val = 'v', .name = "verbose", .has_arg = no_argument }, { .name = NULL } }; - char short_opts[] = "a:be:l:m:s:u"; - int c; - int rc = 0; - const char *path; - int fd; - struct llapi_lu_ladvise advice; - enum lu_ladvise_type advice_type = LU_LADVISE_INVALID; - unsigned long long start = 0; - unsigned long long end = LUSTRE_EOF; - unsigned long long length = 0; - unsigned long long size_units; - unsigned long long flags = 0; - int mode = 0; - optind = 0; - while ((c = getopt_long(argc, argv, short_opts, - long_opts, NULL)) != -1) { + snprintf(cmd, sizeof(cmd), "%s %s", progname, argv[0]); + progname = cmd; + while ((c = getopt_long(argc, argv, "o:v", long_opts, NULL)) >= 0) { switch (c) { - case 'a': - advice_type = lfs_get_ladvice(optarg); - if (advice_type == LU_LADVISE_INVALID) { - fprintf(stderr, "%s: invalid advice type " - "'%s'\n", argv[0], optarg); - fprintf(stderr, "Valid types:"); - - for (advice_type = 0; - advice_type < ARRAY_SIZE(ladvise_names); - advice_type++) { - if (ladvise_names[advice_type] == NULL) - continue; - fprintf(stderr, " %s", - ladvise_names[advice_type]); - } - fprintf(stderr, "\n"); - - return CMD_HELP; - } - break; - case 'b': - flags |= LF_ASYNC; - break; - case 'u': - flags |= LF_UNSET; - break; - case 'e': - size_units = 1; - rc = llapi_parse_size(optarg, &end, - &size_units, 0); - if (rc) { - fprintf(stderr, "%s: bad end offset '%s'\n", - argv[0], optarg); - return CMD_HELP; - } - break; - case 's': - size_units = 1; - rc = llapi_parse_size(optarg, &start, - &size_units, 0); - if (rc) { - fprintf(stderr, "%s: bad start offset " - "'%s'\n", argv[0], optarg); - return CMD_HELP; + case 'o': + rc = parse_mirror_ids(mirror_ids, + ARRAY_SIZE(mirror_ids), + optarg); + if (rc < 0) { + fprintf(stderr, + "%s: bad mirror ids '%s'.\n", + progname, optarg); + goto error; } - break; - case 'l': - size_units = 1; - rc = llapi_parse_size(optarg, &length, - &size_units, 0); - if (rc) { - fprintf(stderr, "%s: bad length '%s'\n", - argv[0], optarg); - return CMD_HELP; + ids_nr = rc; + if (ids_nr < 2) { + fprintf(stderr, + "%s: at least 2 mirror ids needed with '--only' option.\n", + progname); + rc = CMD_HELP; + goto error; } break; - case 'm': - mode = lfs_get_mode(optarg); - if (mode < 0) { - fprintf(stderr, "%s: bad mode '%s', valid " - "modes are READ or WRITE\n", - argv[0], optarg); - return CMD_HELP; - } + case 'v': + verbose++; break; - case '?': - return CMD_HELP; default: - fprintf(stderr, "%s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } - } - - if (advice_type == LU_LADVISE_INVALID) { - fprintf(stderr, "%s: please give an advice type\n", argv[0]); - fprintf(stderr, "Valid types:"); - for (advice_type = 0; advice_type < ARRAY_SIZE(ladvise_names); - advice_type++) { - if (ladvise_names[advice_type] == NULL) - continue; - fprintf(stderr, " %s", ladvise_names[advice_type]); + fprintf(stderr, "%s: options '%s' unrecognized.\n", + progname, argv[optind - 1]); + rc = -EINVAL; + goto error; } - fprintf(stderr, "\n"); - return CMD_HELP; } - if (advice_type == LU_LADVISE_LOCKNOEXPAND) { - fprintf(stderr, "%s: Lock no expand advice is a per file " - "descriptor advice, so when called from lfs, " - "it does nothing.\n", argv[0]); - return CMD_HELP; + if (argc == optind) { + fprintf(stderr, "%s: no file name given.\n", progname); + rc = CMD_HELP; + goto error; } - if (argc <= optind) { - fprintf(stderr, "%s: please give one or more file names\n", - argv[0]); - return CMD_HELP; - } + if (ids_nr > 0 && argc > optind + 1) { + fprintf(stderr, + "%s: '--only' cannot be used upon multiple files.\n", + progname); + rc = CMD_HELP; + goto error; - if (end != LUSTRE_EOF && length != 0 && end != start + length) { - fprintf(stderr, "%s: conflicting arguments of -l and -e\n", - argv[0]); - return CMD_HELP; } - if (end == LUSTRE_EOF && length != 0) - end = start + length; - - if (end <= start) { - fprintf(stderr, "%s: range [%llu, %llu] is invalid\n", - argv[0], start, end); - return CMD_HELP; + if (ids_nr > 0) { + rc = verify_mirror_ids(argv[optind], mirror_ids, ids_nr); + if (rc < 0) + goto error; } - if (advice_type != LU_LADVISE_LOCKAHEAD && mode != 0) { - fprintf(stderr, "%s: mode is only valid with lockahead\n", - argv[0]); - return CMD_HELP; + rc = 0; + for (; optind < argc; optind++) { + rc1 = lfs_mirror_verify_file(argv[optind], mirror_ids, ids_nr, + verbose); + if (rc1 < 0) + rc = rc1; } +error: + return rc; +} - if (advice_type == LU_LADVISE_LOCKAHEAD && mode == 0) { - fprintf(stderr, "%s: mode is required with lockahead\n", - argv[0]); - return CMD_HELP; - } +/** + * lfs_mirror() - Parse and execute lfs mirror commands. + * @argc: The count of lfs mirror command line arguments. + * @argv: Array of strings for lfs mirror command line arguments. + * + * This function parses lfs mirror commands and performs the + * corresponding functions specified in mirror_cmdlist[]. + * + * Return: 0 on success or an error code on failure. + */ +static int lfs_mirror(int argc, char **argv) +{ + char cmd[PATH_MAX]; + int rc = 0; - while (optind < argc) { - int rc2; + setlinebuf(stdout); - path = argv[optind++]; + Parser_init("lfs-mirror > ", mirror_cmdlist); - fd = open(path, O_RDONLY); - if (fd < 0) { - fprintf(stderr, "%s: cannot open file '%s': %s\n", - argv[0], path, strerror(errno)); - rc2 = -errno; - goto next; - } + snprintf(cmd, sizeof(cmd), "%s %s", progname, argv[0]); + progname = cmd; + program_invocation_short_name = cmd; + if (argc > 1) + rc = Parser_execarg(argc - 1, argv + 1, mirror_cmdlist); + else + rc = Parser_commands(); - advice.lla_start = start; - advice.lla_end = end; - advice.lla_advice = advice_type; - advice.lla_value1 = 0; - advice.lla_value2 = 0; - advice.lla_value3 = 0; - advice.lla_value4 = 0; - if (advice_type == LU_LADVISE_LOCKAHEAD) { - advice.lla_lockahead_mode = mode; - advice.lla_peradvice_flags = flags; - } + return rc < 0 ? -rc : rc; +} - rc2 = llapi_ladvise(fd, flags, 1, &advice); - close(fd); - if (rc2 < 0) { - fprintf(stderr, "%s: cannot give advice '%s' to file " - "'%s': %s\n", argv[0], - ladvise_names[advice_type], - path, strerror(errno)); +/** + * lfs_mirror_list_commands() - List lfs mirror commands. + * @argc: The count of command line arguments. + * @argv: Array of strings for command line arguments. + * + * This function lists lfs mirror commands defined in mirror_cmdlist[]. + * + * Return: 0 on success. + */ +static int lfs_mirror_list_commands(int argc, char **argv) +{ + char buffer[81] = ""; - goto next; - } + Parser_list_commands(mirror_cmdlist, buffer, sizeof(buffer), + NULL, 0, 4); -next: - if (rc == 0 && rc2 < 0) - rc = rc2; - } - return rc; + return 0; } static int lfs_list_commands(int argc, char **argv) @@ -5537,24 +8764,27 @@ static int lfs_list_commands(int argc, char **argv) int main(int argc, char **argv) { - int rc; + int rc; /* Ensure that liblustreapi constructor has run */ - if (!liblustreapi_initialized) + if (!llapi_liblustreapi_initialized()) fprintf(stderr, "liblustreapi was not properly initialized\n"); - setlinebuf(stdout); + setlinebuf(stdout); + opterr = 0; Parser_init("lfs > ", cmdlist); - progname = argv[0]; /* Used in error messages */ - if (argc > 1) { - rc = Parser_execarg(argc - 1, argv + 1, cmdlist); - } else { - rc = Parser_commands(); - } + progname = program_invocation_short_name; /* Used in error messages */ + if (argc > 1) { + llapi_set_command_name(argv[1]); + rc = Parser_execarg(argc - 1, argv + 1, cmdlist); + llapi_clear_command_name(); + } else { + rc = Parser_commands(); + } - return rc < 0 ? -rc : rc; + return rc < 0 ? -rc : rc; } #ifdef _LUSTRE_IDL_H_