X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Futils%2Flfs.c;h=0ae49c397c0d4f4914d945751efe3236dd926f3c;hp=f247dd13cf4ae1ffdd0e2ad3c41edddaad175ecd;hb=1e7158d15ed8adad0e8d94cb61bf889c0adcd825;hpb=23b2d47818996a825ab8eadd64ce29089b3d114b diff --git a/lustre/utils/lfs.c b/lustre/utils/lfs.c index f247dd1..0ae49c3 100644 --- a/lustre/utils/lfs.c +++ b/lustre/utils/lfs.c @@ -58,11 +58,14 @@ #include #include #include +#include #include #include #include #include #include +#include +#include #include "lfs_project.h" #include @@ -72,6 +75,7 @@ #include #include #include +#include #ifndef ARRAY_SIZE # define ARRAY_SIZE(a) ((sizeof(a)) / (sizeof((a)[0]))) @@ -114,15 +118,19 @@ static int lfs_hsm_cancel(int argc, char **argv); static int lfs_swap_layouts(int argc, char **argv); static int lfs_mv(int argc, char **argv); static int lfs_ladvise(int argc, char **argv); +static int lfs_getsom(int argc, char **argv); static int lfs_mirror(int argc, char **argv); static int lfs_mirror_list_commands(int argc, char **argv); static int lfs_list_commands(int argc, char **argv); static inline int lfs_mirror_resync(int argc, char **argv); static inline int lfs_mirror_verify(int argc, char **argv); +static inline int lfs_mirror_read(int argc, char **argv); +static inline int lfs_mirror_write(int argc, char **argv); enum setstripe_origin { SO_SETSTRIPE, SO_MIGRATE, + SO_MIGRATE_MDT, SO_MIRROR_CREATE, SO_MIRROR_EXTEND, SO_MIRROR_SPLIT, @@ -157,9 +165,11 @@ static inline int lfs_mirror_split(int argc, char **argv) " [--stripe-count|-c ]\n" \ " [--stripe-index|-i ]\n" \ " [--stripe-size|-S ]\n" \ - " [--layout|-L ]\n" \ + " [--layout|-L ]\n" \ " [--pool|-p ]\n" \ - " [--ost|-o ]\n" + " [--ost|-o ]\n" \ + " [--yaml|-y ]\n" \ + " [--copy=]\n" #define SSM_HELP_COMMON \ "\tstripe_count: Number of OSTs to stripe over (0=fs default, -1 all)\n" \ @@ -179,7 +189,13 @@ static inline int lfs_mirror_split(int argc, char **argv) "\tcomp_end: Extent end of component, start after previous end.\n"\ "\t Can be specified with K, M or G (for KB, MB, GB\n" \ "\t respectively, -1 for EOF). Must be a multiple of\n"\ - "\t stripe_size.\n" + "\t stripe_size.\n" \ + "\tyaml_template_file:\n" \ + "\t YAML layout template file, can't be used with -c,\n" \ + "\t -i, -S, -p, -o, or -E arguments.\n" \ + "\tlustre_src: Lustre file/dir whose layout info is used to set\n" \ + "\t another lustre file or directory, can't used with\n" \ + "\t -c, -i, -S, -p, -o, or -E arguments.\n" #define MIRROR_CREATE_HELP \ "\tmirror_count: Number of mirrors to be created with the upcoming\n" \ @@ -192,7 +208,6 @@ static inline int lfs_mirror_split(int argc, char **argv) "\t It can be a plain layout or a composite layout.\n" \ "\t If not specified, the stripe options inherited\n" \ "\t from the previous component will be used.\n" \ - "\tparent: Use default stripe options from parent directory\n" \ "\tflags: set flags to the component of the current mirror.\n" \ "\t Only \"prefer\" flag is supported so far.\n" @@ -207,7 +222,7 @@ static inline int lfs_mirror_split(int argc, char **argv) #define MIRROR_EXTEND_USAGE \ " <--mirror-count|-N[mirror_count]>\n" \ - " [setstripe options|--parent|-f ]\n" \ + " [setstripe options|-f ]\n" \ " [--no-verify]\n" #define SETSTRIPE_USAGE \ @@ -219,26 +234,28 @@ static inline int lfs_mirror_split(int argc, char **argv) #define MIGRATE_USAGE \ SSM_CMD_COMMON("migrate ") \ - " [--block|-b]\n" \ - " [--non-block|-n]\n" \ + " [--block|-b] [--non-block|-n]\n" \ + " [--non-direct|-D] [--verbose|-v]\n" \ " \n" \ SSM_HELP_COMMON \ "\n" \ "\tblock: Block file access during data migration (default)\n" \ "\tnon-block: Abort migrations if concurrent access is detected\n" \ - -#define SETDIRSTRIPE_USAGE \ - " [--mdt-count|-c stripe_count>\n" \ - " [--mdt-index|-i mdt_index]\n" \ - " [--mdt-hash|-H mdt_hash]\n" \ - " [--default|-D] [--mode|-m mode] \n" \ + "\tnon-direct: Do not use direct I/O to copy file contents\n" \ + "\tverbose: Print each filename as it is migrated\n" \ + +#define SETDIRSTRIPE_USAGE \ + " [--mdt-count|-c stripe_count>\n" \ + " [--mdt-hash|-H mdt_hash]\n" \ + " [--mdt-index|-i mdt_index[,mdt_index,...]\n" \ + " [--default|-D] [--mode|-o mode] \n" \ "\tstripe_count: stripe count of the striped directory\n" \ "\tmdt_index: MDT index of first stripe\n" \ "\tmdt_hash: hash type of the striped directory. mdt types:\n" \ " fnv_1a_64 FNV-1a hash algorithm (default)\n" \ " all_char sum of characters % MDT_COUNT (not recommended)\n" \ "\tdefault_stripe: set default dirstripe of the directory\n" \ - "\tmode: the mode of the directory\n" + "\tmode: the file access permission of the directory (octal)\n" /** * command_t mirror_cmdlist - lfs mirror commands. @@ -248,24 +265,34 @@ command_t mirror_cmdlist[] = { .pc_help = "Create a mirrored file.\n" "usage: lfs mirror create " "<--mirror-count|-N[mirror_count]> " - "[setstripe options|--parent] ... \n" + "[setstripe options] ... \n" MIRROR_CREATE_HELP }, { .pc_name = "extend", .pc_func = lfs_mirror_extend, .pc_help = "Extend a mirrored file.\n" "usage: lfs mirror extend " "<--mirror-count|-N[mirror_count]> [--no-verify] " - "[setstripe options|--parent|-f ] ... \n" + "[setstripe options|-f ] ... \n" MIRROR_EXTEND_HELP }, { .pc_name = "split", .pc_func = lfs_mirror_split, .pc_help = "Split a mirrored file.\n" - "usage: lfs mirror split <--mirror-id > [--destroy|-d] " - "[-f ] \n" - "\tmirror_id: The numerical unique identifier for a mirror. It\n" - "\t can be fetched by lfs getstripe command.\n" - "\tnew_file: This option indicates the layout of the split\n" - "\t mirror will be stored into. If not specified,\n" - "\t a new file named .mirror~\n" - "\t will be used.\n" }, + "usage: lfs mirror split <--mirror-id | \n" + "\t <--component-id|-I > [--destroy|-d] \n" + "\t [-f ] \n" + "\tmirror_id: The numerical unique identifier for a mirror. It\n" + "\t can be fetched by lfs getstripe command.\n" + "\tcomp_id: Unique component ID within a mirror.\n" + "\tnew_file: This option indicates the layout of the split\n" + "\t mirror will be stored into. If not specified,\n" + "\t a new file named .mirror~\n" + "\t will be used.\n" }, + { .pc_name = "read", .pc_func = lfs_mirror_read, + .pc_help = "Read the content of a specified mirror of a file.\n" + "usage: lfs mirror read <--mirror-id|-N " + "[--outfile|-o ] \n" }, + { .pc_name = "write", .pc_func = lfs_mirror_write, + .pc_help = "Write to a specified mirror of a file.\n" + "usage: lfs mirror write <--mirror-id|-N " + "[--inputfile|-i ] \n" }, { .pc_name = "resync", .pc_func = lfs_mirror_resync, .pc_help = "Resynchronizes out-of-sync mirrored file(s).\n" "usage: lfs mirror resync [--only ] " @@ -275,7 +302,7 @@ command_t mirror_cmdlist[] = { "usage: lfs mirror verify " "[--only ] " "[--verbose|-v] [ ...]\n"}, - { .pc_name = "--list-commands", .pc_func = lfs_mirror_list_commands, + { .pc_name = "list-commands", .pc_func = lfs_mirror_list_commands, .pc_help = "list commands supported by lfs mirror"}, { .pc_name = "help", .pc_func = Parser_help, .pc_help = "help" }, { .pc_name = "exit", .pc_func = Parser_quit, .pc_help = "quit" }, @@ -297,6 +324,9 @@ command_t cmdlist[] = { "To totally delete the default striping from an existing directory:\n" "usage: setstripe -d \n" " or\n" + "To create a mirrored file or set s default mirror layout on a directory:\n" + "usage: setstripe -N[mirror_count] [STRIPE_OPTIONS] \n" + " or\n" "To delete the last component(s) from an existing composite file\n" "(note that this will also delete any data in those components):\n" "usage: setstripe --component-del [--component-id|-I ]\n" @@ -319,6 +349,8 @@ command_t cmdlist[] = { " [--component-count]\n" " [--component-start[=[+-]comp_start]]\n" " [--component-end[=[+-]comp_end]|-E[[+-]comp_end]]\n" + " [[!] --mirror-index=[+-] |\n" + " [!] --mirror-id=[+-]]\n" " ..."}, {"setdirstripe", lfs_setdirstripe, 0, "To create a striped directory on a specified MDT. This can only\n" @@ -350,8 +382,7 @@ command_t cmdlist[] = { "find files matching given attributes recursively in directory tree.\n" "usage: find ...\n" " [[!] --atime|-A [+-]N] [[!] --ctime|-C [+-]N]\n" - " [[!] --mtime|-M [+-]N] [--maxdepth|-D N]\n" - " [[!] --mdt-index|--mdt|-m ]\n" + " [[!] --mtime|-M [+-]N] [--maxdepth|-D N] [[!] --blocks|-b N]\n" " [[!] --name|-n ] [[!] --ost|-O ]\n" " [--print|-P] [--print0|-0] [[!] --size|-s [+-]N[bkMGTPE]]\n" " [[!] --stripe-count|-c [+-]]\n" @@ -365,8 +396,11 @@ command_t cmdlist[] = { " [[!] --component-start [+-]N[kMGTPE]]\n" " [[!] --component-end|-E [+-]N[kMGTPE]]\n" " [[!] --component-flags ]\n" + " [[!] --mirror-count|-N [+-]]\n" + " [[!] --mirror-state <[^]state>]\n" " [[!] --mdt-count|-T [+-]]\n" " [[!] --mdt-hash|-H \n" + " [[!] --mdt-index|-m ]\n" "\t !: used before an option indicates 'NOT' requested attribute\n" "\t -: used before a value indicates less than requested value\n" "\t +: used before a value indicates more than requested value\n" @@ -374,9 +408,9 @@ command_t cmdlist[] = { "\t fnv_1a_64 FNV-1a hash algorithm\n" "\t all_char sum of characters % MDT_COUNT\n"}, {"check", lfs_check, 0, - "Display the status of MDS or OSTs (as specified in the command)\n" - "or all the servers (MDS and OSTs).\n" - "usage: check "}, + "Display the status of MGTs, MDTs or OSTs (as specified in the command)\n" + "or all the servers (MGTs, MDTs and OSTs).\n" + "usage: check "}, {"osts", lfs_osts, 0, "list OSTs connected to client " "[for specified path only]\n" "usage: osts [path]"}, {"mdts", lfs_mdts, 0, "list MDTs connected to client " @@ -401,13 +435,25 @@ command_t cmdlist[] = { " setquota [-t] <-u|--user|-g|--group|-p|--projid>\n" " [--block-grace ]\n" " [--inode-grace ] \n" + " setquota <-U|-G|-P>\n" + " -b -B \n" + " -i -I \n" + " setquota <-U|--default-usr|-G|--default-grp|-P|--default-prj>\n" + " [--block-softlimit ]\n" + " [--block-hardlimit ]\n" + " [--inode-softlimit ]\n" + " [--inode-hardlimit ] \n" + " setquota <-u|-g|-p> ||||\n" + " <-d|--default>\n" " -b can be used instead of --block-softlimit/--block-grace\n" " -B can be used instead of --block-hardlimit\n" " -i can be used instead of --inode-softlimit/--inode-grace\n" - " -I can be used instead of --inode-hardlimit\n\n" + " -I can be used instead of --inode-hardlimit\n" + " -d can be used instead of --default\n\n" "Note: The total quota space will be split into many qunits and\n" " balanced over all server targets, the minimal qunit size is\n" " 1M bytes for block space and 1K inodes for inode space.\n\n" + " The maximum quota grace time is 2^48 - 1 seconds.\n\n" " Quota space rebalancing process will stop when this mininum\n" " value is reached. As a result, quota exceeded can be returned\n" " while many targets still have 1MB or 1K inodes of spare\n" @@ -416,7 +462,8 @@ command_t cmdlist[] = { "usage: quota [-q] [-v] [-h] [-o |-i |-I " "]\n" " [<-u|-g|-p> ||||] \n" - " quota [-o |-i |-I ] -t <-u|-g|-p> "}, + " quota [-o |-i |-I ] -t <-u|-g|-p> \n" + " quota [-q] [-v] [h] <-U|-G|-P> "}, {"project", lfs_project, 0, "Change or list project attribute for specified file or directory.\n" "usage: project [-d|-r] \n" @@ -494,9 +541,17 @@ command_t cmdlist[] = { "usage: swap_layouts "}, {"migrate", lfs_setstripe_migrate, 0, "migrate a directory between MDTs.\n" - "usage: migrate --mdt-index [--verbose|-v] " - "\n" - "\tmdt_idx: index of the destination MDT\n" + "usage: migrate [--mdt-count|-c] \n" + " [--mdt-hash|-H] \n" + " [--mdt-index|-m] \n" + " [--verbose|-v]\n" + " \n" + "\tmdt: MDTs to stripe over, if only one MDT is specified\n" + " it's the MDT index of first stripe\n" + "\tmdt_count: number of MDTs to stripe a directory over\n" + "\tmdt_hash: hash type of the striped directory. mdt types:\n" + " fnv_1a_64 FNV-1a hash algorithm (default)\n" + " all_char sum of characters % MDT_COUNT\n" "\n" "migrate file objects from one OST " "layout\nto another (may be not safe with concurent writes).\n" @@ -508,14 +563,16 @@ command_t cmdlist[] = { " [--ost|-o] \n" " [--block|-b]\n" " [--non-block|-n]\n" + " [--non-direct|-D]\n" " \n" "\tstripe_count: number of OSTs to stripe a file over\n" "\tstripe_ost_index: index of the first OST to stripe a file over\n" "\tstripe_size: number of bytes to store before moving to the next OST\n" "\tpool_name: name of the predefined pool of OSTs\n" "\tost_indices: OSTs to stripe over, in order\n" - "\tblock: wait for the operation to return before continuing\n" - "\tnon-block: do not wait for the operation to return.\n"}, + "\tblock: Block file access during data migration (default)\n" + "\tnon-block: Abort migrations if concurrent access is detected\n" + "\tnon-direct: do not use direct I/O to copy file contents.\n"}, {"mv", lfs_mv, 0, "To move directories between MDTs. This command is deprecated, " "use \"migrate\" instead.\n" @@ -534,7 +591,14 @@ command_t cmdlist[] = { "lfs mirror extend - add mirror(s) to an existing file\n" "lfs mirror split - split a mirror from an existing mirrored file\n" "lfs mirror resync - resynchronize out-of-sync mirrored file(s)\n" + "lfs mirror read - read a mirror content of a mirrored file\n" + "lfs mirror write - write to a mirror of a mirrored file\n" "lfs mirror verify - verify mirrored file(s)\n"}, + {"getsom", lfs_getsom, 0, "To list the SOM info for a given file.\n" + "usage: getsom [-s] [-b] [-f] \n" + "\t-s: Only show the size value of the SOM data for a given file\n" + "\t-b: Only show the blocks value of the SOM data for a given file\n" + "\t-f: Only show the flags value of the SOM data for a given file\n"}, {"help", Parser_help, 0, "help"}, {"exit", Parser_quit, 0, "quit"}, {"quit", Parser_quit, 0, "quit"}, @@ -561,19 +625,23 @@ static int check_hashtype(const char *hashtype) static const char *error_loc = "syserror"; enum { - MIGRATION_NONBLOCK = 1 << 0, - MIGRATION_MIRROR = 1 << 1, + MIGRATION_NONBLOCK = 0x0001, + MIGRATION_MIRROR = 0x0002, + MIGRATION_NONDIRECT = 0x0004, + MIGRATION_VERBOSE = 0x0008, }; static int lfs_component_create(char *fname, int open_flags, mode_t open_mode, struct llapi_layout *layout); static int -migrate_open_files(const char *name, const struct llapi_stripe_param *param, +migrate_open_files(const char *name, __u64 migration_flags, + const struct llapi_stripe_param *param, struct llapi_layout *layout, int *fd_src, int *fd_tgt) { int fd = -1; int fdv = -1; + int rflags; int mdt_index; int random_value; char parent[PATH_MAX]; @@ -610,7 +678,10 @@ migrate_open_files(const char *name, const struct llapi_stripe_param *param, /* open file, direct io */ /* even if the file is only read, WR mode is nedeed to allow * layout swap on fd */ - fd = open(name, O_RDWR | O_DIRECT); + rflags = O_RDWR; + if (!(migration_flags & MIGRATION_NONDIRECT)) + rflags |= O_DIRECT; + fd = open(name, rflags); if (fd < 0) { rc = -errno; error_loc = "cannot open source file"; @@ -1014,7 +1085,8 @@ static int lfs_migrate(char *name, __u64 migration_flags, int fdv = -1; int rc; - rc = migrate_open_files(name, param, layout, &fd, &fdv); + rc = migrate_open_files(name, migration_flags, param, layout, + &fd, &fdv); if (rc < 0) goto out; @@ -1058,6 +1130,9 @@ out: if (rc < 0) fprintf(stderr, "error: %s: %s: %s: %s\n", progname, name, error_loc, strerror(-rc)); + else if (migration_flags & MIGRATION_VERBOSE) + printf("%s\n", name); + return rc; } @@ -1105,6 +1180,30 @@ static int comp_str2flags(char *string, __u32 *flags, __u32 *neg_flags) return 0; } +static int mirror_str2state(char *string, __u16 *state, __u16 *neg_state) +{ + if (string == NULL) + return -EINVAL; + + *state = 0; + *neg_state = 0; + + if (strncmp(string, "^", 1) == 0) { + *neg_state = llapi_layout_string_flags(string + 1); + if (*neg_state != 0) + return 0; + } else { + *state = llapi_layout_string_flags(string); + if (*state != 0) + return 0; + } + + llapi_printf(LLAPI_MSG_ERROR, + "%s: mirrored file state '%s' not supported\n", + progname, string); + return -EINVAL; +} + /** * struct mirror_args - Command-line arguments for mirror(s). * @m_count: Number of mirrors to be created with this layout. @@ -1193,12 +1292,14 @@ static inline int mirror_sanity_check_one(struct llapi_layout *layout) * in case the victim file(s) contains the same data as the * original mirrored file. * @MF_DESTROY: Indicates to delete the mirror from the mirrored file. + * @MF_COMP_ID: specified component id instead of mirror id * * Flags for extending a mirrored file. */ enum mirror_flags { MF_NO_VERIFY = 0x1, MF_DESTROY = 0x2, + MF_COMP_ID = 0x4, }; /** @@ -1268,9 +1369,9 @@ static int mirror_create_sanity_check(const char *fname, } if (has_m_file && has_m_layout) { - fprintf(stderr, "error: %s: -f option should not " - "be specified with setstripe options or " - "--parent option\n", progname); + fprintf(stderr, + "error: %s: -f option should not be specified with setstripe options\n", + progname); return -EINVAL; } @@ -1357,7 +1458,7 @@ static int mirror_create(char *fname, struct mirror_args *mirror_list) goto error; } - rc = lfs_component_create(fname, O_CREAT | O_WRONLY, 0644, + rc = lfs_component_create(fname, O_CREAT | O_WRONLY, 0666, layout); if (rc >= 0) { close(rc); @@ -1535,7 +1636,7 @@ static int mirror_extend_layout(char *name, struct llapi_layout *layout) int fdv = -1; int rc; - rc = migrate_open_files(name, NULL, layout, &fd, &fdv); + rc = migrate_open_files(name, 0, NULL, layout, &fd, &fdv); if (rc < 0) goto out; @@ -1619,7 +1720,7 @@ static int mirror_extend(char *fname, struct mirror_args *mirror_list, return rc; } -static int verify_id(struct llapi_layout *layout, void *cbdata) +static int find_mirror_id(struct llapi_layout *layout, void *cbdata) { uint32_t id; int rc; @@ -1634,7 +1735,21 @@ static int verify_id(struct llapi_layout *layout, void *cbdata) return LLAPI_LAYOUT_ITER_CONT; } -static int mirror_split(const char *fname, __u16 mirror_id, +static int find_comp_id(struct llapi_layout *layout, void *cbdata) +{ + uint32_t id; + int rc; + + rc = llapi_layout_comp_id_get(layout, &id); + if (rc < 0) + return rc; + + if (id == *(__u32 *)cbdata) + return LLAPI_LAYOUT_ITER_STOP; + + return LLAPI_LAYOUT_ITER_CONT; +} +static int mirror_split(const char *fname, __u32 id, enum mirror_flags mflags, const char *victim_file) { struct llapi_layout *layout; @@ -1648,7 +1763,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, int fd, fdv; int rc; - /* check fname contains mirror with mirror_id */ + /* check fname contains mirror with mirror_id/comp_id */ layout = llapi_layout_get_by_path(fname, 0); if (!layout) { fprintf(stderr, @@ -1675,7 +1790,12 @@ static int mirror_split(const char *fname, __u16 mirror_id, goto free_layout; } - rc = llapi_layout_comp_iterate(layout, verify_id, &mirror_id); + if (mflags & MF_COMP_ID) { + rc = llapi_layout_comp_iterate(layout, find_comp_id, &id); + id = mirror_id_of(id); + } else { + rc = llapi_layout_comp_iterate(layout, find_mirror_id, &id); + } if (rc < 0) { fprintf(stderr, "error %s: failed to iterate layout of '%s'\n", progname, fname); @@ -1683,7 +1803,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, } else if (rc == LLAPI_LAYOUT_ITER_CONT) { fprintf(stderr, "error %s: file '%s' does not contain mirror with id %u\n", - progname, fname, mirror_id); + progname, fname, id); goto free_layout; } @@ -1700,7 +1820,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, fprintf(stderr, "error %s: file name of '%s' too long\n", progname, fname); rc = -ERANGE; - goto free_layout; + goto close_fd; } strncpy(parent, fname, sizeof(parent)); ptr = strrchr(parent, '/'); @@ -1709,7 +1829,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, fprintf(stderr, "error %s: getcwd failed: %s\n", progname, strerror(errno)); rc = -errno; - goto free_layout; + goto close_fd; } } else { if (ptr == parent) @@ -1721,7 +1841,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, if (rc < 0) { fprintf(stderr, "%s: cannot get MDT index of '%s'\n", progname, fname); - goto free_layout; + goto close_fd; } if (victim_file == NULL) { @@ -1731,7 +1851,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, O_LOV_DELAY_CREATE); } else { snprintf(victim, sizeof(victim), "%s.mirror~%u", - fname, mirror_id); + fname, id); fdv = open(victim, flags, S_IRUSR | S_IWUSR); } } else { @@ -1766,7 +1886,7 @@ static int mirror_split(const char *fname, __u16 mirror_id, data->lil_flags = LL_LEASE_LAYOUT_SPLIT; data->lil_count = 2; data->lil_ids[0] = fdv; - data->lil_ids[1] = mirror_id; + data->lil_ids[1] = id; rc = llapi_lease_set(fd, data); if (rc <= 0) { if (rc == 0) /* lost lease lock */ @@ -1878,13 +1998,18 @@ struct lfs_setstripe_args { __u32 lsa_comp_flags; __u32 lsa_comp_neg_flags; unsigned long long lsa_pattern; + unsigned int lsa_mirror_count; int lsa_nr_tgts; + bool lsa_first_comp; __u32 *lsa_tgts; char *lsa_pool_name; }; static inline void setstripe_args_init(struct lfs_setstripe_args *lsa) { + unsigned int mirror_count = lsa->lsa_mirror_count; + bool first_comp = lsa->lsa_first_comp; + memset(lsa, 0, sizeof(*lsa)); lsa->lsa_stripe_size = LLAPI_LAYOUT_DEFAULT; @@ -1892,6 +2017,9 @@ static inline void setstripe_args_init(struct lfs_setstripe_args *lsa) lsa->lsa_stripe_off = LLAPI_LAYOUT_DEFAULT; lsa->lsa_pattern = LLAPI_LAYOUT_RAID0; lsa->lsa_pool_name = NULL; + + lsa->lsa_mirror_count = mirror_count; + lsa->lsa_first_comp = first_comp; } /** @@ -1941,7 +2069,8 @@ static inline bool setstripe_args_specified(struct lfs_setstripe_args *lsa) * Return: 0 on success or an error code on failure. */ static int comp_args_to_layout(struct llapi_layout **composite, - struct lfs_setstripe_args *lsa) + struct lfs_setstripe_args *lsa, + bool set_extent) { struct llapi_layout *layout = *composite; uint64_t prev_end = 0; @@ -1967,19 +2096,30 @@ static int comp_args_to_layout(struct llapi_layout **composite, return rc; } - rc = llapi_layout_comp_add(layout); + if (lsa->lsa_first_comp) + prev_end = 0; + + if (lsa->lsa_first_comp) + rc = llapi_layout_add_first_comp(layout); + else + rc = llapi_layout_comp_add(layout); if (rc) { fprintf(stderr, "Add component failed. %s\n", strerror(errno)); return rc; } } + /* reset lsa_first_comp */ + lsa->lsa_first_comp = false; - rc = llapi_layout_comp_extent_set(layout, prev_end, lsa->lsa_comp_end); - if (rc) { - fprintf(stderr, "Set extent [%lu, %llu) failed. %s\n", - prev_end, lsa->lsa_comp_end, strerror(errno)); - return rc; + if (set_extent) { + rc = llapi_layout_comp_extent_set(layout, prev_end, + lsa->lsa_comp_end); + if (rc) { + fprintf(stderr, "Set extent [%lu, %llu) failed. %s\n", + prev_end, lsa->lsa_comp_end, strerror(errno)); + return rc; + } } /* Data-on-MDT component setting */ @@ -2069,7 +2209,7 @@ static int comp_args_to_layout(struct llapi_layout **composite, lsa->lsa_stripe_count != LLAPI_LAYOUT_DEFAULT && lsa->lsa_stripe_count != LLAPI_LAYOUT_WIDE && lsa->lsa_nr_tgts != lsa->lsa_stripe_count) { - fprintf(stderr, "stripe_count(%lld) != nr_osts(%d)\n", + fprintf(stderr, "stripe_count(%lld) != nr_tgts(%d)\n", lsa->lsa_stripe_count, lsa->lsa_nr_tgts); return -EINVAL; } @@ -2079,7 +2219,8 @@ static int comp_args_to_layout(struct llapi_layout **composite, if (rc) break; } - } else if (lsa->lsa_stripe_off != LLAPI_LAYOUT_DEFAULT) { + } else if (lsa->lsa_stripe_off != LLAPI_LAYOUT_DEFAULT && + lsa->lsa_stripe_off != -1) { rc = llapi_layout_ost_index_set(layout, 0, lsa->lsa_stripe_off); } if (rc) { @@ -2091,6 +2232,155 @@ static int comp_args_to_layout(struct llapi_layout **composite, return 0; } +static int build_component(struct llapi_layout **layout, + struct lfs_setstripe_args *lsa, bool set_extent) +{ + int rc; + + rc = comp_args_to_layout(layout, lsa, set_extent); + if (rc) + return rc; + + if (lsa->lsa_mirror_count > 0) { + rc = llapi_layout_mirror_count_set(*layout, + lsa->lsa_mirror_count); + if (rc) + return rc; + + rc = llapi_layout_flags_set(*layout, LCM_FL_RDONLY); + if (rc) + return rc; + lsa->lsa_mirror_count = 0; + } + + return rc; +} + +static int build_layout_from_yaml_node(struct cYAML *node, + struct llapi_layout **layout, + struct lfs_setstripe_args *lsa, + __u32 *osts) +{ + char *string; + int rc = 0; + + while (node) { + if (node->cy_type == CYAML_TYPE_OBJECT) { + /* go deep to sub blocks */ + rc = build_layout_from_yaml_node(node->cy_child, layout, + lsa, osts); + if (rc) + return rc; + } else { + if (node->cy_string == NULL) + return -EINVAL; + + string = node->cy_string; + /* skip leading lmm_ if present, to simplify parsing */ + if (strncmp(string, "lmm_", 4) == 0) + string += 4; + + if (node->cy_type == CYAML_TYPE_STRING) { + if (!strcmp(string, "lcme_extent.e_end")) { + if (!strcmp(node->cy_valuestring, "EOF") || + !strcmp(node->cy_valuestring, "eof")) + lsa->lsa_comp_end = LUSTRE_EOF; + } else if (!strcmp(string, "pool")) { + lsa->lsa_pool_name = node->cy_valuestring; + } else if (!strcmp(string, "pattern")) { + if (!strcmp(node->cy_valuestring, "mdt")) + lsa->lsa_pattern = LLAPI_LAYOUT_MDT; + } else if (!strcmp(string, "lcme_flags")) { + rc = comp_str2flags(node->cy_valuestring, + &lsa->lsa_comp_flags, + &lsa->lsa_comp_neg_flags); + if (rc) + return rc; + /* Only template flags have meaning in + * the layout for a new file + */ + lsa->lsa_comp_flags &= LCME_TEMPLATE_FLAGS; + } + } else if (node->cy_type == CYAML_TYPE_NUMBER) { + if (!strcmp(string, "lcm_mirror_count")) { + lsa->lsa_mirror_count = node->cy_valueint; + } else if (!strcmp(string, "lcme_extent.e_start")) { + if (node->cy_valueint != 0 || *layout != NULL) { + rc = build_component(layout, lsa, true); + if (rc) + return rc; + } + + if (node->cy_valueint == 0) + lsa->lsa_first_comp = true; + + /* initialize lsa */ + setstripe_args_init(lsa); + lsa->lsa_tgts = osts; + } else if (!strcmp(string, "lcme_extent.e_end")) { + if (node->cy_valueint == -1) + lsa->lsa_comp_end = LUSTRE_EOF; + else + lsa->lsa_comp_end = node->cy_valueint; + } else if (!strcmp(string, "stripe_count")) { + lsa->lsa_stripe_count = node->cy_valueint; + } else if (!strcmp(string, "stripe_size")) { + lsa->lsa_stripe_size = node->cy_valueint; + } else if (!strcmp(string, "stripe_offset")) { + lsa->lsa_stripe_off = node->cy_valueint; + } else if (!strcmp(string, "l_ost_idx")) { + osts[lsa->lsa_nr_tgts] = node->cy_valueint; + lsa->lsa_nr_tgts++; + } + } + } + node = node->cy_next; + } + + return rc; +} + +static int lfs_comp_create_from_yaml(char *template, + struct llapi_layout **layout, + struct lfs_setstripe_args *lsa, + __u32 *osts) +{ + struct cYAML *tree = NULL, *err_rc = NULL; + int rc = 0; + + tree = cYAML_build_tree(template, NULL, 0, &err_rc, false); + if (!tree) { + fprintf(stderr, "%s: cannot parse YAML file %s\n", + progname, template); + cYAML_build_error(-EINVAL, -1, "yaml", "from comp yaml", + "can't parse", &err_rc); + cYAML_print_tree2file(stderr, err_rc); + cYAML_free_tree(err_rc); + rc = -EINVAL; + goto err; + } + + /* initialize lsa for plain file */ + setstripe_args_init(lsa); + lsa->lsa_tgts = osts; + + rc = build_layout_from_yaml_node(tree, layout, lsa, osts); + if (rc) { + fprintf(stderr, "%s: cannot build layout from YAML file %s.\n", + progname, template); + goto err; + } else { + rc = build_component(layout, lsa, *layout != NULL); + } + /* clean clean lsa */ + setstripe_args_init(lsa); + +err: + if (tree) + cYAML_free_tree(tree); + return rc; +} + /* In 'lfs setstripe --component-add' mode, we need to fetch the extent * end of the last component in the existing file, and adjust the * first extent start of the components to be added accordingly. */ @@ -2257,35 +2547,37 @@ enum { LFS_COMP_DEL_OPT, LFS_COMP_SET_OPT, LFS_COMP_ADD_OPT, - LFS_COMP_USE_PARENT_OPT, LFS_COMP_NO_VERIFY_OPT, LFS_PROJID_OPT, LFS_MIRROR_FLAGS_OPT, LFS_MIRROR_ID_OPT, + LFS_MIRROR_STATE_OPT, + LFS_LAYOUT_COPY, + LFS_MIRROR_INDEX_OPT, }; /* functions */ static int lfs_setstripe_internal(int argc, char **argv, enum setstripe_origin opc) { - struct lfs_setstripe_args lsa; + struct lfs_setstripe_args lsa = { 0 }; struct llapi_stripe_param *param = NULL; struct find_param migrate_mdt_param = { .fp_max_depth = -1, .fp_mdt_index = -1, }; char *fname; - int result; + int result = 0; int result2 = 0; char *end; int c; int delete = 0; - char *mdt_idx_arg = NULL; unsigned long long size_units = 1; bool migrate_mode = false; + bool migrate_mdt_mode = false; bool migration_block = false; __u64 migration_flags = 0; - __u32 osts[LOV_MAX_STRIPE_COUNT] = { 0 }; + __u32 tgts[LOV_MAX_STRIPE_COUNT] = { 0 }; int comp_del = 0, comp_set = 0; int comp_add = 0; __u32 comp_id = 0; @@ -2300,8 +2592,12 @@ static int lfs_setstripe_internal(int argc, char **argv, struct mirror_args *last_mirror = NULL; __u16 mirror_id = 0; char cmd[PATH_MAX]; + bool from_yaml = false; + bool from_copy = false; + char *template = NULL; struct option long_opts[] = { +/* find { .val = '0', .name = "null", .has_arg = no_argument }, */ /* find { .val = 'A', .name = "atime", .has_arg = required_argument }*/ /* --block is only valid in migrate mode */ { .val = 'b', .name = "block", .has_arg = no_argument }, @@ -2323,19 +2619,22 @@ static int lfs_setstripe_internal(int argc, char **argv, { .val = LFS_COMP_SET_OPT, .name = "component-set", .has_arg = no_argument}, - { .val = LFS_COMP_USE_PARENT_OPT, - .name = "parent", .has_arg = no_argument}, { .val = LFS_COMP_NO_VERIFY_OPT, .name = "no-verify", .has_arg = no_argument}, { .val = LFS_MIRROR_FLAGS_OPT, .name = "flags", .has_arg = required_argument}, { .val = LFS_MIRROR_ID_OPT, .name = "mirror-id", .has_arg = required_argument}, + { .val = LFS_LAYOUT_COPY, + .name = "copy", .has_arg = required_argument}, { .val = 'c', .name = "stripe-count", .has_arg = required_argument}, { .val = 'c', .name = "stripe_count", .has_arg = required_argument}, + { .val = 'c', .name = "mdt-count", .has_arg = required_argument}, /* find { .val = 'C', .name = "ctime", .has_arg = required_argument }*/ { .val = 'd', .name = "delete", .has_arg = no_argument}, { .val = 'd', .name = "destroy", .has_arg = no_argument}, + /* --non-direct is only valid in migrate mode */ + { .val = 'D', .name = "non-direct", .has_arg = no_argument }, { .val = 'E', .name = "comp-end", .has_arg = required_argument}, { .val = 'E', .name = "component-end", .has_arg = required_argument}, @@ -2343,7 +2642,8 @@ static int lfs_setstripe_internal(int argc, char **argv, /* find { .val = 'F', .name = "fid", .has_arg = no_argument }, */ /* find { .val = 'g', .name = "gid", .has_arg = no_argument }, */ /* find { .val = 'G', .name = "group", .has_arg = required_argument }*/ -/* dirstripe { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }*/ +/* find { .val = 'h', .name = "help", .has_arg = no_argument }, */ + { .val = 'H', .name = "mdt-hash", .has_arg = required_argument}, { .val = 'i', .name = "stripe-index", .has_arg = required_argument}, { .val = 'i', .name = "stripe_index", .has_arg = required_argument}, { .val = 'I', .name = "comp-id", .has_arg = required_argument}, @@ -2373,7 +2673,7 @@ static int lfs_setstripe_internal(int argc, char **argv, /* find { .val = 'U', .name = "user", .has_arg = required_argument }*/ /* --verbose is only valid in migrate mode */ { .val = 'v', .name = "verbose", .has_arg = no_argument}, -/* getstripe { .val = 'y', .name = "yaml", .has_arg = no_argument }, */ + { .val = 'y', .name = "yaml", .has_arg = required_argument }, { .name = NULL } }; setstripe_args_init(&lsa); @@ -2383,8 +2683,9 @@ static int lfs_setstripe_internal(int argc, char **argv, snprintf(cmd, sizeof(cmd), "%s %s", progname, argv[0]); progname = cmd; - while ((c = getopt_long(argc, argv, "bc:dE:f:i:I:m:N::no:p:L:s:S:v", - long_opts, NULL)) >= 0) { + while ((c = getopt_long(argc, argv, + "bc:dDE:f:H:i:I:m:N::no:p:L:s:S:vy:", long_opts, + NULL)) >= 0) { switch (c) { case 0: /* Long options. */ @@ -2417,15 +2718,6 @@ static int lfs_setstripe_internal(int argc, char **argv, case LFS_COMP_SET_OPT: comp_set = 1; break; - case LFS_COMP_USE_PARENT_OPT: - if (!mirror_mode) { - fprintf(stderr, "error: %s: --parent must be " - "specified with --mirror-count|-N " - "option\n", progname); - goto usage_error; - } - setstripe_args_init(&lsa); - break; case LFS_COMP_NO_VERIFY_OPT: mirror_flags |= MF_NO_VERIFY; break; @@ -2467,6 +2759,10 @@ static int lfs_setstripe_internal(int argc, char **argv, } break; } + case LFS_LAYOUT_COPY: + from_copy = true; + template = optarg; + break; case 'b': if (!migrate_mode) { fprintf(stderr, @@ -2501,9 +2797,19 @@ static int lfs_setstripe_internal(int argc, char **argv, mirror_flags |= MF_DESTROY; } break; + case 'D': + if (!migrate_mode) { + fprintf(stderr, + "%s %s: -D|--non-direct is valid " + "only for migrate command\n", + progname, argv[0]); + goto usage_error; + } + migration_flags |= MIGRATION_NONDIRECT; + break; case 'E': if (lsa.lsa_comp_end != 0) { - result = comp_args_to_layout(lpp, &lsa); + result = comp_args_to_layout(lpp, &lsa, true); if (result) { fprintf(stderr, "%s %s: invalid layout\n", @@ -2528,6 +2834,20 @@ static int lfs_setstripe_internal(int argc, char **argv, } } break; + case 'H': + if (!migrate_mode) { + fprintf(stderr, "--mdt-hash is valid only for migrate command\n"); + return CMD_HELP; + } + + lsa.lsa_pattern = check_hashtype(optarg); + if (lsa.lsa_pattern == 0) { + fprintf(stderr, + "%s %s: bad stripe hash type '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; + } + break; case 'i': lsa.lsa_stripe_off = strtol(optarg, &end, 0); if (*end != '\0') { @@ -2600,11 +2920,24 @@ static int lfs_setstripe_internal(int argc, char **argv, case 'm': if (!migrate_mode) { fprintf(stderr, - "%s %s: -m|--mdt-index valid only for migrate command\n", + "%s %s: -m|--mdt-index is valid only for migrate command\n", progname, argv[0]); goto usage_error; } - mdt_idx_arg = optarg; + migrate_mdt_mode = true; + lsa.lsa_nr_tgts = parse_targets(tgts, + sizeof(tgts) / sizeof(__u32), + lsa.lsa_nr_tgts, optarg); + if (lsa.lsa_nr_tgts < 0) { + fprintf(stderr, + "%s %s: invalid MDT target(s) '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; + } + + lsa.lsa_tgts = tgts; + if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) + lsa.lsa_stripe_off = tgts[0]; break; case 'n': if (!migrate_mode) { @@ -2643,7 +2976,7 @@ static int lfs_setstripe_internal(int argc, char **argv, if (lsa.lsa_comp_end == 0) lsa.lsa_comp_end = LUSTRE_EOF; - result = comp_args_to_layout(lpp, &lsa); + result = comp_args_to_layout(lpp, &lsa, true); if (result) { lfs_mirror_free(new_mirror); goto error; @@ -2663,8 +2996,8 @@ static int lfs_setstripe_internal(int argc, char **argv, fprintf(stderr, "warning: '--ost-list' is " "deprecated, use '--ost' instead\n"); #endif - lsa.lsa_nr_tgts = parse_targets(osts, - sizeof(osts) / sizeof(__u32), + lsa.lsa_nr_tgts = parse_targets(tgts, + sizeof(tgts) / sizeof(__u32), lsa.lsa_nr_tgts, optarg); if (lsa.lsa_nr_tgts < 0) { fprintf(stderr, @@ -2673,14 +3006,19 @@ static int lfs_setstripe_internal(int argc, char **argv, goto usage_error; } - lsa.lsa_tgts = osts; + lsa.lsa_tgts = tgts; if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) - lsa.lsa_stripe_off = osts[0]; + lsa.lsa_stripe_off = tgts[0]; break; case 'p': if (optarg == NULL) goto usage_error; lsa.lsa_pool_name = optarg; + + if (strlen(lsa.lsa_pool_name) == 0 || + strncmp(lsa.lsa_pool_name, "none", + LOV_MAXPOOLNAME) == 0) + lsa.lsa_pool_name = NULL; break; case 'S': result = llapi_parse_size(optarg, &lsa.lsa_stripe_size, @@ -2700,6 +3038,11 @@ static int lfs_setstripe_internal(int argc, char **argv, goto usage_error; } migrate_mdt_param.fp_verbose = VERBOSE_DETAIL; + migration_flags = MIGRATION_VERBOSE; + break; + case 'y': + from_yaml = true; + template = optarg; break; default: fprintf(stderr, "%s %s: unrecognized option '%s'\n", @@ -2730,7 +3073,7 @@ static int lfs_setstripe_internal(int argc, char **argv, } if (lsa.lsa_comp_end != 0) { - result = comp_args_to_layout(lpp, &lsa); + result = comp_args_to_layout(lpp, &lsa, true); if (result) goto error; } @@ -2824,11 +3167,19 @@ static int lfs_setstripe_internal(int argc, char **argv, goto error; } - if (mdt_idx_arg != NULL && optind > 3) { + if (from_yaml && from_copy) { fprintf(stderr, - "%s %s: option -m cannot be used with other options\n", - progname, argv[0]); - goto usage_error; + "%s: can't specify --yaml and --copy together\n", + progname); + goto error; + } + + if ((from_yaml || from_copy) && + (setstripe_args_specified(&lsa) || layout != NULL)) { + fprintf(stderr, "error: %s: can't specify --yaml with " + "-c, -S, -i, -o, -p or -E options.\n", + argv[0]); + goto error; } if ((migration_flags & MIGRATION_NONBLOCK) && migration_block) { @@ -2838,21 +3189,67 @@ static int lfs_setstripe_internal(int argc, char **argv, goto usage_error; } - if (!comp_del && !comp_set && comp_id != 0) { + if (!comp_del && !comp_set && (opc != SO_MIRROR_SPLIT) && + comp_id != 0) { fprintf(stderr, - "%s %s: option -I can only be used with --component-del\n", + "%s %s: option -I can only be used with --component-del or --component-set or lfs mirror split\n", progname, argv[0]); goto usage_error; } - if (mdt_idx_arg != NULL) { + if (migrate_mdt_mode) { + struct lmv_user_md *lmu; + /* initialize migrate mdt parameters */ - migrate_mdt_param.fp_mdt_index = strtoul(mdt_idx_arg, &end, 0); - if (*end != '\0') { - fprintf(stderr, "%s %s: invalid MDT index '%s'\n", - progname, argv[0], mdt_idx_arg); + lmu = calloc(1, lmv_user_md_size(lsa.lsa_nr_tgts, + LMV_USER_MAGIC_SPECIFIC)); + if (!lmu) { + fprintf(stderr, + "%s %s: cannot allocate memory for lmv_user_md: %s\n", + progname, argv[0], strerror(ENOMEM)); + result = -ENOMEM; + goto error; + } + if (lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT) + lmu->lum_stripe_count = lsa.lsa_stripe_count; + if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) { + fprintf(stderr, + "%s %s: migrate should specify MDT index\n", + progname, argv[0]); + free(lmu); goto usage_error; } + lmu->lum_stripe_offset = lsa.lsa_stripe_off; + if (lsa.lsa_pattern != LLAPI_LAYOUT_RAID0) + lmu->lum_hash_type = lsa.lsa_pattern; + else + lmu->lum_hash_type = LMV_HASH_TYPE_FNV_1A_64; + if (lsa.lsa_pool_name) + strncpy(lmu->lum_pool_name, lsa.lsa_pool_name, + sizeof(lmu->lum_pool_name)); + if (lsa.lsa_nr_tgts > 1) { + int i; + + if (lsa.lsa_stripe_count > 0 && + lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT && + lsa.lsa_stripe_count != lsa.lsa_nr_tgts) { + fprintf(stderr, + "error: %s: stripe count %lld doesn't match the number of MDTs: %d\n", + progname, lsa.lsa_stripe_count, + lsa.lsa_nr_tgts); + free(lmu); + goto usage_error; + } + + lmu->lum_magic = LMV_USER_MAGIC_SPECIFIC; + lmu->lum_stripe_count = lsa.lsa_nr_tgts; + for (i = 0; i < lsa.lsa_nr_tgts; i++) + lmu->lum_objects[i].lum_mds = lsa.lsa_tgts[i]; + } else { + lmu->lum_magic = LMV_USER_MAGIC; + } + + migrate_mdt_param.fp_lmv_md = lmu; migrate_mdt_param.fp_migrate = 1; } else if (layout == NULL) { /* initialize stripe parameters */ @@ -2895,13 +3292,33 @@ static int lfs_setstripe_internal(int argc, char **argv, param->lsp_is_specific = true; param->lsp_stripe_count = lsa.lsa_nr_tgts; - memcpy(param->lsp_osts, osts, - sizeof(*osts) * lsa.lsa_nr_tgts); + memcpy(param->lsp_osts, tgts, + sizeof(*tgts) * lsa.lsa_nr_tgts); + } + } + + if (from_yaml) { + /* generate a layout from a YAML template */ + result = lfs_comp_create_from_yaml(template, &layout, + &lsa, tgts); + if (result) { + fprintf(stderr, "error: %s: can't create composite " + "layout from template file %s\n", + argv[0], template); + goto error; + } + } else if (from_copy) { + layout = llapi_layout_get_by_path(template, 0); + if (layout == NULL) { + fprintf(stderr, + "%s: can't create composite layout from file %s.\n", + progname, template); + goto error; } } for (fname = argv[optind]; fname != NULL; fname = argv[++optind]) { - if (mdt_idx_arg != NULL) { + if (migrate_mdt_mode) { result = llapi_migrate_mdt(fname, &migrate_mdt_param); } else if (migrate_mode) { result = lfs_migrate(fname, migration_flags, param, @@ -2922,18 +3339,22 @@ static int lfs_setstripe_internal(int argc, char **argv, result = mirror_extend(fname, mirror_list, mirror_flags); } else if (opc == SO_MIRROR_SPLIT) { - if (mirror_id == 0) { + if (mirror_id == 0 && comp_id == 0) { fprintf(stderr, - "%s %s: no mirror id is specified\n", + "%s %s: no mirror id or component id is specified\n", progname, argv[0]); goto usage_error; } - result = mirror_split(fname, mirror_id, mirror_flags, + if (mirror_id != 0) + comp_id = mirror_id; + else + mirror_flags |= MF_COMP_ID; + result = mirror_split(fname, comp_id, mirror_flags, has_m_file ? mirror_list->m_file : NULL); } else if (layout != NULL) { result = lfs_component_create(fname, O_CREAT | O_WRONLY, - 0644, layout); + 0666, layout); if (result >= 0) { close(result); result = 0; @@ -2941,7 +3362,7 @@ static int lfs_setstripe_internal(int argc, char **argv, } else { result = llapi_file_open_param(fname, O_CREAT | O_WRONLY, - 0644, param); + 0666, param); if (result >= 0) { close(result); result = 0; @@ -2956,6 +3377,7 @@ static int lfs_setstripe_internal(int argc, char **argv, } free(param); + free(migrate_mdt_param.fp_lmv_md); llapi_layout_free(layout); lfs_mirror_list_free(mirror_list); return result2; @@ -2977,28 +3399,38 @@ static int lfs_poollist(int argc, char **argv) static int set_time(time_t *time, time_t *set, char *str) { - time_t t; - int res = 0; + time_t t; + int res = 0; + char *endptr; - if (str[0] == '+') - res = 1; - else if (str[0] == '-') - res = -1; + if (str[0] == '+') + res = 1; + else if (str[0] == '-') + res = -1; - if (res) - str++; + if (res) + str++; - t = strtol(str, NULL, 0); - if (*time < t * 24 * 60 * 60) { - if (res) - str--; - fprintf(stderr, "Wrong time '%s' is specified.\n", str); - return INT_MAX; - } + t = strtol(str, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr, + "%s find: bad time '%s': %s\n", + progname, str, strerror(EINVAL)); + return INT_MAX; + } + if (*time < t * 24 * 60 * 60) { + if (res != 0) + str--; + fprintf(stderr, + "%s find: bad time '%s': too large\n", + progname, str); + return INT_MAX; + } - *set = *time - t * 24 * 60 * 60; - return res; + *set = *time - t * 24 * 60 * 60; + return res; } + static int name2uid(unsigned int *id, const char *name) { struct passwd *passwd; @@ -3084,6 +3516,7 @@ static int lfs_find(int argc, char **argv) }; struct option long_opts[] = { { .val = 'A', .name = "atime", .has_arg = required_argument }, + { .val = 'b', .name = "blocks", .has_arg = required_argument }, { .val = LFS_COMP_COUNT_OPT, .name = "comp-count", .has_arg = required_argument }, { .val = LFS_COMP_COUNT_OPT, @@ -3099,6 +3532,8 @@ static int lfs_find(int argc, char **argv) { .val = LFS_COMP_START_OPT, .name = "component-start", .has_arg = required_argument }, + { .val = LFS_MIRROR_STATE_OPT, + .name = "mirror-state", .has_arg = required_argument }, { .val = 'c', .name = "stripe-count", .has_arg = required_argument }, { .val = 'c', .name = "stripe_count", .has_arg = required_argument }, { .val = 'C', .name = "ctime", .has_arg = required_argument }, @@ -3120,6 +3555,7 @@ static int lfs_find(int argc, char **argv) { .val = 'm', .name = "mdt_index", .has_arg = required_argument }, { .val = 'M', .name = "mtime", .has_arg = required_argument }, { .val = 'n', .name = "name", .has_arg = required_argument }, + { .val = 'N', .name = "mirror-count", .has_arg = required_argument }, /* find { .val = 'o' .name = "or", .has_arg = no_argument }, like find(1) */ { .val = 'O', .name = "obd", .has_arg = required_argument }, { .val = 'O', .name = "ost", .has_arg = required_argument }, @@ -3155,7 +3591,7 @@ static int lfs_find(int argc, char **argv) /* when getopt_long_only() hits '!' it returns 1, puts "!" in optarg */ while ((c = getopt_long_only(argc, argv, - "-0A:c:C:D:E:g:G:H:i:L:m:M:n:O:Ppqrs:S:t:T:u:U:v", + "-0A:b:c:C:D:E:g:G:H:i:L:m:M:n:N:O:Ppqrs:S:t:T:u:U:v", long_opts, NULL)) >= 0) { xtime = NULL; xsign = NULL; @@ -3217,6 +3653,26 @@ static int lfs_find(int argc, char **argv) if (rc) *xsign = rc; break; + case 'b': + if (optarg[0] == '+') { + param.fp_blocks_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_blocks_sign = 1; + optarg++; + } + + param.fp_blocks_units = 1024; + ret = llapi_parse_size(optarg, ¶m.fp_blocks, + ¶m.fp_blocks_units, 0); + if (ret) { + fprintf(stderr, "error: bad blocks '%s'\n", + optarg); + goto err; + } + param.fp_check_blocks = 1; + param.fp_exclude_blocks = !!neg_opt; + break; case LFS_COMP_COUNT_OPT: if (optarg[0] == '+') { param.fp_comp_count_sign = -1; @@ -3269,6 +3725,23 @@ static int lfs_find(int argc, char **argv) param.fp_check_comp_start = 1; param.fp_exclude_comp_start = !!neg_opt; break; + case LFS_MIRROR_STATE_OPT: + rc = mirror_str2state(optarg, ¶m.fp_mirror_state, + ¶m.fp_mirror_neg_state); + if (rc) { + fprintf(stderr, + "error: bad mirrored file state '%s'\n", + optarg); + goto err; + } + param.fp_check_mirror_state = 1; + if (neg_opt) { + __u16 state = param.fp_mirror_neg_state; + param.fp_mirror_neg_state = + param.fp_mirror_state; + param.fp_mirror_state = state; + } + break; case 'c': if (optarg[0] == '+') { param.fp_stripe_count_sign = -1; @@ -3369,6 +3842,25 @@ static int lfs_find(int argc, char **argv) param.fp_pattern = (char *)optarg; param.fp_exclude_pattern = !!neg_opt; break; + case 'N': + if (optarg[0] == '+') { + param.fp_mirror_count_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param.fp_mirror_count_sign = 1; + optarg++; + } + + param.fp_mirror_count = strtoul(optarg, &endptr, 0); + if (*endptr != '\0') { + fprintf(stderr, + "error: bad mirror count '%s'\n", + optarg); + goto err; + } + param.fp_check_mirror_count = 1; + param.fp_exclude_mirror_count = !!neg_opt; + break; case 'm': case 'i': case 'O': { @@ -3619,6 +4111,7 @@ static int lfs_getstripe_internal(int argc, char **argv, { struct option long_opts[] = { /* find { .val = 'A', .name = "atime", .has_arg = required_argument }*/ +/* find { .val = 'b', .name = "blocks", .has_arg = required_argument }*/ { .val = LFS_COMP_COUNT_OPT, .name = "comp-count", .has_arg = no_argument }, { .val = LFS_COMP_COUNT_OPT, @@ -3631,6 +4124,10 @@ static int lfs_getstripe_internal(int argc, char **argv, .name = "comp-start", .has_arg = optional_argument }, { .val = LFS_COMP_START_OPT, .name = "component-start", .has_arg = optional_argument }, + { .val = LFS_MIRROR_INDEX_OPT, + .name = "mirror-index", .has_arg = required_argument }, + { .val = LFS_MIRROR_ID_OPT, + .name = "mirror-id", .has_arg = required_argument }, { .val = 'c', .name = "stripe-count", .has_arg = no_argument }, { .val = 'c', .name = "stripe_count", .has_arg = no_argument }, /* find { .val = 'C', .name = "ctime", .has_arg = required_argument }*/ @@ -3652,6 +4149,7 @@ static int lfs_getstripe_internal(int argc, char **argv, { .val = 'm', .name = "mdt_index", .has_arg = no_argument }, /* find { .val = 'M', .name = "mtime", .has_arg = required_argument }*/ /* find { .val = 'n', .name = "name", .has_arg = required_argument }*/ + { .val = 'N', .name = "mirror-count", .has_arg = no_argument }, { .val = 'O', .name = "obd", .has_arg = required_argument }, { .val = 'O', .name = "ost", .has_arg = required_argument }, { .val = 'p', .name = "pool", .has_arg = no_argument }, @@ -3669,11 +4167,36 @@ static int lfs_getstripe_internal(int argc, char **argv, { .val = 'y', .name = "yaml", .has_arg = no_argument }, { .name = NULL } }; int c, rc; + int neg_opt = 0; + int pathstart = -1, pathend = -1; + int isoption; char *end, *tmp; - while ((c = getopt_long(argc, argv, "cdDE::FghiI::LmMoO:pqrRsSvy", - long_opts, NULL)) != -1) { + while ((c = getopt_long(argc, argv, + "-cdDE::FghiI::LmMNoO:pqrRsSvy", + long_opts, NULL)) != -1) { + if (neg_opt) + --neg_opt; + + /* '!' is part of option */ + isoption = (c != 1) || (strcmp(optarg, "!") == 0); + if (!isoption && pathend != -1) { + fprintf(stderr, + "error: %s: filename|dirname must either precede options or follow options\n", + argv[0]); + return CMD_HELP; + } + if (!isoption && pathstart == -1) + pathstart = optind - 1; + if (isoption && pathstart != -1 && pathend == -1) + pathend = optind - 2; + switch (c) { + case 1: + /* unknown: opt is "!" */ + if (strcmp(optarg, "!") == 0) + neg_opt = 2; + break; case 'c': if (!(param->fp_verbose & VERBOSE_DETAIL)) { param->fp_verbose |= VERBOSE_COUNT; @@ -3727,6 +4250,58 @@ static int lfs_getstripe_internal(int argc, char **argv, param->fp_max_depth = 0; } break; + case LFS_MIRROR_INDEX_OPT: + if (optarg[0] == '+') { + param->fp_mirror_index_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param->fp_mirror_index_sign = 1; + optarg++; + } + + param->fp_mirror_index = strtoul(optarg, &end, 0); + if (*end != '\0' || (param->fp_mirror_index == 0 && + param->fp_mirror_index_sign == 0 && neg_opt == 0)) { + fprintf(stderr, + "%s %s: invalid mirror index '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; + } + if (param->fp_mirror_id != 0) { + fprintf(stderr, + "%s %s: can't specify both mirror index and mirror ID\n", + progname, argv[0]); + return CMD_HELP; + } + param->fp_check_mirror_index = 1; + param->fp_exclude_mirror_index = !!neg_opt; + break; + case LFS_MIRROR_ID_OPT: + if (optarg[0] == '+') { + param->fp_mirror_id_sign = -1; + optarg++; + } else if (optarg[0] == '-') { + param->fp_mirror_id_sign = 1; + optarg++; + } + + param->fp_mirror_id = strtoul(optarg, &end, 0); + if (*end != '\0' || (param->fp_mirror_id == 0 && + param->fp_mirror_id_sign == 0 && neg_opt == 0)) { + fprintf(stderr, + "%s %s: invalid mirror ID '%s'\n", + progname, argv[0], optarg); + return CMD_HELP; + } + if (param->fp_mirror_index != 0) { + fprintf(stderr, + "%s %s: can't specify both mirror index and mirror ID\n", + progname, argv[0]); + return CMD_HELP; + } + param->fp_check_mirror_id = 1; + param->fp_exclude_mirror_id = !!neg_opt; + break; case 'd': param->fp_max_depth = 0; break; @@ -3779,7 +4354,7 @@ static int lfs_getstripe_internal(int argc, char **argv, break; case 'i': if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_OFFSET; + param->fp_verbose |= VERBOSE_STRIPE_OFFSET; param->fp_max_depth = 0; } break; @@ -3802,7 +4377,7 @@ static int lfs_getstripe_internal(int argc, char **argv, break; case 'L': if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_LAYOUT; + param->fp_verbose |= VERBOSE_PATTERN; param->fp_max_depth = 0; } break; @@ -3816,9 +4391,15 @@ static int lfs_getstripe_internal(int argc, char **argv, param->fp_max_depth = 0; param->fp_verbose |= VERBOSE_MDTINDEX; break; - case 'O': - if (param->fp_obd_uuid) { - fprintf(stderr, + case 'N': + if (!(param->fp_verbose & VERBOSE_DETAIL)) { + param->fp_verbose |= VERBOSE_MIRROR_COUNT; + param->fp_max_depth = 0; + } + break; + case 'O': + if (param->fp_obd_uuid) { + fprintf(stderr, "error: %s: only one obduuid allowed", argv[0]); return CMD_HELP; @@ -3842,7 +4423,7 @@ static int lfs_getstripe_internal(int argc, char **argv, break; case 'S': if (!(param->fp_verbose & VERBOSE_DETAIL)) { - param->fp_verbose |= VERBOSE_SIZE; + param->fp_verbose |= VERBOSE_STRIPE_SIZE; param->fp_max_depth = 0; } break; @@ -3857,7 +4438,16 @@ static int lfs_getstripe_internal(int argc, char **argv, } } - if (optind >= argc) + if (pathstart == -1) { + fprintf(stderr, "error: %s: no filename|pathname\n", + argv[0]); + return CMD_HELP; + } else if (pathend == -1) { + /* no options */ + pathend = argc; + } + + if (pathend > argc) return CMD_HELP; if (param->fp_recursive) @@ -3871,8 +4461,8 @@ static int lfs_getstripe_internal(int argc, char **argv, param->fp_verbose = VERBOSE_OBJID; do { - rc = llapi_getstripe(argv[optind], param); - } while (++optind < argc && !rc); + rc = llapi_getstripe(argv[pathstart], param); + } while (++pathstart < pathend && !rc); if (rc) fprintf(stderr, "error: %s failed for %s.\n", @@ -3958,7 +4548,7 @@ static int lfs_getdirstripe(int argc, char **argv) break; case 'i': case 'm': - param.fp_verbose |= VERBOSE_OFFSET; + param.fp_verbose |= VERBOSE_STRIPE_OFFSET; break; #if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) case 't': @@ -4007,12 +4597,345 @@ static int lfs_getdirstripe(int argc, char **argv) return rc; } +enum mntdf_flags { + MNTDF_INODES = 0x0001, + MNTDF_COOKED = 0x0002, + MNTDF_LAZY = 0x0004, + MNTDF_VERBOSE = 0x0008, + MNTDF_SHOW = 0x0010, +}; + +#define COOK(value) \ +({ \ + int radix = 0; \ + while (value > 1024) { \ + value /= 1024; \ + radix++; \ + } \ + radix; \ +}) +#define UUF "%-20s" +#define CSF "%11s" +#define CDF "%11llu" +#define HDF "%8.1f%c" +#define RSF "%4s" +#define RDF "%3d%%" + +static inline int obd_statfs_ratio(const struct obd_statfs *st, bool inodes) +{ + double avail, used, ratio = 0; + + if (inodes) { + avail = st->os_ffree; + used = st->os_files - st->os_ffree; + } else { + avail = st->os_bavail; + used = st->os_blocks - st->os_bfree; + } + if (avail + used > 0) + ratio = used / (used + avail) * 100; + + /* Round up to match df(1) usage percentage */ + return (ratio - (int)ratio) > 0 ? (int)(ratio + 1) : (int)ratio; +} + +static int showdf(char *mntdir, struct obd_statfs *stat, + char *uuid, enum mntdf_flags flags, + char *type, int index, int rc) +{ + long long avail, used, total; + int ratio = 0; + char *suffix = "KMGTPEZY"; + /* Note if we have >2^64 bytes/fs these buffers will need to be grown */ + char tbuf[3 * sizeof(__u64)]; + char ubuf[3 * sizeof(__u64)]; + char abuf[3 * sizeof(__u64)]; + char rbuf[3 * sizeof(__u64)]; + + if (!uuid || !stat) + return -EINVAL; + + switch (rc) { + case 0: + if (flags & MNTDF_INODES) { + avail = stat->os_ffree; + used = stat->os_files - stat->os_ffree; + total = stat->os_files; + } else { + int shift = flags & MNTDF_COOKED ? 0 : 10; + + avail = (stat->os_bavail * stat->os_bsize) >> shift; + used = ((stat->os_blocks - stat->os_bfree) * + stat->os_bsize) >> shift; + total = (stat->os_blocks * stat->os_bsize) >> shift; + } + + ratio = obd_statfs_ratio(stat, flags & MNTDF_INODES); + + if (flags & MNTDF_COOKED) { + int i; + double cook_val; + + cook_val = (double)total; + i = COOK(cook_val); + if (i > 0) + snprintf(tbuf, sizeof(tbuf), HDF, cook_val, + suffix[i - 1]); + else + snprintf(tbuf, sizeof(tbuf), CDF, total); + + cook_val = (double)used; + i = COOK(cook_val); + if (i > 0) + snprintf(ubuf, sizeof(ubuf), HDF, cook_val, + suffix[i - 1]); + else + snprintf(ubuf, sizeof(ubuf), CDF, used); + + cook_val = (double)avail; + i = COOK(cook_val); + if (i > 0) + snprintf(abuf, sizeof(abuf), HDF, cook_val, + suffix[i - 1]); + else + snprintf(abuf, sizeof(abuf), CDF, avail); + } else { + snprintf(tbuf, sizeof(tbuf), CDF, total); + snprintf(ubuf, sizeof(tbuf), CDF, used); + snprintf(abuf, sizeof(tbuf), CDF, avail); + } + + sprintf(rbuf, RDF, ratio); + printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s", + uuid, tbuf, ubuf, abuf, rbuf, mntdir); + if (type) + printf("[%s:%d]", type, index); + + if (stat->os_state) { + /* + * Each character represents the matching + * OS_STATE_* bit. + */ + const char state_names[] = "DRSI"; + __u32 state; + __u32 i; + + printf(" "); + for (i = 0, state = stat->os_state; + state && i < sizeof(state_names); i++) { + if (!(state & (1 << i))) + continue; + printf("%c", state_names[i]); + state ^= 1 << i; + } + } + + printf("\n"); + break; + case -ENODATA: + printf(UUF": inactive device\n", uuid); + break; + default: + printf(UUF": %s\n", uuid, strerror(-rc)); + break; + } + + return 0; +} + +struct ll_stat_type { + int st_op; + char *st_name; +}; + +#define LL_STATFS_MAX LOV_MAX_STRIPE_COUNT + +struct ll_statfs_data { + int sd_index; + struct obd_statfs sd_st; +}; + +struct ll_statfs_buf { + int sb_count; + struct ll_statfs_data sb_buf[LL_STATFS_MAX]; +}; + +static int mntdf(char *mntdir, char *fsname, char *pool, enum mntdf_flags flags, + int ops, struct ll_statfs_buf *lsb) +{ + struct obd_statfs stat_buf, sum = { .os_bsize = 1 }; + struct obd_uuid uuid_buf; + char *poolname = NULL; + struct ll_stat_type types[] = { + { .st_op = LL_STATFS_LMV, .st_name = "MDT" }, + { .st_op = LL_STATFS_LOV, .st_name = "OST" }, + { .st_name = NULL } }; + struct ll_stat_type *tp; + __u64 ost_ffree = 0; + __u32 index; + __u32 type; + int fd; + int rc = 0; + int rc2; + + if (pool) { + poolname = strchr(pool, '.'); + if (poolname != NULL) { + if (strncmp(fsname, pool, strlen(fsname))) { + fprintf(stderr, "filesystem name incorrect\n"); + return -ENODEV; + } + poolname++; + } else + poolname = pool; + } + + fd = open(mntdir, O_RDONLY); + if (fd < 0) { + rc = -errno; + fprintf(stderr, "%s: cannot open '%s': %s\n", progname, mntdir, + strerror(errno)); + return rc; + } + + if (flags & MNTDF_SHOW) { + if (flags & MNTDF_INODES) + printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", + "UUID", "Inodes", "IUsed", "IFree", + "IUse%", "Mounted on"); + else + printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", + "UUID", + flags & MNTDF_COOKED ? "bytes" : "1K-blocks", + "Used", "Available", "Use%", "Mounted on"); + } + + for (tp = types; tp->st_name != NULL; tp++) { + bool have_ost = false; + + if (!(tp->st_op & ops)) + continue; + + for (index = 0; ; index++) { + memset(&stat_buf, 0, sizeof(struct obd_statfs)); + memset(&uuid_buf, 0, sizeof(struct obd_uuid)); + type = flags & MNTDF_LAZY ? + tp->st_op | LL_STATFS_NODELAY : tp->st_op; + rc2 = llapi_obd_fstatfs(fd, type, index, + &stat_buf, &uuid_buf); + if (rc2 == -ENODEV) + break; + if (rc2 == -EAGAIN) + continue; + if (rc2 == -ENODATA) { /* Inactive device, OK. */ + if (!(flags & MNTDF_VERBOSE)) + continue; + } else if (rc2 < 0 && rc == 0) { + rc = rc2; + } + + /* If we have OSTs then don't report MDT block counts. + * For MDT-only filesystems the expectation is that all + * layouts have a DoM component. For filesystems with + * OSTs, files are not necessarily going to store data + * on MDTs, and MDT space is limited to a fraction of + * OST space, so don't include it in the summary. + */ + if (tp->st_op == LL_STATFS_LOV && !have_ost) { + have_ost = true; + sum.os_blocks = 0; + sum.os_bfree = 0; + sum.os_bavail = 0; + } + + if (poolname && tp->st_op == LL_STATFS_LOV && + llapi_search_ost(fsname, poolname, + obd_uuid2str(&uuid_buf)) != 1) + continue; + + /* the llapi_obd_statfs() call may have returned with + * an error, but if it filled in uuid_buf we will at + * lease use that to print out a message for that OBD. + * If we didn't get anything in the uuid_buf, then fill + * it in so that we can print an error message. */ + if (uuid_buf.uuid[0] == '\0') + snprintf(uuid_buf.uuid, sizeof(uuid_buf.uuid), + "%s%04x", tp->st_name, index); + if (!rc && lsb) { + lsb->sb_buf[lsb->sb_count].sd_index = index; + lsb->sb_buf[lsb->sb_count].sd_st = stat_buf; + lsb->sb_count++; + } + if (flags & MNTDF_SHOW) + showdf(mntdir, &stat_buf, + obd_uuid2str(&uuid_buf), flags, + tp->st_name, index, rc2); + + if (rc2) + continue; + + if (tp->st_op == LL_STATFS_LMV) { + sum.os_ffree += stat_buf.os_ffree; + sum.os_files += stat_buf.os_files; + } else /* if (tp->st_op == LL_STATFS_LOV) */ { + ost_ffree += stat_buf.os_ffree; + } + sum.os_blocks += stat_buf.os_blocks * + stat_buf.os_bsize; + sum.os_bfree += stat_buf.os_bfree * + stat_buf.os_bsize; + sum.os_bavail += stat_buf.os_bavail * + stat_buf.os_bsize; + } + } + + close(fd); + + /* If we don't have as many objects free on the OST as inodes + * on the MDS, we reduce the total number of inodes to + * compensate, so that the "inodes in use" number is correct. + * Matches ll_statfs_internal() so the results are consistent. */ + if (ost_ffree < sum.os_ffree) { + sum.os_files = (sum.os_files - sum.os_ffree) + ost_ffree; + sum.os_ffree = ost_ffree; + } + if (flags & MNTDF_SHOW) { + printf("\n"); + showdf(mntdir, &sum, "filesystem_summary:", flags, NULL, 0, 0); + printf("\n"); + } + + return rc; +} + +static int ll_statfs_data_comp(const void *sd1, const void *sd2) +{ + const struct obd_statfs *st1 = &((const struct ll_statfs_data *)sd1)-> + sd_st; + const struct obd_statfs *st2 = &((const struct ll_statfs_data *)sd2)-> + sd_st; + int r1 = obd_statfs_ratio(st1, false); + int r2 = obd_statfs_ratio(st2, false); + int64_t result = r1 - r2; + + /* if both space usage are above 90, compare free inodes */ + if (r1 > 90 && r2 > 90) + result = st2->os_ffree - st1->os_ffree; + + if (result < 0) + return -1; + else if (result == 0) + return 0; + else + return 1; +} + /* functions */ static int lfs_setdirstripe(int argc, char **argv) { char *dname; int result; - struct lfs_setstripe_args lsa; + struct lfs_setstripe_args lsa = { 0 }; struct llapi_stripe_param *param = NULL; __u32 mdts[LMV_MAX_STRIPE_COUNT] = { 0 }; char *end; @@ -4022,6 +4945,9 @@ static int lfs_setdirstripe(int argc, char **argv) mode_t mode = S_IRWXU | S_IRWXG | S_IRWXO; mode_t previous_mode = 0; bool delete = false; + struct ll_statfs_buf *lsb = NULL; + char mntdir[PATH_MAX] = ""; + bool auto_distributed = false; struct option long_opts[] = { { .val = 'c', .name = "count", .has_arg = required_argument }, @@ -4030,7 +4956,13 @@ static int lfs_setdirstripe(int argc, char **argv) { .val = 'D', .name = "default", .has_arg = no_argument }, { .val = 'D', .name = "default_stripe", .has_arg = no_argument }, { .val = 'H', .name = "mdt-hash", .has_arg = required_argument }, +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 17, 53, 0) { .val = 'i', .name = "mdt-index", .has_arg = required_argument }, + { .val = 'i', .name = "mdt", .has_arg = required_argument }, +#else + { .val = 'm', .name = "mdt-index", .has_arg = required_argument }, + { .val = 'm', .name = "mdt", .has_arg = required_argument }, +#endif #if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) { .val = 'i', .name = "index", .has_arg = required_argument }, #endif @@ -4039,6 +4971,7 @@ static int lfs_setdirstripe(int argc, char **argv) { .val = 't', .name = "hash-type", .has_arg = required_argument }, #endif { .val = 'T', .name = "mdt-count", .has_arg = required_argument }, +/* setstripe { .val = 'y', .name = "yaml", .has_arg = no_argument }, */ { .name = NULL } }; setstripe_args_init(&lsa); @@ -4081,6 +5014,11 @@ static int lfs_setdirstripe(int argc, char **argv) } break; case 'i': +#if LUSTRE_VERSION_CODE >= OBD_OCD_VERSION(2, 17, 53, 0) + case 'm': +#endif + fprintf(stderr, "warning: '-m' is deprecated, " + "use '--mode' or '-o' instead\n"); #if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) if (strcmp(argv[optind - 1], "--index") == 0) fprintf(stderr, @@ -4101,7 +5039,7 @@ static int lfs_setdirstripe(int argc, char **argv) if (lsa.lsa_stripe_off == LLAPI_LAYOUT_DEFAULT) lsa.lsa_stripe_off = mdts[0]; break; -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 16, 53, 0) +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 15, 53, 0) case 'm': fprintf(stderr, "warning: '-m' is deprecated, " "use '--mode' or '-o' instead\n"); @@ -4150,8 +5088,13 @@ static int lfs_setdirstripe(int argc, char **argv) previous_mode = umask(0); } - /* initialize stripe parameters */ - param = calloc(1, offsetof(typeof(*param), lsp_osts[lsa.lsa_nr_tgts])); + /* + * initialize stripe parameters, in case param is converted to specific, + * i.e, 'lfs mkdir -i -1 -c N', always allocate space for lsp_tgts. + */ + param = calloc(1, offsetof(typeof(*param), + lsp_tgts[lsa.lsa_stripe_count != LLAPI_LAYOUT_DEFAULT ? + lsa.lsa_stripe_count : lsa.lsa_nr_tgts])); if (param == NULL) { fprintf(stderr, "%s %s: cannot allocate memory for parameters: %s\n", @@ -4189,10 +5132,102 @@ static int lfs_setdirstripe(int argc, char **argv) dname = argv[optind]; do { - if (default_stripe) + if (default_stripe) { result = llapi_dir_set_default_lmv(dname, param); - else - result = llapi_dir_create_param(dname, mode, param); + } else { + /* if current \a dname isn't under the same \a mntdir + * as the last one, and the last one was + * auto-distributed, restore \a param. + */ + if (mntdir[0] != '\0' && + strncmp(dname, mntdir, strlen(mntdir)) && + auto_distributed) { + param->lsp_is_specific = false; + param->lsp_stripe_offset = -1; + auto_distributed = false; + } + + if (!param->lsp_is_specific && + param->lsp_stripe_offset == -1) { + char path[PATH_MAX] = ""; + + if (!lsb) { + lsb = malloc(sizeof(*lsb)); + if (!lsb) { + result = -ENOMEM; + break; + } + } + lsb->sb_count = 0; + + /* use mntdir for dirname() temporarily */ + strncpy(mntdir, dname, sizeof(mntdir)); + if (!realpath(dirname(mntdir), path)) { + result = -errno; + fprintf(stderr, + "error: invalid path '%s': %s\n", + argv[optind], strerror(errno)); + break; + } + mntdir[0] = '\0'; + + result = llapi_search_mounts(path, 0, mntdir, + NULL); + if (result < 0 || mntdir[0] == '\0') { + fprintf(stderr, + "No suitable Lustre mount found\n"); + break; + } + + result = mntdf(mntdir, NULL, NULL, 0, + LL_STATFS_LMV, lsb); + if (result < 0) + break; + + if (param->lsp_stripe_count > lsb->sb_count) { + fprintf(stderr, + "error: stripe count %d is too big\n", + param->lsp_stripe_count); + result = -ERANGE; + break; + } + + qsort(lsb->sb_buf, lsb->sb_count, + sizeof(struct ll_statfs_data), + ll_statfs_data_comp); + + auto_distributed = true; + } + + if (auto_distributed) { + int r; + int nr = MAX(param->lsp_stripe_count, + lsb->sb_count / 2); + + /* don't use server whose usage is above 90% */ + while (nr != param->lsp_stripe_count && + obd_statfs_ratio(&lsb->sb_buf[nr].sd_st, + false) > 90) + nr = MAX(param->lsp_stripe_count, + nr / 2); + + /* get \a r between [0, nr) */ + r = rand() % nr; + + param->lsp_stripe_offset = + lsb->sb_buf[r].sd_index; + if (param->lsp_stripe_count > 1) { + int i = 0; + + param->lsp_is_specific = true; + for (; i < param->lsp_stripe_count; i++) + param->lsp_tgts[(i + r) % nr] = + lsb->sb_buf[i].sd_index; + } + } + + result = llapi_dir_create(dname, mode, param); + } if (result) { fprintf(stderr, @@ -4206,6 +5241,7 @@ static int lfs_setdirstripe(int argc, char **argv) if (mode_opt != NULL) umask(previous_mode); + free(lsb); free(param); return result; } @@ -4220,343 +5256,102 @@ static int lfs_rmentry(int argc, char **argv) if (argc <= 1) { fprintf(stderr, "error: %s: missing dirname\n", argv[0]); - return CMD_HELP; - } - - index = 1; - dname = argv[index]; - while (dname != NULL) { - result = llapi_direntry_remove(dname); - if (result) { - fprintf(stderr, "error: %s: remove dir entry '%s' " - "failed\n", argv[0], dname); - break; - } - dname = argv[++index]; - } - return result; -} - -static int lfs_mv(int argc, char **argv) -{ - struct find_param param = { - .fp_max_depth = -1, - .fp_mdt_index = -1, - }; - char *end; - int c; - int rc = 0; - struct option long_opts[] = { - { .val = 'm', .name = "mdt-index", .has_arg = required_argument }, - { .val = 'v', .name = "verbose", .has_arg = no_argument }, - { .name = NULL } }; - - while ((c = getopt_long(argc, argv, "m:M:v", long_opts, NULL)) != -1) { - switch (c) { -#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) - case 'M': - fprintf(stderr, "warning: '-M' deprecated" - ", use '--mdt-index' or '-m' instead\n"); -#endif - case 'm': - param.fp_mdt_index = strtoul(optarg, &end, 0); - if (*end != '\0') { - fprintf(stderr, "%s: invalid MDT index'%s'\n", - argv[0], optarg); - return CMD_HELP; - } - break; - case 'v': - param.fp_verbose = VERBOSE_DETAIL; - break; - default: - fprintf(stderr, "error: %s: unrecognized option '%s'\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } - } - - if (param.fp_mdt_index == -1) { - fprintf(stderr, "%s: MDT index must be specified\n", argv[0]); - return CMD_HELP; - } - - if (optind >= argc) { - fprintf(stderr, "%s: missing operand path\n", argv[0]); - return CMD_HELP; - } - - param.fp_migrate = 1; - rc = llapi_migrate_mdt(argv[optind], ¶m); - if (rc != 0) - fprintf(stderr, "%s: cannot migrate '%s' to MDT%04x: %s\n", - argv[0], argv[optind], param.fp_mdt_index, - strerror(-rc)); - return rc; -} - -static int lfs_osts(int argc, char **argv) -{ - return lfs_tgts(argc, argv); -} - -static int lfs_mdts(int argc, char **argv) -{ - return lfs_tgts(argc, argv); -} - -#define COOK(value) \ -({ \ - int radix = 0; \ - while (value > 1024) { \ - value /= 1024; \ - radix++; \ - } \ - radix; \ -}) -#define UUF "%-20s" -#define CSF "%11s" -#define CDF "%11llu" -#define HDF "%8.1f%c" -#define RSF "%4s" -#define RDF "%3d%%" - -enum mntdf_flags { - MNTDF_INODES = 0x0001, - MNTDF_COOKED = 0x0002, - MNTDF_LAZY = 0x0004, - MNTDF_VERBOSE = 0x0008, -}; - -static int showdf(char *mntdir, struct obd_statfs *stat, - char *uuid, enum mntdf_flags flags, - char *type, int index, int rc) -{ - long long avail, used, total; - double ratio = 0; - char *suffix = "KMGTPEZY"; - /* Note if we have >2^64 bytes/fs these buffers will need to be grown */ - char tbuf[3 * sizeof(__u64)]; - char ubuf[3 * sizeof(__u64)]; - char abuf[3 * sizeof(__u64)]; - char rbuf[3 * sizeof(__u64)]; - - if (!uuid || !stat) - return -EINVAL; - - switch (rc) { - case 0: - if (flags & MNTDF_INODES) { - avail = stat->os_ffree; - used = stat->os_files - stat->os_ffree; - total = stat->os_files; - } else { - int shift = flags & MNTDF_COOKED ? 0 : 10; - - avail = (stat->os_bavail * stat->os_bsize) >> shift; - used = ((stat->os_blocks - stat->os_bfree) * - stat->os_bsize) >> shift; - total = (stat->os_blocks * stat->os_bsize) >> shift; - } - - if ((used + avail) > 0) - ratio = (double)used / (double)(used + avail); - - if (flags & MNTDF_COOKED) { - int i; - double cook_val; - - cook_val = (double)total; - i = COOK(cook_val); - if (i > 0) - snprintf(tbuf, sizeof(tbuf), HDF, cook_val, - suffix[i - 1]); - else - snprintf(tbuf, sizeof(tbuf), CDF, total); - - cook_val = (double)used; - i = COOK(cook_val); - if (i > 0) - snprintf(ubuf, sizeof(ubuf), HDF, cook_val, - suffix[i - 1]); - else - snprintf(ubuf, sizeof(ubuf), CDF, used); - - cook_val = (double)avail; - i = COOK(cook_val); - if (i > 0) - snprintf(abuf, sizeof(abuf), HDF, cook_val, - suffix[i - 1]); - else - snprintf(abuf, sizeof(abuf), CDF, avail); - } else { - snprintf(tbuf, sizeof(tbuf), CDF, total); - snprintf(ubuf, sizeof(tbuf), CDF, used); - snprintf(abuf, sizeof(tbuf), CDF, avail); - } - - sprintf(rbuf, RDF, (int)(ratio * 100 + 0.5)); - printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s", - uuid, tbuf, ubuf, abuf, rbuf, mntdir); - if (type) - printf("[%s:%d]", type, index); - - if (stat->os_state) { - /* - * Each character represents the matching - * OS_STATE_* bit. - */ - const char state_names[] = "DRSI"; - __u32 state; - __u32 i; - - printf(" "); - for (i = 0, state = stat->os_state; - state && i < sizeof(state_names); i++) { - if (!(state & (1 << i))) - continue; - printf("%c", state_names[i]); - state ^= 1 << i; - } - } - - printf("\n"); - break; - case -ENODATA: - printf(UUF": inactive device\n", uuid); - break; - default: - printf(UUF": %s\n", uuid, strerror(-rc)); - break; - } - - return 0; -} - -struct ll_stat_type { - int st_op; - char *st_name; -}; - -static int mntdf(char *mntdir, char *fsname, char *pool, enum mntdf_flags flags) -{ - struct obd_statfs stat_buf, sum = { .os_bsize = 1 }; - struct obd_uuid uuid_buf; - char *poolname = NULL; - struct ll_stat_type types[] = { - { .st_op = LL_STATFS_LMV, .st_name = "MDT" }, - { .st_op = LL_STATFS_LOV, .st_name = "OST" }, - { .st_name = NULL } }; - struct ll_stat_type *tp; - __u64 ost_ffree = 0; - __u32 index; - __u32 type; - int fd; - int rc = 0; - int rc2; - - if (pool) { - poolname = strchr(pool, '.'); - if (poolname != NULL) { - if (strncmp(fsname, pool, strlen(fsname))) { - fprintf(stderr, "filesystem name incorrect\n"); - return -ENODEV; - } - poolname++; - } else - poolname = pool; + return CMD_HELP; } - fd = open(mntdir, O_RDONLY); - if (fd < 0) { - rc = -errno; - fprintf(stderr, "%s: cannot open '%s': %s\n", progname, mntdir, - strerror(errno)); - return rc; + index = 1; + dname = argv[index]; + while (dname != NULL) { + result = llapi_direntry_remove(dname); + if (result) { + fprintf(stderr, "error: %s: remove dir entry '%s' " + "failed\n", argv[0], dname); + break; + } + dname = argv[++index]; } + return result; +} - if (flags & MNTDF_INODES) - printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", - "UUID", "Inodes", "IUsed", "IFree", - "IUse%", "Mounted on"); - else - printf(UUF" "CSF" "CSF" "CSF" "RSF" %-s\n", - "UUID", flags & MNTDF_COOKED ? "bytes" : "1K-blocks", - "Used", "Available", "Use%", "Mounted on"); - - for (tp = types; tp->st_name != NULL; tp++) { - for (index = 0; ; index++) { - memset(&stat_buf, 0, sizeof(struct obd_statfs)); - memset(&uuid_buf, 0, sizeof(struct obd_uuid)); - type = flags & MNTDF_LAZY ? - tp->st_op | LL_STATFS_NODELAY : tp->st_op; - rc2 = llapi_obd_fstatfs(fd, type, index, - &stat_buf, &uuid_buf); - if (rc2 == -ENODEV) - break; - if (rc2 == -EAGAIN) - continue; - if (rc2 == -ENODATA) { /* Inactive device, OK. */ - if (!(flags & MNTDF_VERBOSE)) - continue; - } else if (rc2 < 0 && rc == 0) { - rc = rc2; - } - - if (poolname && tp->st_op == LL_STATFS_LOV && - llapi_search_ost(fsname, poolname, - obd_uuid2str(&uuid_buf)) != 1) - continue; +static int lfs_mv(int argc, char **argv) +{ + struct lmv_user_md lmu = { LMV_USER_MAGIC }; + struct find_param param = { + .fp_max_depth = -1, + .fp_mdt_index = -1, + }; + char *end; + int c; + int rc = 0; + struct option long_opts[] = { + { .val = 'm', .name = "mdt", .has_arg = required_argument }, + { .val = 'm', .name = "mdt-index", .has_arg = required_argument }, + { .val = 'v', .name = "verbose", .has_arg = no_argument }, + { .name = NULL } }; - /* the llapi_obd_statfs() call may have returned with - * an error, but if it filled in uuid_buf we will at - * lease use that to print out a message for that OBD. - * If we didn't get anything in the uuid_buf, then fill - * it in so that we can print an error message. */ - if (uuid_buf.uuid[0] == '\0') - snprintf(uuid_buf.uuid, sizeof(uuid_buf.uuid), - "%s%04x", tp->st_name, index); - showdf(mntdir, &stat_buf, obd_uuid2str(&uuid_buf), - flags, tp->st_name, index, rc2); - - if (rc2 == 0) { - if (tp->st_op == LL_STATFS_LMV) { - sum.os_ffree += stat_buf.os_ffree; - sum.os_files += stat_buf.os_files; - } else /* if (tp->st_op == LL_STATFS_LOV) */ { - sum.os_blocks += stat_buf.os_blocks * - stat_buf.os_bsize; - sum.os_bfree += stat_buf.os_bfree * - stat_buf.os_bsize; - sum.os_bavail += stat_buf.os_bavail * - stat_buf.os_bsize; - ost_ffree += stat_buf.os_ffree; - } + while ((c = getopt_long(argc, argv, "m:M:v", long_opts, NULL)) != -1) { + switch (c) { +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 53, 0) + case 'M': + fprintf(stderr, "warning: '-M' deprecated" + ", use '--mdt-index' or '-m' instead\n"); +#endif + case 'm': + lmu.lum_stripe_offset = strtoul(optarg, &end, 0); + if (*end != '\0') { + fprintf(stderr, "%s mv: bad MDT index '%s'\n", + progname, optarg); + return CMD_HELP; } + break; + case 'v': + param.fp_verbose = VERBOSE_DETAIL; + break; + default: + fprintf(stderr, "%s mv: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; } } - close(fd); + if (lmu.lum_stripe_offset == -1) { + fprintf(stderr, "%s mv: MDT index must be specified\n", + progname); + return CMD_HELP; + } - /* If we don't have as many objects free on the OST as inodes - * on the MDS, we reduce the total number of inodes to - * compensate, so that the "inodes in use" number is correct. - * Matches ll_statfs_internal() so the results are consistent. */ - if (ost_ffree < sum.os_ffree) { - sum.os_files = (sum.os_files - sum.os_ffree) + ost_ffree; - sum.os_ffree = ost_ffree; + if (optind >= argc) { + fprintf(stderr, "%s mv: DIR must be specified\n", progname); + return CMD_HELP; } - printf("\n"); - showdf(mntdir, &sum, "filesystem_summary:", flags, NULL, 0, 0); - printf("\n"); + + /* initialize migrate mdt parameters */ + param.fp_lmv_md = &lmu; + param.fp_migrate = 1; + rc = llapi_migrate_mdt(argv[optind], ¶m); + if (rc != 0) + fprintf(stderr, "%s mv: cannot migrate '%s' to MDT%04x: %s\n", + progname, argv[optind], param.fp_mdt_index, + strerror(-rc)); return rc; } +static int lfs_osts(int argc, char **argv) +{ + return lfs_tgts(argc, argv); +} + +static int lfs_mdts(int argc, char **argv) +{ + return lfs_tgts(argc, argv); +} + static int lfs_df(int argc, char **argv) { char mntdir[PATH_MAX] = {'\0'}, path[PATH_MAX] = {'\0'}; - enum mntdf_flags flags = 0; + enum mntdf_flags flags = MNTDF_SHOW; + int ops = LL_STATFS_LMV | LL_STATFS_LOV; int c, rc = 0, index = 0; char fsname[PATH_MAX] = "", *pool_name = NULL; struct option long_opts[] = { @@ -4601,7 +5396,7 @@ static int lfs_df(int argc, char **argv) if (mntdir[0] == '\0') continue; - rc = mntdf(mntdir, fsname, pool_name, flags); + rc = mntdf(mntdir, fsname, pool_name, flags, ops, NULL); if (rc || path[0] != '\0') break; fsname[0] = '\0'; /* avoid matching in next loop */ @@ -4652,12 +5447,13 @@ static int lfs_getname(int argc, char **argv) static int lfs_check(int argc, char **argv) { - int rc; - char mntdir[PATH_MAX] = {'\0'}; - int num_types = 1; - char *obd_types[2]; - char obd_type1[4]; - char obd_type2[4]; + char mntdir[PATH_MAX] = {'\0'}; + int num_types = 1; + char *obd_types[3]; + char obd_type1[4]; + char obd_type2[4]; + char obd_type3[4]; + int rc; if (argc != 2) { fprintf(stderr, "%s check: server type must be specified\n", @@ -4665,17 +5461,23 @@ static int lfs_check(int argc, char **argv) return CMD_HELP; } - obd_types[0] = obd_type1; - obd_types[1] = obd_type2; - - if (strcmp(argv[1], "osts") == 0) { - strcpy(obd_types[0], "osc"); - } else if (strcmp(argv[1], "mds") == 0) { - strcpy(obd_types[0], "mdc"); - } else if (strcmp(argv[1], "servers") == 0) { - num_types = 2; - strcpy(obd_types[0], "osc"); - strcpy(obd_types[1], "mdc"); + obd_types[0] = obd_type1; + obd_types[1] = obd_type2; + obd_types[2] = obd_type3; + + if (strcmp(argv[1], "osts") == 0) { + strcpy(obd_types[0], "osc"); + } else if (strcmp(argv[1], "mdts") == 0 || + strcmp(argv[1], "mds") == 0) { + strcpy(obd_types[0], "mdc"); + } else if (strcmp(argv[1], "mgts") == 0) { + strcpy(obd_types[0], "mgc"); + } else if (strcmp(argv[1], "all") == 0 || + strcmp(argv[1], "servers") == 0) { + num_types = 3; + strcpy(obd_types[0], "osc"); + strcpy(obd_types[1], "mdc"); + strcpy(obd_types[2], "mgc"); } else { fprintf(stderr, "%s check: unrecognized option '%s'\n", progname, argv[1]); @@ -4868,6 +5670,12 @@ quota_type: return CMD_HELP; } + if ((dqb->dqb_valid | QIF_BTIME && dqi->dqi_bgrace >= UINT_MAX) || + (dqb->dqb_valid | QIF_ITIME && dqi->dqi_igrace >= UINT_MAX)) { + fprintf(stderr, "error: grace time is too large\n"); + return CMD_HELP; + } + mnt = argv[optind]; rc = llapi_quotactl(mnt, &qctl); if (rc) { @@ -4888,25 +5696,30 @@ quota_type: int lfs_setquota(int argc, char **argv) { - int c, rc; - struct if_quotactl qctl; - char *mnt, *obd_type = (char *)qctl.obd_type; - struct obd_dqblk *dqb = &qctl.qc_dqblk; - struct option long_opts[] = { + int c, rc = 0; + struct if_quotactl qctl; + char *mnt, *obd_type = (char *)qctl.obd_type; + struct obd_dqblk *dqb = &qctl.qc_dqblk; + struct option long_opts[] = { { .val = 'b', .name = "block-softlimit", .has_arg = required_argument }, { .val = 'B', .name = "block-hardlimit", .has_arg = required_argument }, + { .val = 'd', .name = "default", .has_arg = no_argument }, { .val = 'g', .name = "group", .has_arg = required_argument }, + { .val = 'G', .name = "default-grp", .has_arg = no_argument }, { .val = 'i', .name = "inode-softlimit", .has_arg = required_argument }, { .val = 'I', .name = "inode-hardlimit", .has_arg = required_argument }, { .val = 'p', .name = "projid", .has_arg = required_argument }, + { .val = 'P', .name = "default-prj", .has_arg = no_argument }, { .val = 'u', .name = "user", .has_arg = required_argument }, + { .val = 'U', .name = "default-usr", .has_arg = no_argument }, { .name = NULL } }; - unsigned limit_mask = 0; - char *endptr; + unsigned limit_mask = 0; + char *endptr; + bool use_default = false; int qtype; if (has_times_option(argc, argv)) @@ -4918,37 +5731,65 @@ int lfs_setquota(int argc, char **argv) * so it can be used as a marker that qc_type * isn't reinitialized from command line */ - while ((c = getopt_long(argc, argv, "b:B:g:i:I:p:u:", + while ((c = getopt_long(argc, argv, "b:B:dg:Gi:I:p:Pu:U", long_opts, NULL)) != -1) { switch (c) { + case 'U': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + qtype = USRQUOTA; + qctl.qc_id = 0; + goto quota_type_def; case 'u': qtype = USRQUOTA; rc = name2uid(&qctl.qc_id, optarg); goto quota_type; + case 'G': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + qtype = GRPQUOTA; + qctl.qc_id = 0; + goto quota_type_def; case 'g': qtype = GRPQUOTA; rc = name2gid(&qctl.qc_id, optarg); goto quota_type; + case 'P': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + qtype = PRJQUOTA; + qctl.qc_id = 0; + goto quota_type_def; case 'p': qtype = PRJQUOTA; rc = name2projid(&qctl.qc_id, optarg); quota_type: - if (qctl.qc_type != ALLQUOTA) { - fprintf(stderr, - "%s setquota: only one of -u, -g or -p may be specified\n", - progname); - return CMD_HELP; - } - qctl.qc_type = qtype; if (rc) { qctl.qc_id = strtoul(optarg, &endptr, 10); if (*endptr != '\0') { - fprintf(stderr, - "%s setquota: invalid id '%s'\n", - progname, optarg); + fprintf(stderr, "%s setquota: invalid" + " id '%s'\n", progname, optarg); return -1; } } + + if (qctl.qc_id == 0) { + fprintf(stderr, "%s setquota: can't set quota" + " for root usr/group/project.\n", + progname); + return -1; + } + +quota_type_def: + if (qctl.qc_type != ALLQUOTA) { + fprintf(stderr, + "%s setquota: only one of -u, -U, -g," + " -G, -p or -P may be specified\n", + progname); + return CMD_HELP; + } + qctl.qc_type = qtype; + break; + case 'd': + qctl.qc_cmd = LUSTRE_Q_SETDEFAULT; + use_default = true; break; case 'b': ARG2ULL(dqb->dqb_bsoftlimit, optarg, 1024); @@ -5011,13 +5852,29 @@ quota_type: return CMD_HELP; } - if (limit_mask == 0) { + if (!use_default && limit_mask == 0) { fprintf(stderr, "%s setquota: at least one limit must be specified\n", progname); return CMD_HELP; } + if (use_default && limit_mask != 0) { + fprintf(stderr, + "%s setquota: limits should not be specified when" + " using default quota\n", + progname); + return CMD_HELP; + } + + if (use_default && qctl.qc_id == 0) { + fprintf(stderr, + "%s setquota: can not set default quota for root" + " user/group/project\n", + progname); + return CMD_HELP; + } + if (optind != argc - 1) { fprintf(stderr, "%s setquota: filesystem not specified or unexpected argument '%s'\n", @@ -5027,42 +5884,50 @@ quota_type: mnt = argv[optind]; - if ((!(limit_mask & BHLIMIT) ^ !(limit_mask & BSLIMIT)) || - (!(limit_mask & IHLIMIT) ^ !(limit_mask & ISLIMIT))) { - /* sigh, we can't just set blimits/ilimits */ - struct if_quotactl tmp_qctl = {.qc_cmd = LUSTRE_Q_GETQUOTA, - .qc_type = qctl.qc_type, - .qc_id = qctl.qc_id}; - - rc = llapi_quotactl(mnt, &tmp_qctl); + if (use_default) { + dqb->dqb_bhardlimit = 0; + dqb->dqb_bsoftlimit = 0; + dqb->dqb_ihardlimit = 0; + dqb->dqb_isoftlimit = 0; + dqb->dqb_itime = 0; + dqb->dqb_btime = 0; + dqb->dqb_valid |= QIF_LIMITS | QIF_TIMES; + } else if ((!(limit_mask & BHLIMIT) ^ !(limit_mask & BSLIMIT)) || + (!(limit_mask & IHLIMIT) ^ !(limit_mask & ISLIMIT))) { + /* sigh, we can't just set blimits/ilimits */ + struct if_quotactl tmp_qctl = {.qc_cmd = LUSTRE_Q_GETQUOTA, + .qc_type = qctl.qc_type, + .qc_id = qctl.qc_id}; + + rc = llapi_quotactl(mnt, &tmp_qctl); if (rc < 0) return rc; - if (!(limit_mask & BHLIMIT)) - dqb->dqb_bhardlimit = tmp_qctl.qc_dqblk.dqb_bhardlimit; - if (!(limit_mask & BSLIMIT)) - dqb->dqb_bsoftlimit = tmp_qctl.qc_dqblk.dqb_bsoftlimit; - if (!(limit_mask & IHLIMIT)) - dqb->dqb_ihardlimit = tmp_qctl.qc_dqblk.dqb_ihardlimit; - if (!(limit_mask & ISLIMIT)) - dqb->dqb_isoftlimit = tmp_qctl.qc_dqblk.dqb_isoftlimit; - - /* Keep grace times if we have got no softlimit arguments */ - if ((limit_mask & BHLIMIT) && !(limit_mask & BSLIMIT)) { - dqb->dqb_valid |= QIF_BTIME; - dqb->dqb_btime = tmp_qctl.qc_dqblk.dqb_btime; - } + if (!(limit_mask & BHLIMIT)) + dqb->dqb_bhardlimit = tmp_qctl.qc_dqblk.dqb_bhardlimit; + if (!(limit_mask & BSLIMIT)) + dqb->dqb_bsoftlimit = tmp_qctl.qc_dqblk.dqb_bsoftlimit; + if (!(limit_mask & IHLIMIT)) + dqb->dqb_ihardlimit = tmp_qctl.qc_dqblk.dqb_ihardlimit; + if (!(limit_mask & ISLIMIT)) + dqb->dqb_isoftlimit = tmp_qctl.qc_dqblk.dqb_isoftlimit; + + /* Keep grace times if we have got no softlimit arguments */ + if ((limit_mask & BHLIMIT) && !(limit_mask & BSLIMIT)) { + dqb->dqb_valid |= QIF_BTIME; + dqb->dqb_btime = tmp_qctl.qc_dqblk.dqb_btime; + } - if ((limit_mask & IHLIMIT) && !(limit_mask & ISLIMIT)) { - dqb->dqb_valid |= QIF_ITIME; - dqb->dqb_itime = tmp_qctl.qc_dqblk.dqb_itime; - } - } + if ((limit_mask & IHLIMIT) && !(limit_mask & ISLIMIT)) { + dqb->dqb_valid |= QIF_ITIME; + dqb->dqb_itime = tmp_qctl.qc_dqblk.dqb_itime; + } + } - dqb->dqb_valid |= (limit_mask & (BHLIMIT | BSLIMIT)) ? QIF_BLIMITS : 0; - dqb->dqb_valid |= (limit_mask & (IHLIMIT | ISLIMIT)) ? QIF_ILIMITS : 0; + dqb->dqb_valid |= (limit_mask & (BHLIMIT | BSLIMIT)) ? QIF_BLIMITS : 0; + dqb->dqb_valid |= (limit_mask & (IHLIMIT | ISLIMIT)) ? QIF_ILIMITS : 0; - rc = llapi_quotactl(mnt, &qctl); + rc = llapi_quotactl(mnt, &qctl); if (rc) { if (*obd_type) fprintf(stderr, @@ -5131,15 +5996,22 @@ static void diff2str(time_t seconds, char *buf, time_t now) } static void print_quota_title(char *name, struct if_quotactl *qctl, - bool human_readable) + bool human_readable, bool show_default) { - printf("Disk quotas for %s %s (%cid %u):\n", - qtype_name(qctl->qc_type), name, - *qtype_name(qctl->qc_type), qctl->qc_id); - printf("%15s%8s %7s%8s%8s%8s %7s%8s%8s\n", - "Filesystem", human_readable ? "used" : "kbytes", - "quota", "limit", "grace", - "files", "quota", "limit", "grace"); + if (show_default) { + printf("Disk default %s quota:\n", qtype_name(qctl->qc_type)); + printf("%15s %8s%8s%8s %8s%8s%8s\n", + "Filesystem", "bquota", "blimit", "bgrace", + "iquota", "ilimit", "igrace"); + } else { + printf("Disk quotas for %s %s (%cid %u):\n", + qtype_name(qctl->qc_type), name, + *qtype_name(qctl->qc_type), qctl->qc_id); + printf("%15s%8s %7s%8s%8s%8s %7s%8s%8s\n", + "Filesystem", human_readable ? "used" : "kbytes", + "quota", "limit", "grace", + "files", "quota", "limit", "grace"); + } } static void kbytes2str(__u64 num, char *buf, int buflen, bool h) @@ -5166,20 +6038,21 @@ static void kbytes2str(__u64 num, char *buf, int buflen, bool h) #define STRBUF_LEN 32 static void print_quota(char *mnt, struct if_quotactl *qctl, int type, - int rc, bool h) + int rc, bool h, bool show_default) { - time_t now; + time_t now; - time(&now); + time(&now); - if (qctl->qc_cmd == LUSTRE_Q_GETQUOTA || qctl->qc_cmd == Q_GETOQUOTA) { + if (qctl->qc_cmd == LUSTRE_Q_GETQUOTA || qctl->qc_cmd == Q_GETOQUOTA || + qctl->qc_cmd == LUSTRE_Q_GETDEFAULT) { int bover = 0, iover = 0; struct obd_dqblk *dqb = &qctl->qc_dqblk; char numbuf[3][STRBUF_LEN]; char timebuf[40]; char strbuf[STRBUF_LEN]; - if (dqb->dqb_bhardlimit && + if (dqb->dqb_bhardlimit && lustre_stoqb(dqb->dqb_curspace) >= dqb->dqb_bhardlimit) { bover = 1; } else if (dqb->dqb_bsoftlimit && dqb->dqb_btime) { @@ -5209,6 +6082,9 @@ static void print_quota(char *mnt, struct if_quotactl *qctl, int type, if (bover) diff2str(dqb->dqb_btime, timebuf, now); + else if (show_default) + snprintf(timebuf, sizeof(timebuf), "%llu", + dqb->dqb_btime); kbytes2str(lustre_stoqb(dqb->dqb_curspace), strbuf, sizeof(strbuf), h); @@ -5229,15 +6105,23 @@ static void print_quota(char *mnt, struct if_quotactl *qctl, int type, sprintf(numbuf[2], (dqb->dqb_valid & QIF_BLIMITS) ? "%s" : "[%s]", strbuf); - printf(" %7s%c %6s %7s %7s", - numbuf[0], bover ? '*' : ' ', numbuf[1], - numbuf[2], bover > 1 ? timebuf : "-"); + if (show_default) + printf(" %6s %7s %7s", numbuf[1], numbuf[2], timebuf); + else + printf(" %7s%c %6s %7s %7s", + numbuf[0], bover ? '*' : ' ', numbuf[1], + numbuf[2], bover > 1 ? timebuf : "-"); + if (iover) diff2str(dqb->dqb_itime, timebuf, now); + else if (show_default) + snprintf(timebuf, sizeof(timebuf), "%llu", + dqb->dqb_itime); - sprintf(numbuf[0], (dqb->dqb_valid & QIF_INODES) ? - "%ju" : "[%ju]", (uintmax_t)dqb->dqb_curinodes); + snprintf(numbuf[0], sizeof(numbuf), + (dqb->dqb_valid & QIF_INODES) ? "%ju" : "[%ju]", + (uintmax_t)dqb->dqb_curinodes); if (type == QC_GENERAL) sprintf(numbuf[1], (dqb->dqb_valid & QIF_ILIMITS) ? @@ -5249,7 +6133,9 @@ static void print_quota(char *mnt, struct if_quotactl *qctl, int type, sprintf(numbuf[2], (dqb->dqb_valid & QIF_ILIMITS) ? "%ju" : "[%ju]", (uintmax_t)dqb->dqb_ihardlimit); - if (type != QC_OSTIDX) + if (show_default) + printf(" %6s %7s %7s", numbuf[1], numbuf[2], timebuf); + else if (type != QC_OSTIDX) printf(" %7s%c %6s %7s %7s", numbuf[0], iover ? '*' : ' ', numbuf[1], numbuf[2], iover > 1 ? timebuf : "-"); @@ -5300,7 +6186,7 @@ static int print_obd_quota(char *mnt, struct if_quotactl *qctl, int is_mdt, } print_quota(obd_uuid2str(&qctl->obd_uuid), qctl, - qctl->qc_valid, 0, h); + qctl->qc_valid, 0, h, false); *total += is_mdt ? qctl->qc_dqblk.dqb_ihardlimit : qctl->qc_dqblk.dqb_bhardlimit; } @@ -5310,12 +6196,15 @@ out: } static int get_print_quota(char *mnt, char *name, struct if_quotactl *qctl, - int verbose, int quiet, bool human_readable) + int verbose, int quiet, bool human_readable, + bool show_default) { int rc1 = 0, rc2 = 0, rc3 = 0; char *obd_type = (char *)qctl->obd_type; char *obd_uuid = (char *)qctl->obd_uuid.uuid; __u64 total_ialloc = 0, total_balloc = 0; + bool use_default_for_blk = false; + bool use_default_for_file = false; int inacc; rc1 = llapi_quotactl(mnt, qctl); @@ -5337,8 +6226,31 @@ static int get_print_quota(char *mnt, char *name, struct if_quotactl *qctl, } } - if (qctl->qc_cmd == LUSTRE_Q_GETQUOTA && !quiet) - print_quota_title(name, qctl, human_readable); + if (!show_default && qctl->qc_id == 0) { + qctl->qc_dqblk.dqb_bhardlimit = 0; + qctl->qc_dqblk.dqb_bsoftlimit = 0; + qctl->qc_dqblk.dqb_ihardlimit = 0; + qctl->qc_dqblk.dqb_isoftlimit = 0; + qctl->qc_dqblk.dqb_btime = 0; + qctl->qc_dqblk.dqb_itime = 0; + qctl->qc_dqblk.dqb_valid |= QIF_LIMITS | QIF_TIMES; + } + + if (qctl->qc_dqblk.dqb_valid & QIF_BTIME && + LQUOTA_FLAG(qctl->qc_dqblk.dqb_btime) & LQUOTA_FLAG_DEFAULT) { + use_default_for_blk = true; + qctl->qc_dqblk.dqb_btime &= LQUOTA_GRACE_MASK; + } + + if (qctl->qc_dqblk.dqb_valid & QIF_ITIME && + LQUOTA_FLAG(qctl->qc_dqblk.dqb_itime) & LQUOTA_FLAG_DEFAULT) { + use_default_for_file = true; + qctl->qc_dqblk.dqb_itime &= LQUOTA_GRACE_MASK; + } + + if ((qctl->qc_cmd == LUSTRE_Q_GETQUOTA || + qctl->qc_cmd == LUSTRE_Q_GETDEFAULT) && !quiet) + print_quota_title(name, qctl, human_readable, show_default); if (rc1 && *obd_type) fprintf(stderr, "%s %s ", obd_type, obd_uuid); @@ -5350,10 +6262,10 @@ static int get_print_quota(char *mnt, char *name, struct if_quotactl *qctl, ((qctl->qc_dqblk.dqb_valid & (QIF_LIMITS|QIF_USAGE)) != (QIF_LIMITS|QIF_USAGE)); - print_quota(mnt, qctl, QC_GENERAL, rc1, human_readable); + print_quota(mnt, qctl, QC_GENERAL, rc1, human_readable, show_default); - if (qctl->qc_valid == QC_GENERAL && qctl->qc_cmd != LUSTRE_Q_GETINFO && - verbose) { + if (!show_default && verbose && + qctl->qc_valid == QC_GENERAL && qctl->qc_cmd != LUSTRE_Q_GETINFO) { char strbuf[STRBUF_LEN]; rc2 = print_obd_quota(mnt, qctl, 1, human_readable, @@ -5367,6 +6279,14 @@ static int get_print_quota(char *mnt, char *name, struct if_quotactl *qctl, strbuf); } + if (use_default_for_blk) + printf("%cid %u is using default block quota setting\n", + *qtype_name(qctl->qc_type), qctl->qc_id); + + if (use_default_for_file) + printf("%cid %u is using default file quota setting\n", + *qtype_name(qctl->qc_type), qctl->qc_id); + if (rc1 || rc2 || rc3 || inacc) printf("Some errors happened when getting quota info. " "Some devices may be not working or deactivated. " @@ -5541,16 +6461,23 @@ static int lfs_quota(int argc, char **argv) char *endptr; __u32 valid = QC_GENERAL, idx = 0; bool human_readable = false; + bool show_default = false; int qtype; - while ((c = getopt(argc, argv, "gi:I:o:pqtuvh")) != -1) { + while ((c = getopt(argc, argv, "gGi:I:o:pPqtuUvh")) != -1) { switch (c) { + case 'U': + show_default = true; case 'u': qtype = USRQUOTA; goto quota_type; + case 'G': + show_default = true; case 'g': qtype = GRPQUOTA; goto quota_type; + case 'P': + show_default = true; case 'p': qtype = PRJQUOTA; quota_type: @@ -5567,7 +6494,7 @@ quota_type: break; case 'o': valid = qctl.qc_valid = QC_UUID; - strlcpy(obd_uuid, optarg, sizeof(qctl.obd_uuid)); + snprintf(obd_uuid, sizeof(qctl.obd_uuid), "%s", optarg); break; case 'i': valid = qctl.qc_valid = QC_MDTIDX; @@ -5607,7 +6534,7 @@ quota_type: /* current uid/gid info for "lfs quota /path/to/lustre/mount" */ if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA && qctl.qc_type == ALLQUOTA && - optind == argc - 1) { + optind == argc - 1 && !show_default) { qctl.qc_cmd = LUSTRE_Q_GETQUOTA; qctl.qc_valid = valid; @@ -5626,35 +6553,45 @@ quota_type: name = ""; mnt = argv[optind]; rc1 = get_print_quota(mnt, name, &qctl, verbose, quiet, - human_readable); + human_readable, show_default); if (rc1 && !rc) rc = rc1; } + return rc; /* lfs quota -u username /path/to/lustre/mount */ } else if (qctl.qc_cmd == LUSTRE_Q_GETQUOTA) { /* options should be followed by u/g-name and mntpoint */ - if (optind + 2 != argc || qctl.qc_type == ALLQUOTA) { + if ((!show_default && optind + 2 != argc) || + (show_default && optind + 1 != argc) || + qctl.qc_type == ALLQUOTA) { fprintf(stderr, "%s quota: name and mount point must be specified\n", progname); return CMD_HELP; } - name = argv[optind++]; - switch (qctl.qc_type) { - case USRQUOTA: - rc = name2uid(&qctl.qc_id, name); - break; - case GRPQUOTA: - rc = name2gid(&qctl.qc_id, name); - break; - case PRJQUOTA: - rc = name2projid(&qctl.qc_id, name); - break; - default: - rc = -ENOTSUP; - break; + if (!show_default) { + name = argv[optind++]; + switch (qctl.qc_type) { + case USRQUOTA: + rc = name2uid(&qctl.qc_id, name); + break; + case GRPQUOTA: + rc = name2gid(&qctl.qc_id, name); + break; + case PRJQUOTA: + rc = name2projid(&qctl.qc_id, name); + break; + default: + rc = -ENOTSUP; + break; + } + } else { + qctl.qc_valid = QC_GENERAL; + qctl.qc_cmd = LUSTRE_Q_GETDEFAULT; + qctl.qc_id = 0; } + if (rc) { qctl.qc_id = strtoul(name, &endptr, 10); if (*endptr != '\0') { @@ -5663,15 +6600,15 @@ quota_type: return CMD_HELP; } } - mnt = argv[optind]; - rc = get_print_quota(mnt, name, &qctl, verbose, quiet, - human_readable); } else if (optind + 1 != argc || qctl.qc_type == ALLQUOTA) { fprintf(stderr, "%s quota: missing quota info argument(s)\n", progname); return CMD_HELP; } + mnt = argv[optind]; + rc = get_print_quota(mnt, name, &qctl, verbose, quiet, + human_readable, show_default); return rc; } #endif /* HAVE_SYS_QUOTA_H! */ @@ -5776,16 +6713,18 @@ static int lfs_changelog(int argc, char **argv) case 'f': follow++; break; - case '?': - return CMD_HELP; default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); + fprintf(stderr, + "%s changelog: unrecognized option '%s'\n", + progname, argv[optind - 1]); return CMD_HELP; } } - if (optind >= argc) - return CMD_HELP; + if (optind >= argc) { + fprintf(stderr, "%s changelog: mdtname must be specified\n", + progname); + return CMD_HELP; + } mdd = argv[optind++]; if (argc > optind) @@ -5800,18 +6739,20 @@ static int lfs_changelog(int argc, char **argv) (follow ? CHANGELOG_FLAG_FOLLOW : 0), mdd, startrec); if (rc < 0) { - fprintf(stderr, "Can't start changelog: %s\n", - strerror(errno = -rc)); + fprintf(stderr, "%s changelog: cannot start changelog: %s\n", + progname, strerror(errno = -rc)); return rc; } rc = llapi_changelog_set_xflags(changelog_priv, CHANGELOG_EXTRA_FLAG_UIDGID | CHANGELOG_EXTRA_FLAG_NID | - CHANGELOG_EXTRA_FLAG_OMODE); + CHANGELOG_EXTRA_FLAG_OMODE | + CHANGELOG_EXTRA_FLAG_XATTR); if (rc < 0) { - fprintf(stderr, "Can't set xflags for changelog: %s\n", - strerror(errno = -rc)); + fprintf(stderr, + "%s changelog: cannot set xflags for changelog: %s\n", + progname, strerror(errno = -rc)); return rc; } @@ -5876,10 +6817,10 @@ static int lfs_changelog(int argc, char **argv) if (omd->cr_openflags & MDS_FMODE_EXEC) { mode[2] = 'x'; } else { - if (omd->cr_openflags & FMODE_READ) + if (omd->cr_openflags & MDS_FMODE_READ) mode[0] = 'r'; if (omd->cr_openflags & - (FMODE_WRITE | + (MDS_FMODE_WRITE | MDS_OPEN_TRUNC | MDS_OPEN_APPEND)) mode[1] = 'w'; @@ -5889,6 +6830,14 @@ static int lfs_changelog(int argc, char **argv) printf(" m=%s", mode); } + + if (ef->cr_extra_flags & CLFE_XATTR) { + struct changelog_ext_xattr *xattr = + changelog_rec_xattr(rec); + + if (xattr->cr_xattr[0] != '\0') + printf(" x=%s", xattr->cr_xattr); + } } if (rec->cr_namelen) @@ -5909,14 +6858,15 @@ static int lfs_changelog(int argc, char **argv) printf("\n"); llapi_changelog_free(&rec); - } + } - llapi_changelog_fini(&changelog_priv); + llapi_changelog_fini(&changelog_priv); - if (rc < 0) - fprintf(stderr, "Changelog: %s\n", strerror(errno = -rc)); + if (rc < 0) + fprintf(stderr, "%s changelog: cannot access changelog: %s\n", + progname, strerror(errno = -rc)); - return (rc == 1 ? 0 : rc); + return (rc == 1 ? 0 : rc); } static int lfs_changelog_clear(int argc, char **argv) @@ -5961,36 +6911,55 @@ static int lfs_fid2path(int argc, char **argv) int lnktmp; int printcur = 0; int rc = 0; + char *endptr = NULL; while ((rc = getopt_long(argc, argv, short_opts, long_opts, NULL)) != -1) { - switch (rc) { - case 'c': - printcur++; - break; - case 'l': - linkno = strtol(optarg, NULL, 10); - break; - case 'r': - recno = strtoll(optarg, NULL, 10); - break; - case '?': - return CMD_HELP; - default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); - return CMD_HELP; - } - } + switch (rc) { + case 'c': + printcur++; + break; + case 'l': + linkno = strtol(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, + "%s fid2path: invalid linkno '%s'\n", + progname, optarg); + return CMD_HELP; + } + break; + case 'r': + recno = strtoll(optarg, &endptr, 10); + if (*endptr != '\0') { + fprintf(stderr, + "%s fid2path: invalid recno '%s'\n", + progname, optarg); + return CMD_HELP; + } + break; + default: + fprintf(stderr, + "%s fid2path: unrecognized option '%s'\n", + progname, argv[optind - 1]); + return CMD_HELP; + } + } - if (argc < 3) + if (argc < 3) { + fprintf(stderr, + "%s fid2path: and ... must be specified\n", + progname); return CMD_HELP; + } device = argv[optind++]; path = calloc(1, PATH_MAX); if (path == NULL) { - fprintf(stderr, "error: Not enough memory\n"); - return -errno; + rc = -errno; + fprintf(stderr, + "%s fid2path: cannot allocate memory for path: %s\n", + progname, strerror(-rc)); + return rc; } rc = 0; @@ -6005,8 +6974,9 @@ static int lfs_fid2path(int argc, char **argv) rc2 = llapi_fid2path(device, fid, path, PATH_MAX, &rectmp, &lnktmp); if (rc2 < 0) { - fprintf(stderr, "%s: error on FID %s: %s\n", - argv[0], fid, strerror(errno = -rc2)); + fprintf(stderr, + "%s fid2path: cannot find '%s': %s\n", + progname, fid, strerror(errno = -rc2)); if (rc == 0) rc = rc2; break; @@ -6055,14 +7025,18 @@ static int lfs_path2fid(int argc, char **argv) show_parents = true; break; default: - fprintf(stderr, "error: %s: option '%s' unrecognized\n", - argv[0], argv[optind - 1]); + fprintf(stderr, + "%s path2fid: unrecognized option '%s'\n", + progname, argv[optind - 1]); return CMD_HELP; } } - if (optind > argc - 1) + if (optind > argc - 1) { + fprintf(stderr, "%s path2fid: FILE... must be specified\n", + progname); return CMD_HELP; + } else if (optind < argc - 1) sep = ": "; @@ -6097,8 +7071,9 @@ static int lfs_path2fid(int argc, char **argv) } if (err) { - fprintf(stderr, "%s: can't get %sfid for %s: %s\n", - argv[0], show_parents ? "parent " : "", *path, + fprintf(stderr, + "%s path2fid: cannot get %sfid for '%s': %s\n", + progname, show_parents ? "parent " : "", *path, strerror(-err)); if (rc == 0) { rc = err; @@ -6119,8 +7094,11 @@ static int lfs_data_version(int argc, char **argv) int c; int data_version_flags = LL_DV_RD_FLUSH; /* Read by default */ - if (argc < 2) + if (argc < 2) { + fprintf(stderr, "%s data_version: FILE must be specified\n", + progname); return CMD_HELP; + } while ((c = getopt(argc, argv, "nrw")) != -1) { switch (c) { @@ -6134,20 +7112,32 @@ static int lfs_data_version(int argc, char **argv) data_version_flags |= LL_DV_WR_FLUSH; break; default: + fprintf(stderr, + "%s data_version: unrecognized option '%s'\n", + progname, argv[optind - 1]); return CMD_HELP; } } - if (optind == argc) + if (optind == argc) { + fprintf(stderr, "%s data_version: FILE must be specified\n", + progname); return CMD_HELP; + } path = argv[optind]; fd = open(path, O_RDONLY); - if (fd < 0) - err(errno, "cannot open file %s", path); + if (fd < 0) { + rc = -errno; + fprintf(stderr, "%s data_version: cannot open file '%s': %s\n", + progname, path, strerror(-rc)); + return rc; + } rc = llapi_get_data_version(fd, &data_version, data_version_flags); if (rc < 0) - err(errno, "cannot get version for %s", path); + fprintf(stderr, + "%s data_version: cannot get version for '%s': %s\n", + progname, path, strerror(-rc)); else printf("%ju" "\n", (uintmax_t)data_version); @@ -7068,9 +8058,9 @@ int verify_mirror_ids(const char *fname, __u16 *mirror_ids, int ids_nr) goto error; } - rc = llapi_lease_get(fd, LL_LEASE_RDLCK); + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); if (rc < 0) { - fprintf(stderr, "%s: '%s' llapi_lease_get failed: %s.\n", + fprintf(stderr, "%s: '%s' llapi_lease_acquire failed: %s.\n", progname, fname, strerror(errno)); goto close_fd; } @@ -7080,7 +8070,7 @@ int verify_mirror_ids(const char *fname, __u16 *mirror_ids, int ids_nr) fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", progname, fname, strerror(errno)); rc = -errno; - llapi_lease_put(fd); + llapi_lease_release(fd); goto close_fd; } @@ -7094,10 +8084,10 @@ int verify_mirror_ids(const char *fname, __u16 *mirror_ids, int ids_nr) flr_state &= LCM_FL_FLR_MASK; switch (flr_state) { - case LCM_FL_NOT_FLR: + case LCM_FL_NONE: rc = -EINVAL; fprintf(stderr, "%s: '%s' file state error: %s.\n", - progname, fname, lcm_flags_string(flr_state)); + progname, fname, llapi_layout_flags_string(flr_state)); goto free_layout; default: break; @@ -7129,7 +8119,7 @@ int verify_mirror_ids(const char *fname, __u16 *mirror_ids, int ids_nr) free_layout: llapi_layout_free(layout); - llapi_lease_put(fd); + llapi_lease_release(fd); close_fd: close(fd); error: @@ -7144,6 +8134,8 @@ int lfs_mirror_resync_file(const char *fname, struct ll_ioc_lease *ioc, struct llapi_layout *layout; struct stat stbuf; uint32_t flr_state; + uint64_t start; + uint64_t end; int comp_size = 0; int idx; int fd; @@ -7170,205 +8162,606 @@ int lfs_mirror_resync_file(const char *fname, struct ll_ioc_lease *ioc, goto error; } + layout = llapi_layout_get_by_fd(fd, 0); + if (layout == NULL) { + fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto close_fd; + } + + rc = llapi_layout_flags_get(layout, &flr_state); + if (rc) { + fprintf(stderr, "%s: '%s' llapi_layout_flags_get failed: %s.\n", + progname, fname, strerror(errno)); + rc = -errno; + goto free_layout; + } + + flr_state &= LCM_FL_FLR_MASK; + if (flr_state == LCM_FL_NONE) { + rc = -EINVAL; + fprintf(stderr, "%s: '%s' is not a FLR file.\n", + progname, fname); + goto free_layout; + } + + /* get stale component info */ + comp_size = llapi_mirror_find_stale(layout, comp_array, + ARRAY_SIZE(comp_array), + mirror_ids, ids_nr); + if (comp_size <= 0) { + rc = comp_size; + goto free_layout; + } + ioc->lil_mode = LL_LEASE_WRLCK; ioc->lil_flags = LL_LEASE_RESYNC; rc = llapi_lease_set(fd, ioc); if (rc < 0) { - fprintf(stderr, - "%s: '%s' llapi_lease_set resync failed: %s.\n", + if (rc == -EALREADY) + rc = 0; + else + fprintf(stderr, + "%s: '%s' llapi_lease_get_ext resync failed: %s.\n", + progname, fname, strerror(errno)); + goto free_layout; + } + + /* get the read range [start, end) */ + start = comp_array[0].lrc_start; + end = comp_array[0].lrc_end; + for (idx = 1; idx < comp_size; idx++) { + if (comp_array[idx].lrc_start < start) + start = comp_array[idx].lrc_start; + if (end < comp_array[idx].lrc_end) + end = comp_array[idx].lrc_end; + } + + rc = llapi_lease_check(fd); + if (rc != LL_LEASE_WRLCK) { + fprintf(stderr, "%s: '%s' lost lease lock.\n", + progname, fname); + goto free_layout; + } + + rc = llapi_mirror_resync_many(fd, layout, comp_array, comp_size, + start, end); + if (rc < 0) + fprintf(stderr, "%s: '%s' llapi_mirror_resync_many: %d.\n", + progname, fname, rc); + + /* prepare ioc for lease put */ + ioc->lil_mode = LL_LEASE_UNLCK; + ioc->lil_flags = LL_LEASE_RESYNC_DONE; + ioc->lil_count = 0; + for (idx = 0; idx < comp_size; idx++) { + if (comp_array[idx].lrc_synced) { + ioc->lil_ids[ioc->lil_count] = comp_array[idx].lrc_id; + ioc->lil_count++; + } + } + + rc = llapi_lease_set(fd, ioc); + if (rc <= 0) { + if (rc == 0) /* lost lease lock */ + rc = -EBUSY; + fprintf(stderr, "%s: resync file '%s' failed: %s.\n", progname, fname, strerror(errno)); - goto close_fd; + goto free_layout; + } + /** + * llapi_lease_set returns lease mode when it request to unlock + * the lease lock + */ + rc = 0; + +free_layout: + llapi_layout_free(layout); +close_fd: + close(fd); +error: + return rc; +} + +static inline int lfs_mirror_resync(int argc, char **argv) +{ + struct ll_ioc_lease *ioc = NULL; + __u16 mirror_ids[128] = { 0 }; + int ids_nr = 0; + int c; + int rc = 0; + + struct option long_opts[] = { + { .val = 'o', .name = "only", .has_arg = required_argument }, + { .name = NULL } }; + + while ((c = getopt_long(argc, argv, "o:", long_opts, NULL)) >= 0) { + switch (c) { + case 'o': + rc = parse_mirror_ids(mirror_ids, + sizeof(mirror_ids) / sizeof(__u16), + optarg); + if (rc < 0) { + fprintf(stderr, + "%s: bad mirror ids '%s'.\n", + argv[0], optarg); + goto error; + } + ids_nr = rc; + break; + default: + fprintf(stderr, "%s: options '%s' unrecognized.\n", + argv[0], argv[optind - 1]); + rc = -EINVAL; + goto error; + } + } + + if (argc == optind) { + fprintf(stderr, "%s: no file name given.\n", argv[0]); + rc = CMD_HELP; + goto error; + } + + if (ids_nr > 0 && argc > optind + 1) { + fprintf(stderr, + "%s: option '--only' cannot be used upon multiple files.\n", + argv[0]); + rc = CMD_HELP; + goto error; + + } + + if (ids_nr > 0) { + rc = verify_mirror_ids(argv[optind], mirror_ids, ids_nr); + if (rc < 0) + goto error; + } + + /* set the lease on the file */ + ioc = calloc(sizeof(*ioc) + sizeof(__u32) * 4096, 1); + if (ioc == NULL) { + fprintf(stderr, "%s: cannot alloc id array for ioc: %s.\n", + argv[0], strerror(errno)); + rc = -errno; + goto error; + } + + for (; optind < argc; optind++) { + rc = lfs_mirror_resync_file(argv[optind], ioc, + mirror_ids, ids_nr); + /* ignore previous file's error, continue with next file */ + + /* reset ioc */ + memset(ioc, 0, sizeof(*ioc) + sizeof(__u32) * 4096); + } + + free(ioc); +error: + return rc; +} + +static inline int verify_mirror_id_by_fd(int fd, __u16 mirror_id) +{ + struct llapi_layout *layout; + int rc; + + layout = llapi_layout_get_by_fd(fd, 0); + if (layout == NULL) { + fprintf(stderr, "could not get layout.\n"); + return -EINVAL; + } + + rc = llapi_layout_comp_iterate(layout, find_mirror_id, &mirror_id); + if (rc < 0) { + fprintf(stderr, "failed to iterate layout\n"); + llapi_layout_free(layout); + + return rc; + } else if (rc == LLAPI_LAYOUT_ITER_CONT) { + fprintf(stderr, "does not find mirror with ID %u\n", mirror_id); + llapi_layout_free(layout); + + return -EINVAL; + } + llapi_layout_free(layout); + + return 0; +} + +/** + * Check whether two files are the same file + * \retval 0 same file + * \retval 1 not the same file + * \retval <0 error code + */ +static inline int check_same_file(const char *f1, const char *f2) +{ + struct stat stbuf1; + struct stat stbuf2; + + if (stat(f1, &stbuf1) < 0) { + fprintf(stderr, "%s: cannot stat file '%s': %s\n", + progname, f1, strerror(errno)); + return -errno; + } + + if (stat(f2, &stbuf2) < 0) { + fprintf(stderr, "%s: cannot stat file '%s': %s\n", + progname, f2, strerror(errno)); + return -errno; + } + + if (stbuf1.st_rdev == stbuf2.st_rdev && + stbuf1.st_ino == stbuf2.st_ino) + return 0; + + return 1; +} + +static inline int lfs_mirror_read(int argc, char **argv) +{ + int rc = CMD_HELP; + __u16 mirror_id = 0; + const char *outfile = NULL; + char *fname; + int fd = 0; + int outfd; + int c; + void *buf; + const size_t buflen = 4 << 20; + off_t pos; + struct option long_opts[] = { + { .val = 'N', .name = "mirror-id", .has_arg = required_argument }, + { .val = 'o', .name = "outfile", .has_arg = required_argument }, + { .name = NULL } }; + + while ((c = getopt_long(argc, argv, "N:o:", long_opts, NULL)) >= 0) { + char *end; + + switch (c) { + case 'N': + mirror_id = strtoul(optarg, &end, 0); + if (*end != '\0' || mirror_id == 0) { + fprintf(stderr, + "%s %s: invalid mirror ID '%s'\n", + progname, argv[0], optarg); + return rc; + } + break; + case 'o': + outfile = optarg; + break; + default: + fprintf(stderr, "%s: option '%s' unrecognized.\n", + progname, argv[optind - 1]); + return -EINVAL; + } + } + + if (argc == optind) { + fprintf(stderr, "%s %s: no mirrored file provided\n", + progname, argv[0]); + return rc; + } else if (argc > optind + 1) { + fprintf(stderr, "%s %s: too many files\n", progname, argv[0]); + return rc; + } + + if (mirror_id == 0) { + fprintf(stderr, "%s %s: no valid mirror ID is provided\n", + progname, argv[0]); + return rc; + } + + /* open mirror file */ + fname = argv[optind]; + + if (outfile) { + rc = check_same_file(fname, outfile); + if (rc == 0) { + fprintf(stderr, + "%s %s: output file cannot be the mirrored file\n", + progname, argv[0]); + return -EINVAL; + } + if (rc < 0) + return rc; } - layout = llapi_layout_get_by_fd(fd, 0); - if (layout == NULL) { - fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", - progname, fname, strerror(errno)); - rc = -errno; - goto close_fd; + fd = open(fname, O_DIRECT | O_RDONLY); + if (fd < 0) { + fprintf(stderr, "%s %s: cannot open '%s': %s\n", + progname, argv[0], fname, strerror(errno)); + return rc; } - rc = llapi_layout_flags_get(layout, &flr_state); + /* verify mirror id */ + rc = verify_mirror_id_by_fd(fd, mirror_id); if (rc) { - fprintf(stderr, "%s: '%s' llapi_layout_flags_get failed: %s.\n", - progname, fname, strerror(errno)); - rc = -errno; + fprintf(stderr, + "%s %s: cannot find mirror with ID %u in '%s'\n", + progname, argv[0], mirror_id, fname); goto close_fd; } - flr_state &= LCM_FL_FLR_MASK; - switch (flr_state) { - case LCM_FL_NOT_FLR: - rc = -EINVAL; - case LCM_FL_RDONLY: - fprintf(stderr, "%s: '%s' file state error: %s.\n", - progname, fname, lcm_flags_string(flr_state)); - goto close_fd; - default: - break; + /* open output file */ + if (outfile) { + outfd = open(outfile, O_EXCL | O_WRONLY | O_CREAT, 0644); + if (outfd < 0) { + fprintf(stderr, "%s %s: cannot create file '%s': %s\n", + progname, argv[0], outfile, strerror(errno)); + rc = -errno; + goto close_fd; + } + } else { + outfd = STDOUT_FILENO; } - /* get stale component info */ - comp_size = llapi_mirror_find_stale(layout, comp_array, - ARRAY_SIZE(comp_array), - mirror_ids, ids_nr); - if (comp_size < 0) { - rc = comp_size; - goto close_fd; + /* allocate buffer */ + rc = posix_memalign(&buf, sysconf(_SC_PAGESIZE), buflen); + if (rc) { + fprintf(stderr, "%s %s: posix_memalign returns %d\n", + progname, argv[0], rc); + goto close_outfd; } - idx = 0; - while (idx < comp_size) { - ssize_t result; - uint64_t end; - __u16 mirror_id; - int i; + pos = 0; + while (1) { + ssize_t bytes_read; + ssize_t written = 0; - rc = llapi_lease_check(fd); - if (rc != LL_LEASE_WRLCK) { - fprintf(stderr, "%s: '%s' lost lease lock.\n", - progname, fname); - goto close_fd; + bytes_read = llapi_mirror_read(fd, mirror_id, buf, buflen, pos); + if (bytes_read < 0) { + rc = bytes_read; + fprintf(stderr, + "%s %s: fail to read data from mirror %u: %s\n", + progname, argv[0], mirror_id, strerror(-rc)); + goto free_buf; } - mirror_id = comp_array[idx].lrc_mirror_id; - end = comp_array[idx].lrc_end; - - /* try to combine adjacent component */ - for (i = idx + 1; i < comp_size; i++) { - if (mirror_id != comp_array[i].lrc_mirror_id || - end != comp_array[i].lrc_start) - break; - end = comp_array[i].lrc_end; - } + /* EOF reached */ + if (bytes_read == 0) + break; - result = llapi_mirror_resync_one(fd, layout, mirror_id, - comp_array[idx].lrc_start, - end); - if (result < 0) { - fprintf(stderr, "%s: '%s' llapi_mirror_resync_one: " - "%ld.\n", progname, fname, result); - rc = result; - goto close_fd; - } else if (result > 0) { - int j; + while (written < bytes_read) { + ssize_t written2; - /* mark synced components */ - for (j = idx; j < i; j++) - comp_array[j].lrc_synced = true; + written2 = write(outfd, buf + written, + bytes_read - written); + if (written2 < 0) { + fprintf(stderr, + "%s %s: fail to write %s: %s\n", + progname, argv[0], outfile ? : "STDOUT", + strerror(errno)); + rc = -errno; + goto free_buf; + } + written += written2; } - idx = i; - } - - /* prepare ioc for lease put */ - ioc->lil_mode = LL_LEASE_UNLCK; - ioc->lil_flags = LL_LEASE_RESYNC_DONE; - ioc->lil_count = 0; - for (idx = 0; idx < comp_size; idx++) { - if (comp_array[idx].lrc_synced) { - ioc->lil_ids[ioc->lil_count] = comp_array[idx].lrc_id; - ioc->lil_count++; + if (written != bytes_read) { + fprintf(stderr, + "%s %s: written %ld bytes does not match with %ld read.\n", + progname, argv[0], written, bytes_read); + rc = -EIO; + goto free_buf; } - } - - llapi_layout_free(layout); - rc = llapi_lease_set(fd, ioc); - if (rc <= 0) { - if (rc == 0) /* lost lease lock */ - rc = -EBUSY; - fprintf(stderr, "%s: resync file '%s' failed: %s.\n", - progname, fname, strerror(errno)); - goto close_fd; + pos += bytes_read; } - /** - * llapi_lease_set returns lease mode when it request to unlock - * the lease lock - */ + + fsync(outfd); rc = 0; +free_buf: + free(buf); +close_outfd: + if (outfile) + close(outfd); close_fd: close(fd); -error: + return rc; } -static inline int lfs_mirror_resync(int argc, char **argv) +static inline int lfs_mirror_write(int argc, char **argv) { - struct ll_ioc_lease *ioc = NULL; - __u16 mirror_ids[128] = { 0 }; - int ids_nr = 0; + int rc = CMD_HELP; + __u16 mirror_id = 0; + const char *inputfile = NULL; + char *fname; + int fd = 0; + int inputfd; int c; - int rc = 0; + void *buf; + const size_t buflen = 4 << 20; + off_t pos; + size_t page_size = sysconf(_SC_PAGESIZE); + struct ll_ioc_lease_id ioc; struct option long_opts[] = { - { .val = 'o', .name = "only", .has_arg = required_argument }, + { .val = 'N', .name = "mirror-id", .has_arg = required_argument }, + { .val = 'i', .name = "inputfile", .has_arg = required_argument }, { .name = NULL } }; - while ((c = getopt_long(argc, argv, "o:", long_opts, NULL)) >= 0) { + while ((c = getopt_long(argc, argv, "N:i:", long_opts, NULL)) >= 0) { + char *end; + switch (c) { - case 'o': - rc = parse_mirror_ids(mirror_ids, - sizeof(mirror_ids) / sizeof(__u16), - optarg); - if (rc < 0) { + case 'N': + mirror_id = strtoul(optarg, &end, 0); + if (*end != '\0' || mirror_id == 0) { fprintf(stderr, - "%s: bad mirror ids '%s'.\n", - argv[0], optarg); - goto error; + "%s %s: invalid mirror ID '%s'\n", + progname, argv[0], optarg); + return rc; } - ids_nr = rc; + break; + case 'i': + inputfile = optarg; break; default: - fprintf(stderr, "%s: options '%s' unrecognized.\n", - argv[0], argv[optind - 1]); - rc = -EINVAL; - goto error; + fprintf(stderr, "%s: option '%s' unrecognized\n", + progname, argv[optind - 1]); + return -EINVAL; } } if (argc == optind) { - fprintf(stderr, "%s: no file name given.\n", argv[0]); - rc = CMD_HELP; - goto error; + fprintf(stderr, "%s %s: no mirrored file provided\n", + progname, argv[0]); + return rc; + } else if (argc > optind + 1) { + fprintf(stderr, "%s %s: too many files\n", progname, argv[0]); + return rc; } - if (ids_nr > 0 && argc > optind + 1) { + if (mirror_id == 0) { + fprintf(stderr, "%s %s: no valid mirror ID is provided\n", + progname, argv[0]); + return rc; + } + + /* open mirror file */ + fname = argv[optind]; + + if (inputfile) { + rc = check_same_file(fname, inputfile); + if (rc == 0) { + fprintf(stderr, + "%s %s: input file cannot be the mirrored file\n", + progname, argv[0]); + return -EINVAL; + } + if (rc < 0) + return rc; + } + + fd = open(fname, O_DIRECT | O_WRONLY); + if (fd < 0) { + fprintf(stderr, "%s %s: cannot open '%s': %s\n", + progname, argv[0], fname, strerror(errno)); + return rc; + } + + /* verify mirror id */ + rc = verify_mirror_id_by_fd(fd, mirror_id); + if (rc) { fprintf(stderr, - "%s: option '--only' cannot be used upon multiple files.\n", - argv[0]); - rc = CMD_HELP; - goto error; + "%s %s: cannot find mirror with ID %u in '%s'\n", + progname, argv[0], mirror_id, fname); + goto close_fd; + } + /* open input file */ + if (inputfile) { + inputfd = open(inputfile, O_RDONLY, 0644); + if (inputfd < 0) { + fprintf(stderr, "%s %s: cannot open file '%s': %s\n", + progname, argv[0], inputfile, strerror(errno)); + rc = -errno; + goto close_fd; + } + } else { + inputfd = STDIN_FILENO; } - if (ids_nr > 0) { - rc = verify_mirror_ids(argv[optind], mirror_ids, ids_nr); - if (rc < 0) - goto error; + /* allocate buffer */ + rc = posix_memalign(&buf, page_size, buflen); + if (rc) { + fprintf(stderr, "%s %s: posix_memalign returns %d\n", + progname, argv[0], rc); + goto close_inputfd; } - /* set the lease on the file */ - ioc = calloc(sizeof(*ioc) + sizeof(__u32) * 4096, 1); - if (ioc == NULL) { - fprintf(stderr, "%s: cannot alloc id array for ioc: %s.\n", - argv[0], strerror(errno)); - rc = -errno; - goto error; + /* prepare target mirror components instantiation */ + ioc.lil_mode = LL_LEASE_WRLCK; + ioc.lil_flags = LL_LEASE_RESYNC; + ioc.lil_mirror_id = mirror_id; + rc = llapi_lease_set(fd, (struct ll_ioc_lease *)&ioc); + if (rc < 0) { + fprintf(stderr, + "%s %s: '%s' llapi_lease_get_ext failed: %s\n", + progname, argv[0], fname, strerror(errno)); + goto free_buf; } - for (; optind < argc; optind++) { - rc = lfs_mirror_resync_file(argv[optind], ioc, - mirror_ids, ids_nr); - /* ignore previous file's error, continue with next file */ + pos = 0; + while (1) { + ssize_t bytes_read; + ssize_t written; + size_t to_write; - /* reset ioc */ - memset(ioc, 0, sizeof(__u32) * 4096); + rc = llapi_lease_check(fd); + if (rc != LL_LEASE_WRLCK) { + fprintf(stderr, "%s %s: '%s' lost lease lock\n", + progname, argv[0], fname); + goto free_buf; + } + + bytes_read = read(inputfd, buf, buflen); + if (bytes_read < 0) { + rc = bytes_read; + fprintf(stderr, + "%s %s: fail to read data from '%s': %s\n", + progname, argv[0], inputfile ? : "STDIN", + strerror(errno)); + rc = -errno; + goto free_buf; + } + + /* EOF reached */ + if (bytes_read == 0) + break; + + /* round up to page align to make direct IO happy. */ + to_write = (bytes_read + page_size - 1) & ~(page_size - 1); + + written = llapi_mirror_write(fd, mirror_id, buf, to_write, + pos); + if (written < 0) { + rc = written; + fprintf(stderr, + "%s %s: fail to write to mirror %u: %s\n", + progname, argv[0], mirror_id, + strerror(-rc)); + goto free_buf; + } + + pos += bytes_read; } - free(ioc); -error: + if (pos & (page_size - 1)) { + rc = llapi_mirror_truncate(fd, mirror_id, pos); + if (rc < 0) + goto free_buf; + } + + ioc.lil_mode = LL_LEASE_UNLCK; + ioc.lil_flags = LL_LEASE_RESYNC_DONE; + ioc.lil_count = 0; + rc = llapi_lease_set(fd, (struct ll_ioc_lease *)&ioc); + if (rc <= 0) { + if (rc == 0) + rc = -EBUSY; + fprintf(stderr, + "%s %s: release lease lock of '%s' failed: %s\n", + progname, argv[0], fname, strerror(errno)); + goto free_buf; + } + + rc = 0; + +free_buf: + free(buf); +close_inputfd: + if (inputfile) + close(inputfd); +close_fd: + close(fd); + return rc; } @@ -7800,9 +9193,9 @@ int lfs_mirror_verify_file(const char *fname, __u16 *mirror_ids, int ids_nr, goto error; } - rc = llapi_lease_get(fd, LL_LEASE_RDLCK); + rc = llapi_lease_acquire(fd, LL_LEASE_RDLCK); if (rc < 0) { - fprintf(stderr, "%s: '%s' llapi_lease_get failed: %s.\n", + fprintf(stderr, "%s: '%s' llapi_lease_acquire failed: %s.\n", progname, fname, strerror(errno)); goto close_fd; } @@ -7812,7 +9205,7 @@ int lfs_mirror_verify_file(const char *fname, __u16 *mirror_ids, int ids_nr, fprintf(stderr, "%s: '%s' llapi_layout_get_by_fd failed: %s.\n", progname, fname, strerror(errno)); rc = -errno; - llapi_lease_put(fd); + llapi_lease_release(fd); goto close_fd; } @@ -7826,10 +9219,10 @@ int lfs_mirror_verify_file(const char *fname, __u16 *mirror_ids, int ids_nr, flr_state &= LCM_FL_FLR_MASK; switch (flr_state) { - case LCM_FL_NOT_FLR: + case LCM_FL_NONE: rc = -EINVAL; fprintf(stderr, "%s: '%s' file state error: %s.\n", - progname, fname, lcm_flags_string(flr_state)); + progname, fname, llapi_layout_flags_string(flr_state)); goto free_layout; default: break; @@ -7909,7 +9302,7 @@ int lfs_mirror_verify_file(const char *fname, __u16 *mirror_ids, int ids_nr, free_layout: llapi_layout_free(layout); - llapi_lease_put(fd); + llapi_lease_release(fd); close_fd: close(fd); error: @@ -7968,7 +9361,7 @@ static inline int lfs_mirror_verify(int argc, char **argv) verbose++; break; default: - fprintf(stderr, "%s: options '%s' unrecognized.\n", + fprintf(stderr, "%s: option '%s' unrecognized.\n", progname, argv[optind - 1]); rc = -EINVAL; goto error; @@ -8037,6 +9430,94 @@ static int lfs_mirror(int argc, char **argv) return rc < 0 ? -rc : rc; } +static void lustre_som_swab(struct lustre_som_attrs *attrs) +{ +#if __BYTE_ORDER == __BIG_ENDIAN + __swab16s(&attrs->lsa_valid); + __swab64s(&attrs->lsa_size); + __swab64s(&attrs->lsa_blocks); +#endif +} + +enum lfs_som_type { + LFS_SOM_SIZE = 0x1, + LFS_SOM_BLOCKS = 0x2, + LFS_SOM_FLAGS = 0x4, + LFS_SOM_ATTR_ALL = LFS_SOM_SIZE | LFS_SOM_BLOCKS | + LFS_SOM_FLAGS, +}; + +static int lfs_getsom(int argc, char **argv) +{ + const char *path; + struct lustre_som_attrs *attrs; + char buf[sizeof(*attrs) + 64]; + enum lfs_som_type type = LFS_SOM_ATTR_ALL; + int rc = 0, c; + + while ((c = getopt(argc, argv, "sbf")) != -1) { + switch (c) { + case 's': + type = LFS_SOM_SIZE; + break; + case 'b': + type = LFS_SOM_BLOCKS; + break; + case 'f': + type = LFS_SOM_FLAGS; + break; + default: + fprintf(stderr, "%s: invalid option '%c'\n", + progname, optopt); + return CMD_HELP; + } + } + + argc -= optind; + argv += optind; + + if (argc != 1) { + fprintf(stderr, "%s: %s\n", + progname, argc == 0 ? "miss file target" : + "input more than 2 files"); + return CMD_HELP; + } + + path = argv[0]; + attrs = (void *)buf; + rc = lgetxattr(path, "trusted.som", attrs, sizeof(buf)); + if (rc < 0) { + rc = -errno; + fprintf(stderr, "%s failed to get som xattr: %s (%d)\n", + argv[0], strerror(errno), errno); + return rc; + } + + lustre_som_swab(attrs); + + switch (type) { + case LFS_SOM_ATTR_ALL: + printf("file: %s size: %llu blocks: %llu flags: %x\n", + path, attrs->lsa_size, attrs->lsa_blocks, + attrs->lsa_valid); + break; + case LFS_SOM_SIZE: + printf("%llu\n", attrs->lsa_size); + break; + case LFS_SOM_BLOCKS: + printf("%llu\n", attrs->lsa_blocks); + break; + case LFS_SOM_FLAGS: + printf("%x\n", attrs->lsa_valid); + break; + default: + fprintf(stderr, "%s: unknown option\n", progname); + return CMD_HELP; + } + + return 0; +} + /** * lfs_mirror_list_commands() - List lfs mirror commands. * @argc: The count of command line arguments.