X-Git-Url: https://git.whamcloud.com/?a=blobdiff_plain;f=e2fsck%2Fdirinfo.c;h=322f4da1d94b68fd5bafd737a0c5788cc832af02;hb=dc981d15c5de832f5675c13d53baeeaaa9bc232a;hp=dbaf4712b7779bbf63d6f94151b2cb2f489da173;hpb=253a96500a8fbe7266fe2daa066768cbaa1d3137;p=tools%2Fe2fsprogs.git diff --git a/e2fsck/dirinfo.c b/e2fsck/dirinfo.c index dbaf471..322f4da 100644 --- a/e2fsck/dirinfo.c +++ b/e2fsck/dirinfo.c @@ -7,26 +7,32 @@ #undef DIRINFO_DEBUG +#include #include "config.h" #include "e2fsck.h" #include #include #include "uuid/uuid.h" +#include "ext2fs/ext2fs.h" #include struct dir_info_db { - int count; - int size; + ext2_ino_t count; + ext2_ino_t size; struct dir_info *array; struct dir_info *last_lookup; +#ifdef CONFIG_TDB char *tdb_fn; TDB_CONTEXT *tdb; +#endif }; struct dir_info_iter { - int i; + ext2_ino_t i; +#ifdef CONFIG_TDB TDB_DATA tdb_iter; +#endif }; struct dir_info_ent { @@ -37,10 +43,11 @@ struct dir_info_ent { static void e2fsck_put_dir_info(e2fsck_t ctx, struct dir_info *dir); +#ifdef CONFIG_TDB static void setup_tdb(e2fsck_t ctx, ext2_ino_t num_dirs) { struct dir_info_db *db = ctx->dir_info; - unsigned int threshold; + ext2_ino_t threshold; errcode_t retval; mode_t save_umask; char *tdb_dir, uuid[40]; @@ -78,6 +85,7 @@ static void setup_tdb(e2fsck_t ctx, ext2_ino_t num_dirs) O_RDWR | O_CREAT | O_TRUNC, 0600); close(fd); } +#endif static void setup_db(e2fsck_t ctx) { @@ -97,6 +105,7 @@ static void setup_db(e2fsck_t ctx) if (retval) num_dirs = 1024; /* Guess */ +#ifdef CONFIG_TDB setup_tdb(ctx, num_dirs); if (db->tdb) { @@ -105,6 +114,7 @@ static void setup_db(e2fsck_t ctx) #endif return; } +#endif db->size = num_dirs + 10; db->array = (struct dir_info *) @@ -114,70 +124,218 @@ static void setup_db(e2fsck_t ctx) } /* + * Return the min index that has ino larger or equal to @ino + * If not found, return -ENOENT + */ +static int +e2fsck_dir_info_min_larger_equal(struct dir_info_db *dir_info, + ext2_ino_t ino, ext2_ino_t *index) +{ + ext2_ino_t low = 0; + ext2_ino_t mid, high; + ext2_ino_t tmp_ino; + int found = 0; + + if (dir_info->count == 0) + return -ENOENT; + + high = dir_info->count - 1; + while (low <= high) { + /* sum may overflow, but result will fit into mid again */ + mid = (unsigned long long)(low + high) / 2; + tmp_ino = dir_info->array[mid].ino; + if (ino == tmp_ino) { + *index = mid; + found = 1; + return 0; + } else if (ino < tmp_ino) { + /* + * The mid ino is larger than @ino, remember the index + * here so we won't miss this ino + */ + *index = mid; + found = 1; + if (mid == 0) + break; + high = mid - 1; + } else { + low = mid + 1; + } + } + + if (found) + return 0; + + return -ENOENT; +} + +/* + * Merge two sorted dir info to @dest + */ +void e2fsck_merge_dir_info(e2fsck_t ctx, struct dir_info_db *src, + struct dir_info_db *dest) +{ + size_t size_dir_info = sizeof(struct dir_info); + ext2_ino_t size = dest->size; + struct dir_info *src_array = src->array; + struct dir_info *dest_array = dest->array; + ext2_ino_t src_count = src->count; + ext2_ino_t dest_count = dest->count; + ext2_ino_t total_count = src_count + dest_count; + struct dir_info *tmp_array; + struct dir_info *array_ptr; + ext2_ino_t src_index = 0; + ext2_ino_t dest_index = 0; + + if (src->count == 0) + return; + + if (size < total_count) + size = total_count; + + if (size < src->size) + size = src->size; + + tmp_array = e2fsck_allocate_memory(ctx, size * size_dir_info, + "directory map"); + array_ptr = tmp_array; + /* + * This can be improved by binary search and memcpy, but codes + * would be more complex. And if the groups distributed to each + * thread are strided, this implementation won't be too bad + * comparing to the optimiztion. + */ + while (src_index < src_count || dest_index < dest_count) { + if (src_index >= src_count) { + memcpy(array_ptr, &dest_array[dest_index], + (dest_count - dest_index) * size_dir_info); + break; + } + if (dest_index >= dest_count) { + memcpy(array_ptr, &src_array[src_index], + (src_count - src_index) * size_dir_info); + break; + } + if (src_array[src_index].ino < dest_array[dest_index].ino) { + *array_ptr = src_array[src_index]; + src_index++; + } else { + assert(src_array[src_index].ino > + dest_array[dest_index].ino); + *array_ptr = dest_array[dest_index]; + dest_index++; + } + array_ptr++; + } + + if (dest->array) + ext2fs_free_mem(&dest->array); + dest->array = tmp_array; + dest->size = size; + dest->count = total_count; +} + +/* + * + * Insert an inode into the sorted array. The array should have at least one + * free slot. + * + * Normally, add_dir_info is called with each inode in + * sequential order; but once in a while (like when pass 3 + * needs to recreate the root directory or lost+found + * directory) it is called out of order. In those cases, we + * need to move the dir_info entries down to make room, since + * the dir_info array needs to be sorted by inode number for + * get_dir_info()'s sake. + */ +static void e2fsck_insert_dir_info(struct dir_info_db *dir_info, ext2_ino_t ino, ext2_ino_t parent) +{ + ext2_ino_t index; + struct dir_info *dir; + size_t dir_size = sizeof(*dir); + struct dir_info *array = dir_info->array; + ext2_ino_t array_count = dir_info->count; + int err; + + /* + * Removing this check won't break anything. But since seqential ino + * inserting happens a lot, this check avoids binary search. + */ + if (array_count == 0 || array[array_count - 1].ino < ino) { + dir = &array[array_count]; + dir_info->count++; + goto out; + } + + err = e2fsck_dir_info_min_larger_equal(dir_info, ino, &index); + if (err >= 0 && array[index].ino == ino) { + dir = &array[index]; + goto out; + } + if (err < 0) { + dir = &array[array_count]; + dir_info->count++; + goto out; + } + + dir = &array[index]; + memmove((char *)dir + dir_size, dir, dir_size * (array_count - index)); + dir_info->count++; +out: + dir->ino = ino; + dir->dotdot = parent; + dir->parent = parent; +} + +/* * This subroutine is called during pass1 to create a directory info * entry. During pass1, the passed-in parent is 0; it will get filled * in during pass2. */ void e2fsck_add_dir_info(e2fsck_t ctx, ext2_ino_t ino, ext2_ino_t parent) { - struct dir_info_db *db; - struct dir_info *dir, ent; - int i, j; + struct dir_info *old_array; errcode_t retval; unsigned long old_size; #ifdef DIRINFO_DEBUG - printf("add_dir_info for inode (%lu, %lu)...\n", ino, parent); + printf("add_dir_info for inode (%u, %u)...\n", ino, parent); #endif if (!ctx->dir_info) setup_db(ctx); - db = ctx->dir_info; if (ctx->dir_info->count >= ctx->dir_info->size) { old_size = ctx->dir_info->size * sizeof(struct dir_info); ctx->dir_info->size += 10; + old_array = ctx->dir_info->array; retval = ext2fs_resize_mem(old_size, ctx->dir_info->size * sizeof(struct dir_info), &ctx->dir_info->array); if (retval) { + fprintf(stderr, "Couldn't reallocate dir_info " + "structure to %u entries\n", + ctx->dir_info->size); + fatal_error(ctx, 0); ctx->dir_info->size -= 10; return; } + if (old_array != ctx->dir_info->array) + ctx->dir_info->last_lookup = NULL; } - ent.ino = ino; - ent.parent = parent; - ent.dotdot = parent; +#ifdef CONFIG_TDB + if (ctx->dir_info->tdb) { + struct dir_info ent; - if (db->tdb) { + ent.ino = ino; + ent.parent = parent; + ent.dotdot = parent; e2fsck_put_dir_info(ctx, &ent); return; } +#endif - /* - * Normally, add_dir_info is called with each inode in - * sequential order; but once in a while (like when pass 3 - * needs to recreate the root directory or lost+found - * directory) it is called out of order. In those cases, we - * need to move the dir_info entries down to make room, since - * the dir_info array needs to be sorted by inode number for - * get_dir_info()'s sake. - */ - if (ctx->dir_info->count && - ctx->dir_info->array[ctx->dir_info->count-1].ino >= ino) { - for (i = ctx->dir_info->count-1; i > 0; i--) - if (ctx->dir_info->array[i-1].ino < ino) - break; - dir = &ctx->dir_info->array[i]; - if (dir->ino != ino) - for (j = ctx->dir_info->count++; j > i; j--) - ctx->dir_info->array[j] = ctx->dir_info->array[j-1]; - } else - dir = &ctx->dir_info->array[ctx->dir_info->count++]; - - dir->ino = ino; - dir->dotdot = parent; - dir->parent = parent; + e2fsck_insert_dir_info(ctx->dir_info, ino, parent); } /* @@ -187,19 +345,21 @@ void e2fsck_add_dir_info(e2fsck_t ctx, ext2_ino_t ino, ext2_ino_t parent) static struct dir_info *e2fsck_get_dir_info(e2fsck_t ctx, ext2_ino_t ino) { struct dir_info_db *db = ctx->dir_info; - int low, high, mid; - struct dir_info_ent *buf; - static struct dir_info ret_dir_info; + ext2_ino_t index; + int err; if (!db) return 0; #ifdef DIRINFO_DEBUG - printf("e2fsck_get_dir_info %d...", ino); + printf("e2fsck_get_dir_info %u...", ino); #endif +#ifdef CONFIG_TDB if (db->tdb) { + static struct dir_info ret_dir_info; TDB_DATA key, data; + struct dir_info_ent *buf; key.dptr = (unsigned char *) &ino; key.dsize = sizeof(ext2_ino_t); @@ -217,65 +377,46 @@ static struct dir_info *e2fsck_get_dir_info(e2fsck_t ctx, ext2_ino_t ino) ret_dir_info.dotdot = buf->dotdot; ret_dir_info.parent = buf->parent; #ifdef DIRINFO_DEBUG - printf("(%d,%d,%d)\n", ino, buf->dotdot, buf->parent); + printf("(%u,%u,%u)\n", ino, buf->dotdot, buf->parent); #endif free(data.dptr); return &ret_dir_info; } +#endif if (db->last_lookup && db->last_lookup->ino == ino) return db->last_lookup; - low = 0; - high = ctx->dir_info->count-1; - if (ino == ctx->dir_info->array[low].ino) { + err = e2fsck_dir_info_min_larger_equal(ctx->dir_info, ino, &index); + if (err < 0) + return NULL; + assert(ino <= ctx->dir_info->array[index].ino); + if (ino == ctx->dir_info->array[index].ino) { #ifdef DIRINFO_DEBUG printf("(%d,%d,%d)\n", ino, - ctx->dir_info->array[low].dotdot, - ctx->dir_info->array[low].parent); + ctx->dir_info->array[index].dotdot, + ctx->dir_info->array[index].parent); #endif - return &ctx->dir_info->array[low]; + return &ctx->dir_info->array[index]; } - if (ino == ctx->dir_info->array[high].ino) { -#ifdef DIRINFO_DEBUG - printf("(%d,%d,%d)\n", ino, - ctx->dir_info->array[high].dotdot, - ctx->dir_info->array[high].parent); -#endif - return &ctx->dir_info->array[high]; - } - - while (low < high) { - mid = (low+high)/2; - if (mid == low || mid == high) - break; - if (ino == ctx->dir_info->array[mid].ino) { -#ifdef DIRINFO_DEBUG - printf("(%d,%d,%d)\n", ino, - ctx->dir_info->array[mid].dotdot, - ctx->dir_info->array[mid].parent); -#endif - return &ctx->dir_info->array[mid]; - } - if (ino < ctx->dir_info->array[mid].ino) - high = mid; - else - low = mid; - } - return 0; + return NULL; } -static void e2fsck_put_dir_info(e2fsck_t ctx, struct dir_info *dir) +static void e2fsck_put_dir_info(e2fsck_t ctx EXT2FS_NO_TDB_UNUSED, + struct dir_info *dir EXT2FS_NO_TDB_UNUSED) { +#ifdef CONFIG_TDB struct dir_info_db *db = ctx->dir_info; struct dir_info_ent buf; TDB_DATA key, data; +#endif #ifdef DIRINFO_DEBUG - printf("e2fsck_put_dir_info (%d, %d, %d)...", dir->ino, dir->dotdot, + printf("e2fsck_put_dir_info (%u, %u, %u)...", dir->ino, dir->dotdot, dir->parent); #endif +#ifdef CONFIG_TDB if (!db->tdb) return; @@ -290,7 +431,7 @@ static void e2fsck_put_dir_info(e2fsck_t ctx, struct dir_info *dir) if (tdb_store(db->tdb, key, data, TDB_REPLACE) == -1) { printf("store failed: %s\n", tdb_errorstr(db->tdb)); } - return; +#endif } /* @@ -299,12 +440,16 @@ static void e2fsck_put_dir_info(e2fsck_t ctx, struct dir_info *dir) void e2fsck_free_dir_info(e2fsck_t ctx) { if (ctx->dir_info) { +#ifdef CONFIG_TDB if (ctx->dir_info->tdb) tdb_close(ctx->dir_info->tdb); if (ctx->dir_info->tdb_fn) { - unlink(ctx->dir_info->tdb_fn); - free(ctx->dir_info->tdb_fn); + if (unlink(ctx->dir_info->tdb_fn) < 0) + com_err("e2fsck_free_dir_info", errno, + _("while freeing dir_info tdb file")); + ext2fs_free_mem(&ctx->dir_info->tdb_fn); } +#endif if (ctx->dir_info->array) ext2fs_free_mem(&ctx->dir_info->array); ctx->dir_info->array = 0; @@ -326,13 +471,14 @@ int e2fsck_get_num_dirinfo(e2fsck_t ctx) struct dir_info_iter *e2fsck_dir_info_iter_begin(e2fsck_t ctx) { struct dir_info_iter *iter; - struct dir_info_db *db = ctx->dir_info; iter = e2fsck_allocate_memory(ctx, sizeof(struct dir_info_iter), "dir_info iterator"); - if (db->tdb) - iter->tdb_iter = tdb_firstkey(db->tdb); +#ifdef CONFIG_TDB + if (ctx->dir_info->tdb) + iter->tdb_iter = tdb_firstkey(ctx->dir_info->tdb); +#endif return iter; } @@ -340,7 +486,9 @@ struct dir_info_iter *e2fsck_dir_info_iter_begin(e2fsck_t ctx) void e2fsck_dir_info_iter_end(e2fsck_t ctx EXT2FS_ATTR((unused)), struct dir_info_iter *iter) { +#ifdef CONFIG_TDB free(iter->tdb_iter.dptr); +#endif ext2fs_free_mem(&iter); } @@ -349,39 +497,40 @@ void e2fsck_dir_info_iter_end(e2fsck_t ctx EXT2FS_ATTR((unused)), */ struct dir_info *e2fsck_dir_info_iter(e2fsck_t ctx, struct dir_info_iter *iter) { - TDB_DATA data, key; - struct dir_info_db *db = ctx->dir_info; - struct dir_info_ent *buf; - static struct dir_info ret_dir_info; - if (!ctx->dir_info || !iter) return 0; - if (db->tdb) { +#ifdef CONFIG_TDB + if (ctx->dir_info->tdb) { + static struct dir_info ret_dir_info; + struct dir_info_ent *buf; + TDB_DATA data, key; + if (iter->tdb_iter.dptr == 0) return 0; key = iter->tdb_iter; - data = tdb_fetch(db->tdb, key); + data = tdb_fetch(ctx->dir_info->tdb, key); if (!data.dptr) { printf("iter fetch failed: %s\n", - tdb_errorstr(db->tdb)); + tdb_errorstr(ctx->dir_info->tdb)); return 0; } buf = (struct dir_info_ent *) data.dptr; ret_dir_info.ino = *((ext2_ino_t *) iter->tdb_iter.dptr); ret_dir_info.dotdot = buf->dotdot; ret_dir_info.parent = buf->parent; - iter->tdb_iter = tdb_nextkey(db->tdb, key); + iter->tdb_iter = tdb_nextkey(ctx->dir_info->tdb, key); free(key.dptr); free(data.dptr); return &ret_dir_info; } +#endif if (iter->i >= ctx->dir_info->count) return 0; #ifdef DIRINFO_DEBUG - printf("iter(%d, %d, %d)...", ctx->dir_info->array[iter->i].ino, + printf("iter(%u, %u, %u)...", ctx->dir_info->array[iter->i].ino, ctx->dir_info->array[iter->i].dotdot, ctx->dir_info->array[iter->i].parent); #endif