1 commit 2db3b2b33ee796f4ea61316773452d936303ad27
2 Author: Pravin Shelar <Pravin.Shelar@sun.com>
3 AuthorDate: Sun Oct 4 18:13:14 2009 +0000
4 Subject: ext4: add ext4-data-in-dirent patch
6 Allows ext4 to store extra data records inside the ext4_dirent
7 along with the regular directory entry (type, length, filename).
8 Data is stored in ext4 dirent after filename, with a bit flag in
9 de->file_type to indicate if any record after de->name is used.
10 Each in-use record is variable length and must store a 1-byte
11 length (including the length byte itself) at the start so that it
12 can be skipped if the record type is unknown/unneeded. The record
13 starts after a NUL byte terminator for the filename. This extra
14 space is accounted in de->rec_len but not de->name_len.
16 Flag EXT4_DIRENT_LUFID is used for a 128-bit file identifier.
17 Make use of dentry->d_fsdata to pass LUFID to ext4, so no changes
18 in ext4_add_entry() interface are required.
21 Signed-off-by: Pravin Shelar <Pravin.Shelar@sun.com>
22 Reviewed-by: Huang Hua <h.huang@sun.com>
23 Signed-off-by: Andreas Dilger <andreas.dilger@sun.com>
26 fs/ext4/ext4.h | 107 ++++++++++++++++--
27 fs/ext4/fast_commit.c | 2 +-
28 fs/ext4/inline.c | 8 +-
29 fs/ext4/namei.c | 251 ++++++++++++++++++++++++++++++++----------
30 fs/ext4/super.c | 12 +-
31 6 files changed, 314 insertions(+), 75 deletions(-)
33 diff --git a/fs/ext4/dir.c b/fs/ext4/dir.c
34 index 3985f8c3..b8e4df14 100644
37 @@ -465,12 +465,17 @@ int ext4_htree_store_dirent(struct file *dir_file, __u32 hash,
38 struct fname *fname, *new_fn;
39 struct dir_private_info *info;
43 info = dir_file->private_data;
44 p = &info->root.rb_node;
46 /* Create and allocate the fname structure */
47 - len = sizeof(struct fname) + ent_name->len + 1;
48 + if (dirent->file_type & EXT4_DIRENT_LUFID)
49 + extra_data = ext4_get_dirent_data_len(dirent);
51 + len = sizeof(struct fname) + ent_name->len + extra_data + 1;
53 new_fn = kzalloc(len, GFP_KERNEL);
56 @@ -479,7 +484,7 @@ int ext4_htree_store_dirent(struct file *dir_file, __u32 hash,
57 new_fn->inode = le32_to_cpu(dirent->inode);
58 new_fn->name_len = ent_name->len;
59 new_fn->file_type = dirent->file_type;
60 - memcpy(new_fn->name, ent_name->name, ent_name->len);
61 + memcpy(new_fn->name, ent_name->name, ent_name->len + extra_data);
65 diff --git a/fs/ext4/ext4.h b/fs/ext4/ext4.h
66 index a4af3ec8..930ca3a5 100644
69 @@ -1184,6 +1184,7 @@ struct ext4_inode_info {
77 @@ -1205,6 +1206,7 @@ struct ext4_inode_info {
78 * Mount flags set via mount options or defaults
80 #define EXT4_MOUNT_NO_MBCACHE 0x00001 /* Do not use mbcache */
81 +#define EXT4_MOUNT_DIRDATA 0x00002 /* Data in directory entries */
82 #define EXT4_MOUNT_GRPID 0x00004 /* Create files with directory's group */
83 #define EXT4_MOUNT_DEBUG 0x00008 /* Some debugging messages */
84 #define EXT4_MOUNT_ERRORS_CONT 0x00010 /* Continue on errors */
85 @@ -2174,6 +2176,7 @@ EXT4_FEATURE_INCOMPAT_FUNCS(casefold, CASEFOLD)
86 EXT4_FEATURE_INCOMPAT_FLEX_BG| \
87 EXT4_FEATURE_INCOMPAT_EA_INODE| \
88 EXT4_FEATURE_INCOMPAT_MMP | \
89 + EXT4_FEATURE_INCOMPAT_DIRDATA| \
90 EXT4_FEATURE_INCOMPAT_INLINE_DATA | \
91 EXT4_FEATURE_INCOMPAT_ENCRYPT | \
92 EXT4_FEATURE_INCOMPAT_CASEFOLD | \
93 @@ -2385,6 +2388,42 @@ struct ext4_dir_entry_tail {
94 #define EXT4_FT_SYMLINK 7
97 +#define EXT4_FT_MASK 0xf
99 +#if EXT4_FT_MAX > EXT4_FT_MASK
100 +#error "conflicting EXT4_FT_MAX and EXT4_FT_MASK"
104 + * d_type has 4 unused bits, so it can hold four types of data. These
105 + * different types of data (e.g. Lustre data, high 32 bits of 64-bit inode
106 + * number) can be stored, in flag order, after the filename in the ext4 dirent.
109 + * This flag is added to d_type if the ext4 dirent has extra data after the
110 + * filename. The data length is variable and is stored in the first byte of
111 + * the data. The data starts after the filename's NUL terminator byte.
112 + * This is used by Lustre FS.
114 +#define EXT4_DIRENT_LUFID 0x10
116 +#define EXT4_LUFID_MAGIC 0xAD200907UL
117 +struct ext4_dentry_param {
118 + __u32 edp_magic; /* EXT4_LUFID_MAGIC */
119 + char edp_len; /* size of edp_data in bytes */
120 + char edp_data[0]; /* packed array of data */
123 +static inline unsigned char *ext4_dentry_get_data(struct super_block *sb,
124 + struct ext4_dentry_param *p)
126 + if (!ext4_has_feature_dirdata(sb))
128 + if (p && p->edp_magic == EXT4_LUFID_MAGIC)
129 + return &p->edp_len;
134 #define EXT4_FT_DIR_CSUM 0xDE
136 @@ -2396,6 +2435,17 @@ struct ext4_dir_entry_tail {
137 #define EXT4_DIR_PAD 4
138 #define EXT4_DIR_ROUND (EXT4_DIR_PAD - 1)
139 #define EXT4_MAX_REC_LEN ((1<<16)-1)
140 +#define EXT4_DIR_REC_LEN_(name_len, i_dir) \
141 + ext4_dir_rec_len((name_len), (i_dir))
142 +#define EXT4_DIR_ENTRY_LEN_(de, i_dir) \
143 + (EXT4_DIR_REC_LEN_((de)->name_len + ext4_get_dirent_data_len(de), \
146 +#define EXT4_DIR_REC_LEN(name_len, i_dir) EXT4_DIR_REC_LEN_((name_len), (i_dir))
147 +#define EXT4_DIR_ENTRY_LEN(de, i_dir) EXT4_DIR_ENTRY_LEN_((de), (i_dir))
148 +/* lustre osd_handler compat -- ifdef LDISKFS_DIR_REC_LEN_WITH_DIR */
149 +#define EXT4_DIR_REC_LEN_WITH_DIR 1
150 +#define __EXT4_DIR_REC_LEN(name_len) EXT4_DIR_REC_LEN_((name_len), NULL)
153 * The rec_len is dependent on the type of directory. Directories that are
154 @@ -2403,10 +2453,10 @@ struct ext4_dir_entry_tail {
155 * ext4_extended_dir_entry_2. For all entries related to '.' or '..' you should
156 * pass NULL for dir, as those entries do not use the extra fields.
158 -static inline unsigned int ext4_dir_rec_len(__u8 name_len,
159 +static inline unsigned int ext4_dir_rec_len(__u32 name_len,
160 const struct inode *dir)
162 - int rec_len = (name_len + 8 + EXT4_DIR_ROUND);
163 + __u32 rec_len = (name_len + 8 + EXT4_DIR_ROUND);
165 if (dir && ext4_hash_in_dirent(dir))
166 rec_len += sizeof(struct ext4_dir_entry_hash);
167 @@ -2831,11 +2881,13 @@ extern int ext4_find_dest_de(struct inode *dir, struct inode *inode,
168 struct buffer_head *bh,
169 void *buf, int buf_size,
170 struct ext4_filename *fname,
171 - struct ext4_dir_entry_2 **dest_de);
172 + struct ext4_dir_entry_2 **dest_de,
174 void ext4_insert_dentry(struct inode *dir, struct inode *inode,
175 struct ext4_dir_entry_2 *de,
177 - struct ext4_filename *fname);
178 + struct ext4_filename *fname,
180 static inline void ext4_update_dx_flag(struct inode *inode)
182 if (!ext4_has_feature_dir_index(inode->i_sb) &&
183 @@ -2851,10 +2903,17 @@ static const unsigned char ext4_filetype_table[] = {
185 static inline unsigned char get_dtype(struct super_block *sb, int filetype)
187 - if (!ext4_has_feature_filetype(sb) || filetype >= EXT4_FT_MAX)
188 + int fl_index = filetype & EXT4_FT_MASK;
190 + if (!ext4_has_feature_filetype(sb) || fl_index >= EXT4_FT_MAX)
193 - return ext4_filetype_table[filetype];
194 + if (!test_opt(sb, DIRDATA))
195 + return ext4_filetype_table[fl_index];
197 + return (ext4_filetype_table[fl_index]) |
198 + (filetype & EXT4_DIRENT_LUFID);
201 extern int ext4_check_all_de(struct inode *dir, struct buffer_head *bh,
202 void *buf, int buf_size);
203 @@ -3058,9 +3117,13 @@ extern int ext4_ind_migrate(struct inode *inode);
206 extern int ext4_init_new_dir(handle_t *handle, struct inode *dir,
207 - struct inode *inode);
208 + struct inode *inode,
209 + const void *data1, const void *data2);
210 extern int ext4_dirblock_csum_verify(struct inode *inode,
211 struct buffer_head *bh);
212 +extern int ext4_add_dot_dotdot(handle_t *handle, struct inode *dir,
213 + struct inode *inode,
214 + const void *data1, const void *data2);
215 extern int ext4_htree_fill_tree(struct file *dir_file, __u32 start_hash,
216 __u32 start_minor_hash, __u32 *next_hash);
217 extern struct inode *ext4_create_inode(handle_t *handle,
218 @@ -3887,6 +3950,36 @@ static inline int ext4_buffer_uptodate(struct buffer_head *bh)
219 return buffer_uptodate(bh);
223 + * Compute the total directory entry data length.
224 + * This includes the filename and an implicit NUL terminator (always present),
225 + * and optional extensions. Each extension has a bit set in the high 4 bits of
226 + * de->file_type, and the extension length is the first byte in each entry.
228 +static inline int ext4_get_dirent_data_len(struct ext4_dir_entry_2 *de)
230 + char *len = de->name + de->name_len + 1 /* NUL terminator */;
232 + __u8 extra_data_flags = (de->file_type & ~EXT4_FT_MASK) >> 4;
233 + struct ext4_dir_entry_tail *t = (struct ext4_dir_entry_tail *)de;
235 + if (!t->det_reserved_zero1 &&
236 + le16_to_cpu(t->det_rec_len) ==
237 + sizeof(struct ext4_dir_entry_tail) &&
238 + !t->det_reserved_zero2 &&
239 + t->det_reserved_ft == EXT4_FT_DIR_CSUM)
242 + while (extra_data_flags) {
243 + if (extra_data_flags & 1) {
244 + dlen += *len + (dlen == 0);
247 + extra_data_flags >>= 1;
252 #endif /* __KERNEL__ */
254 #define EFSBADCRC EBADMSG /* Bad CRC detected */
255 diff --git a/fs/ext4/fast_commit.c b/fs/ext4/fast_commit.c
256 index 8de354dc..00c4769b 100644
257 --- a/fs/ext4/fast_commit.c
258 +++ b/fs/ext4/fast_commit.c
259 @@ -1674,7 +1674,7 @@ static int ext4_fc_replay_create(struct super_block *sb,
260 ext4_debug("Dir %d not found.", darg.ino);
263 - ret = ext4_init_new_dir(NULL, dir, inode);
264 + ret = ext4_init_new_dir(NULL, dir, inode, NULL, NULL);
268 diff --git a/fs/ext4/inline.c b/fs/ext4/inline.c
269 index c4475a74..3fc75d80 100644
270 --- a/fs/ext4/inline.c
271 +++ b/fs/ext4/inline.c
272 @@ -1031,7 +1031,7 @@ static int ext4_add_dirent_to_inline(handle_t *handle,
273 struct ext4_dir_entry_2 *de;
275 err = ext4_find_dest_de(dir, inode, iloc->bh, inline_start,
276 - inline_size, fname, &de);
277 + inline_size, fname, &de, NULL);
281 @@ -1040,7 +1040,7 @@ static int ext4_add_dirent_to_inline(handle_t *handle,
285 - ext4_insert_dentry(dir, inode, de, inline_size, fname);
286 + ext4_insert_dentry(dir, inode, de, inline_size, fname, NULL);
288 ext4_show_inline_dir(dir, iloc->bh, inline_start, inline_size);
290 @@ -1398,7 +1398,7 @@ int ext4_inlinedir_to_tree(struct file *dir_file,
292 strcpy(fake.name, ".");
293 fake.rec_len = ext4_rec_len_to_disk(
294 - ext4_dir_rec_len(fake.name_len, NULL),
295 + EXT4_DIR_ENTRY_LEN(&fake, NULL),
297 ext4_set_de_type(inode->i_sb, &fake, S_IFDIR);
299 @@ -1408,7 +1408,7 @@ int ext4_inlinedir_to_tree(struct file *dir_file,
301 strcpy(fake.name, "..");
302 fake.rec_len = ext4_rec_len_to_disk(
303 - ext4_dir_rec_len(fake.name_len, NULL),
304 + EXT4_DIR_ENTRY_LEN(&fake, NULL),
306 ext4_set_de_type(inode->i_sb, &fake, S_IFDIR);
308 diff --git a/fs/ext4/namei.c b/fs/ext4/namei.c
309 index d0afa8f2..839d51ba 100644
310 --- a/fs/ext4/namei.c
311 +++ b/fs/ext4/namei.c
312 @@ -291,13 +291,14 @@ static unsigned dx_get_count(struct dx_entry *entries);
313 static unsigned dx_get_limit(struct dx_entry *entries);
314 static void dx_set_count(struct dx_entry *entries, unsigned value);
315 static void dx_set_limit(struct dx_entry *entries, unsigned value);
316 -static unsigned dx_root_limit(struct inode *dir, unsigned infosize);
317 +static inline unsigned dx_root_limit(struct inode *dir,
318 + struct ext4_dir_entry_2 *dot_de, unsigned infosize);
319 static unsigned dx_node_limit(struct inode *dir);
320 static struct dx_frame *dx_probe(struct ext4_filename *fname,
322 struct dx_hash_info *hinfo,
323 struct dx_frame *frame);
324 -static void dx_release(struct dx_frame *frames);
325 +static void dx_release(struct dx_frame *frames, struct inode *dir);
326 static int dx_make_map(struct inode *dir, struct buffer_head *bh,
327 struct dx_hash_info *hinfo,
328 struct dx_map_entry *map_tail);
329 @@ -437,22 +438,23 @@ static struct dx_countlimit *get_dx_countlimit(struct inode *inode,
331 struct ext4_dir_entry *dp;
332 struct dx_root_info *root;
334 + int count_offset, dot_rec_len, dotdot_rec_len;
336 if (le16_to_cpu(dirent->rec_len) == EXT4_BLOCK_SIZE(inode->i_sb))
338 - else if (le16_to_cpu(dirent->rec_len) == 12) {
339 - dp = (struct ext4_dir_entry *)(((void *)dirent) + 12);
341 + dot_rec_len = le16_to_cpu(dirent->rec_len);
342 + dp = (struct ext4_dir_entry *)(((void *)dirent) + dot_rec_len);
343 if (le16_to_cpu(dp->rec_len) !=
344 - EXT4_BLOCK_SIZE(inode->i_sb) - 12)
345 + EXT4_BLOCK_SIZE(inode->i_sb) - dot_rec_len)
347 - root = (struct dx_root_info *)(((void *)dp + 12));
348 + dotdot_rec_len = EXT4_DIR_ENTRY_LEN((struct ext4_dir_entry_2 *)dp, NULL);
349 + root = (struct dx_root_info *)(((void *)dp + dotdot_rec_len));
350 if (root->reserved_zero ||
351 root->info_length != sizeof(struct dx_root_info))
356 + count_offset = 8 + dot_rec_len + dotdot_rec_len;
360 *offset = count_offset;
361 @@ -555,13 +557,14 @@ ext4_next_entry(struct ext4_dir_entry_2 *p, unsigned long blocksize)
362 * Future: use high four bits of block for coalesce-on-delete flags
363 * Mask them off for now.
365 -struct dx_root_info *dx_get_dx_info(struct ext4_dir_entry_2 *de)
366 +struct dx_root_info *dx_get_dx_info(struct ext4_dir_entry_2 *de, struct inode *i_dir)
368 + BUG_ON(de->name_len != 1);
369 /* get dotdot first */
370 - de = (struct ext4_dir_entry_2 *)((char *)de + EXT4_DIR_REC_LEN(1));
371 + de = (struct ext4_dir_entry_2 *)((char *)de + EXT4_DIR_ENTRY_LEN(de, i_dir));
373 /* dx root info is after dotdot entry */
374 - de = (struct ext4_dir_entry_2 *)((char *)de + EXT4_DIR_REC_LEN(2));
375 + de = (struct ext4_dir_entry_2 *)((char *)de + EXT4_DIR_ENTRY_LEN(de, i_dir));
377 return (struct dx_root_info *)de;
379 @@ -606,11 +609,16 @@ static inline void dx_set_limit(struct dx_entry *entries, unsigned value)
380 ((struct dx_countlimit *) entries)->limit = cpu_to_le16(value);
383 -static inline unsigned dx_root_limit(struct inode *dir, unsigned infosize)
384 +static inline unsigned dx_root_limit(struct inode *dir,
385 + struct ext4_dir_entry_2 *dot_de, unsigned infosize)
387 - unsigned int entry_space = dir->i_sb->s_blocksize -
388 - ext4_dir_rec_len(1, NULL) -
389 - ext4_dir_rec_len(2, NULL) - infosize;
390 + struct ext4_dir_entry_2 *dotdot_de;
391 + unsigned entry_space;
393 + BUG_ON(dot_de->name_len != 1);
394 + dotdot_de = ext4_next_entry(dot_de, dir->i_sb->s_blocksize);
395 + entry_space = dir->i_sb->s_blocksize - EXT4_DIR_ENTRY_LEN(dot_de, NULL) -
396 + EXT4_DIR_ENTRY_LEN(dotdot_de, NULL) - infosize;
398 if (ext4_has_metadata_csum(dir->i_sb))
399 entry_space -= sizeof(struct dx_tail);
400 @@ -728,7 +736,7 @@ static struct stats dx_show_leaf(struct inode *dir,
401 (unsigned) ((char *) de - base));
404 - space += ext4_dir_rec_len(de->name_len, dir);
405 + space += EXT4_DIR_ENTRY_LEN(de, dir);
408 de = ext4_next_entry(de, size);
409 @@ -822,7 +830,7 @@ dx_probe(struct ext4_filename *fname, struct inode *dir,
410 if (IS_ERR(frame->bh))
411 return (struct dx_frame *) frame->bh;
413 - info = dx_get_dx_info((struct ext4_dir_entry_2 *)frame->bh->b_data);
414 + info = dx_get_dx_info((struct ext4_dir_entry_2 *)frame->bh->b_data, dir);
415 if (info->hash_version != DX_HASH_TEA &&
416 info->hash_version != DX_HASH_HALF_MD4 &&
417 info->hash_version != DX_HASH_LEGACY &&
418 @@ -878,11 +886,14 @@ dx_probe(struct ext4_filename *fname, struct inode *dir,
420 entries = (struct dx_entry *)(((char *)info) + info->info_length);
422 - if (dx_get_limit(entries) != dx_root_limit(dir,
423 - info->info_length)) {
424 + if (dx_get_limit(entries) !=
425 + dx_root_limit(dir, (struct ext4_dir_entry_2 *)frame->bh->b_data,
426 + info->info_length)) {
427 ext4_warning_inode(dir, "dx entry: limit %u != root limit %u",
428 dx_get_limit(entries),
429 - dx_root_limit(dir, info->info_length));
431 + (struct ext4_dir_entry_2 *)frame->bh->b_data,
432 + info->info_length));
436 @@ -959,7 +970,7 @@ fail:
440 -static void dx_release(struct dx_frame *frames)
441 +static void dx_release(struct dx_frame *frames, struct inode *dir)
443 struct dx_root_info *info;
445 @@ -968,7 +979,7 @@ static void dx_release(struct dx_frame *frames)
446 if (frames[0].bh == NULL)
449 - info = dx_get_dx_info((struct ext4_dir_entry_2 *)frames[0].bh->b_data);
450 + info = dx_get_dx_info((struct ext4_dir_entry_2 *)frames[0].bh->b_data, dir);
451 /* save local copy, "info" may be freed after brelse() */
452 indirect_levels = info->indirect_levels;
453 for (i = 0; i <= indirect_levels; i++) {
454 @@ -1269,12 +1280,12 @@ int ext4_htree_fill_tree(struct file *dir_file, __u32 start_hash,
455 (count && ((hashval & 1) == 0)))
458 - dx_release(frames);
459 + dx_release(frames, dir);
460 dxtrace(printk(KERN_DEBUG "Fill tree: returned %d entries, "
461 "next hash: %x\n", count, *next_hash));
464 - dx_release(frames);
465 + dx_release(frames, dir);
469 @@ -1806,7 +1817,7 @@ static struct buffer_head * ext4_dx_find_entry(struct inode *dir,
471 dxtrace(printk(KERN_DEBUG "%s not found\n", fname->usr_fname->name));
473 - dx_release(frames);
474 + dx_release(frames, dir);
478 @@ -1930,7 +1941,7 @@ dx_move_dirents(struct inode *dir, char *from, char *to,
480 struct ext4_dir_entry_2 *de = (struct ext4_dir_entry_2 *)
481 (from + (map->offs<<2));
482 - rec_len = ext4_dir_rec_len(de->name_len, dir);
483 + rec_len = EXT4_DIR_ENTRY_LEN(de, dir);
485 memcpy (to, de, rec_len);
486 ((struct ext4_dir_entry_2 *) to)->rec_len =
487 @@ -1963,7 +1974,7 @@ static struct ext4_dir_entry_2 *dx_pack_dirents(struct inode *dir, char *base,
488 while ((char*)de < base + blocksize) {
489 next = ext4_next_entry(de, blocksize);
490 if (de->inode && de->name_len) {
491 - rec_len = ext4_dir_rec_len(de->name_len, dir);
492 + rec_len = EXT4_DIR_ENTRY_LEN(de, dir);
494 memmove(to, de, rec_len);
495 to->rec_len = ext4_rec_len_to_disk(rec_len, blocksize);
496 @@ -2106,14 +2117,22 @@ int ext4_find_dest_de(struct inode *dir, struct inode *inode,
497 struct buffer_head *bh,
498 void *buf, int buf_size,
499 struct ext4_filename *fname,
500 - struct ext4_dir_entry_2 **dest_de)
501 + struct ext4_dir_entry_2 **dest_de,
504 struct ext4_dir_entry_2 *de;
505 - unsigned short reclen = ext4_dir_rec_len(fname_len(fname), dir);
506 + unsigned short reclen;
508 unsigned int offset = 0;
512 + reclen = ext4_dir_rec_len(fname_len(fname) + *dlen, dir);
515 + reclen = ext4_dir_rec_len(fname_len(fname), dir);
519 top = buf + buf_size - reclen;
520 while ((char *) de <= top) {
521 @@ -2122,10 +2141,31 @@ int ext4_find_dest_de(struct inode *dir, struct inode *inode,
522 return -EFSCORRUPTED;
523 if (ext4_match(dir, fname, de))
525 - nlen = ext4_dir_rec_len(de->name_len, dir);
526 + nlen = EXT4_DIR_ENTRY_LEN(de, dir);
527 rlen = ext4_rec_len_from_disk(de->rec_len, buf_size);
528 if ((de->inode ? rlen - nlen : rlen) >= reclen)
531 + /* Then for dotdot entries, check for the smaller space
532 + * required for just the entry, no FID
534 + if (fname_len(fname) == 2 && memcmp(fname_name(fname), "..", 2) == 0) {
535 + if ((de->inode ? rlen - nlen : rlen) >=
536 + ext4_dir_rec_len(fname_len(fname), dir)) {
537 + /* set dlen = 1 to indicate not
538 + * enough space to store fid
544 + /* The new ".." entry must be written over the
545 + * previous ".." entry, which is the first
546 + * entry traversed by this scan. If it doesn't
547 + * fit, something is badly wrong, so -EIO.
551 de = (struct ext4_dir_entry_2 *)((char *)de + rlen);
554 @@ -2140,12 +2180,13 @@ void ext4_insert_dentry(struct inode *dir,
556 struct ext4_dir_entry_2 *de,
558 - struct ext4_filename *fname)
559 + struct ext4_filename *fname,
565 - nlen = ext4_dir_rec_len(de->name_len, dir);
566 + nlen = EXT4_DIR_ENTRY_LEN(de, dir);
567 rlen = ext4_rec_len_from_disk(de->rec_len, buf_size);
569 struct ext4_dir_entry_2 *de1 =
570 @@ -2166,6 +2207,12 @@ void ext4_insert_dentry(struct inode *dir,
571 EXT4_DIRENT_HASHES(de)->minor_hash =
572 cpu_to_le32(hinfo->minor_hash);
575 + de->name[fname_len(fname)] = 0;
576 + memcpy(&de->name[fname_len(fname) + 1], data, *(char *)data);
577 + de->file_type |= EXT4_DIRENT_LUFID;
583 @@ -2183,14 +2230,19 @@ static int add_dirent_to_buf(handle_t *handle, struct ext4_filename *fname,
585 unsigned int blocksize = dir->i_sb->s_blocksize;
588 + int err, err2, dlen = 0;
589 + unsigned char *data;
591 + data = ext4_dentry_get_data(inode->i_sb, (struct ext4_dentry_param *)
592 + EXT4_I(inode)->i_dirdata);
593 if (ext4_has_metadata_csum(inode->i_sb))
594 csum_size = sizeof(struct ext4_dir_entry_tail);
598 + dlen = (*data) + 1;
599 err = ext4_find_dest_de(dir, inode, bh, bh->b_data,
600 - blocksize - csum_size, fname, &de);
601 + blocksize - csum_size, fname, &de, &dlen);
605 @@ -2203,7 +2255,10 @@ static int add_dirent_to_buf(handle_t *handle, struct ext4_filename *fname,
608 /* By now the buffer is marked for journaling */
609 - ext4_insert_dentry(dir, inode, de, blocksize, fname);
610 + /* If writing the short form of "dotdot", don't add the data section */
613 + ext4_insert_dentry(dir, inode, de, blocksize, fname, data);
616 * XXX shouldn't update any times until successful
617 @@ -2309,7 +2364,7 @@ static int make_indexed_dir(handle_t *handle, struct ext4_filename *fname,
620 /* initialize hashing info */
621 - dx_info = dx_get_dx_info(dot_de);
622 + dx_info = dx_get_dx_info(dot_de, dir);
623 memset(dx_info, 0, sizeof(*dx_info));
624 dx_info->info_length = sizeof(*dx_info);
625 if (ext4_hash_in_dirent(dir))
626 @@ -2320,7 +2375,8 @@ static int make_indexed_dir(handle_t *handle, struct ext4_filename *fname,
627 entries = (void *)dx_info + sizeof(*dx_info);
628 dx_set_block(entries, 1);
629 dx_set_count(entries, 1);
630 - dx_set_limit(entries, dx_root_limit(dir, sizeof(*dx_info)));
631 + dx_set_limit(entries, dx_root_limit(dir,
632 + dot_de, sizeof(*dx_info)));
634 /* Initialize as for dx_probe */
635 fname->hinfo.hash_version = dx_info->hash_version;
636 @@ -2361,7 +2417,7 @@ out_frames:
639 ext4_mark_inode_dirty(handle, dir);
640 - dx_release(frames);
641 + dx_release(frames, dir);
645 @@ -2374,6 +2430,8 @@ static int ext4_update_dotdot(handle_t *handle, struct dentry *dentry,
646 struct buffer_head *dir_block;
647 struct ext4_dir_entry_2 *de;
648 int len, journal = 0, err = 0;
653 return PTR_ERR(handle);
654 @@ -2389,21 +2447,26 @@ static int ext4_update_dotdot(handle_t *handle, struct dentry *dentry,
656 de = (struct ext4_dir_entry_2 *)dir_block->b_data;
657 /* the first item must be "." */
658 - assert(de->name_len == 1 && de->name[0] == '.');
659 + ASSERT(de->name_len == 1 && de->name[0] == '.');
660 len = le16_to_cpu(de->rec_len);
661 - assert(len >= EXT4_DIR_REC_LEN(1));
662 - if (len > EXT4_DIR_REC_LEN(1)) {
663 + ASSERT(len >= EXT4_DIR_REC_LEN(1, dir));
664 + if (len > EXT4_DIR_REC_LEN(1, dir)) {
665 BUFFER_TRACE(dir_block, "get_write_access");
666 err = ext4_journal_get_write_access(handle, dir->i_sb, dir_block, EXT4_JTR_NONE);
671 - de->rec_len = cpu_to_le16(EXT4_DIR_REC_LEN(1));
672 + de->rec_len = cpu_to_le16(EXT4_DIR_ENTRY_LEN(de, dir));
675 - len -= EXT4_DIR_REC_LEN(1);
676 - assert(len == 0 || len >= EXT4_DIR_REC_LEN(2));
677 + len -= EXT4_DIR_ENTRY_LEN(de, NULL);
678 + data = ext4_dentry_get_data(dir->i_sb,
679 + (struct ext4_dentry_param *)dentry->d_fsdata);
682 + ASSERT(len == 0 || len >= EXT4_DIR_REC_LEN(2 + dlen, dir));
684 de = (struct ext4_dir_entry_2 *)
685 ((char *) de + le16_to_cpu(de->rec_len));
687 @@ -2417,10 +2480,15 @@ static int ext4_update_dotdot(handle_t *handle, struct dentry *dentry,
689 de->rec_len = cpu_to_le16(len);
691 - assert(le16_to_cpu(de->rec_len) >= EXT4_DIR_REC_LEN(2));
692 + ASSERT(le16_to_cpu(de->rec_len) >= EXT4_DIR_REC_LEN(2, dir));
694 strcpy(de->name, "..");
695 - ext4_set_de_type(dir->i_sb, de, S_IFDIR);
696 + if (data != NULL && ext4_get_dirent_data_len(de) >= dlen) {
698 + memcpy(&de->name[2 + 1], data, *data);
699 + ext4_set_de_type(dir->i_sb, de, S_IFDIR);
700 + de->file_type |= EXT4_DIRENT_LUFID;
705 @@ -2458,6 +2526,7 @@ static int ext4_add_entry(handle_t *handle, struct dentry *dentry,
706 ext4_lblk_t block, blocks;
709 + EXT4_I(inode)->i_dirdata = dentry->d_fsdata;
710 if (ext4_has_metadata_csum(inode->i_sb))
711 csum_size = sizeof(struct ext4_dir_entry_tail);
713 @@ -2700,7 +2769,7 @@ again:
714 dx_set_count(entries, 1);
715 dx_set_block(entries + 0, newblock);
716 info = dx_get_dx_info((struct ext4_dir_entry_2 *)
717 - frames[0].bh->b_data);
718 + frames[0].bh->b_data, dir);
719 info->indirect_levels = 1;
720 dxtrace(printk(KERN_DEBUG
721 "Creating %d level index...\n",
722 @@ -2726,7 +2795,7 @@ journal_error:
723 ext4_std_error(dir->i_sb, err); /* this is a no-op if err == 0 */
726 - dx_release(frames);
727 + dx_release(frames, dir);
728 /* @restart is true means htree-path has been changed, we need to
729 * repeat dx_probe() to find out valid htree-path
731 @@ -3029,38 +3098,73 @@ err_unlock_inode:
736 + struct inode *inode;
741 struct ext4_dir_entry_2 *ext4_init_dot_dotdot(struct inode *inode,
742 struct ext4_dir_entry_2 *de,
743 int blocksize, int csum_size,
744 unsigned int parent_ino, int dotdot_real_len)
746 + void *data1 = NULL, *data2 = NULL;
747 + int dot_reclen = 0;
749 + if (dotdot_real_len == 10) {
750 + struct tp_block *tpb = (struct tp_block *)inode;
751 + data1 = tpb->data1;
752 + data2 = tpb->data2;
753 + inode = tpb->inode;
754 + dotdot_real_len = 0;
756 de->inode = cpu_to_le32(inode->i_ino);
758 - de->rec_len = ext4_rec_len_to_disk(ext4_dir_rec_len(de->name_len, NULL),
760 strcpy(de->name, ".");
761 ext4_set_de_type(inode->i_sb, de, S_IFDIR);
763 + /* get packed fid data*/
764 + data1 = ext4_dentry_get_data(inode->i_sb,
765 + (struct ext4_dentry_param *) data1);
768 + memcpy(&de->name[2], data1, *(char *) data1);
769 + de->file_type |= EXT4_DIRENT_LUFID;
771 + de->rec_len = cpu_to_le16(EXT4_DIR_ENTRY_LEN(de, NULL));
773 + dot_reclen = cpu_to_le16(de->rec_len);
774 de = ext4_next_entry(de, blocksize);
775 de->inode = cpu_to_le32(parent_ino);
778 + strcpy(de->name, "..");
779 + ext4_set_de_type(inode->i_sb, de, S_IFDIR);
780 + data2 = ext4_dentry_get_data(inode->i_sb,
781 + (struct ext4_dentry_param *) data2);
784 + memcpy(&de->name[3], data2, *(char *) data2);
785 + de->file_type |= EXT4_DIRENT_LUFID;
788 if (!dotdot_real_len)
789 de->rec_len = ext4_rec_len_to_disk(blocksize -
790 - (csum_size + ext4_dir_rec_len(1, NULL)),
792 + (csum_size + dot_reclen), blocksize);
794 de->rec_len = ext4_rec_len_to_disk(
795 - ext4_dir_rec_len(de->name_len, NULL),
796 + EXT4_DIR_ENTRY_LEN(de, NULL),
798 - strcpy(de->name, "..");
799 - ext4_set_de_type(inode->i_sb, de, S_IFDIR);
801 return ext4_next_entry(de, blocksize);
804 int ext4_init_new_dir(handle_t *handle, struct inode *dir,
805 - struct inode *inode)
806 + struct inode *inode,
807 + const void *data1, const void *data2)
809 + struct tp_block param;
810 struct buffer_head *dir_block = NULL;
811 struct ext4_dir_entry_2 *de;
812 ext4_lblk_t block = 0;
813 @@ -3084,7 +3188,11 @@ int ext4_init_new_dir(handle_t *handle, struct inode *dir,
814 if (IS_ERR(dir_block))
815 return PTR_ERR(dir_block);
816 de = (struct ext4_dir_entry_2 *)dir_block->b_data;
817 - ext4_init_dot_dotdot(inode, de, blocksize, csum_size, dir->i_ino, 0);
818 + param.inode = inode;
819 + param.data1 = (void *)data1;
820 + param.data2 = (void *)data2;
821 + ext4_init_dot_dotdot((struct inode *)(¶m), de, blocksize,
822 + csum_size, dir->i_ino, 10);
825 ext4_initialize_dirent_tail(dir_block, blocksize);
826 @@ -3099,6 +3207,29 @@ out:
830 +/* Initialize @inode as a subdirectory of @dir, and add the
831 + * "." and ".." entries into the first directory block. */
832 +int ext4_add_dot_dotdot(handle_t *handle, struct inode *dir,
833 + struct inode *inode,
834 + const void *data1, const void *data2)
838 + if (IS_ERR(handle))
839 + return PTR_ERR(handle);
841 + if (IS_DIRSYNC(dir))
842 + ext4_handle_sync(handle);
844 + inode->i_op = &ext4_dir_inode_operations;
845 + inode->i_fop = &ext4_dir_operations;
846 + rc = ext4_init_new_dir(handle, dir, inode, data1, data2);
848 + rc = ext4_mark_inode_dirty(handle, inode);
851 +EXPORT_SYMBOL(ext4_add_dot_dotdot);
853 static int ext4_mkdir(struct user_namespace *mnt_userns, struct inode *dir,
854 struct dentry *dentry, umode_t mode)
856 @@ -3126,7 +3257,7 @@ retry:
858 inode->i_op = &ext4_dir_inode_operations;
859 inode->i_fop = &ext4_dir_operations;
860 - err = ext4_init_new_dir(handle, dir, inode);
861 + err = ext4_init_new_dir(handle, dir, inode, NULL, NULL);
863 goto out_clear_inode;
864 err = ext4_mark_inode_dirty(handle, inode);
865 diff --git a/fs/ext4/super.c b/fs/ext4/super.c
866 index c013357d..1838ee86 100644
867 --- a/fs/ext4/super.c
868 +++ b/fs/ext4/super.c
869 @@ -1571,7 +1571,7 @@ enum {
870 Opt_data_err_abort, Opt_data_err_ignore, Opt_test_dummy_encryption,
872 Opt_usrjquota, Opt_grpjquota, Opt_quota,
873 - Opt_noquota, Opt_barrier, Opt_nobarrier, Opt_err,
874 + Opt_noquota, Opt_barrier, Opt_nobarrier, Opt_err, Opt_dirdata,
875 Opt_usrquota, Opt_grpquota, Opt_prjquota,
876 Opt_dax, Opt_dax_always, Opt_dax_inode, Opt_dax_never,
877 Opt_stripe, Opt_delalloc, Opt_nodelalloc, Opt_warn_on_error,
878 @@ -1687,6 +1687,7 @@ static const struct fs_parameter_spec ext4_param_specs[] = {
879 fsparam_u32 ("stripe", Opt_stripe),
880 fsparam_flag ("delalloc", Opt_delalloc),
881 fsparam_flag ("nodelalloc", Opt_nodelalloc),
882 + fsparam_flag ("dirdata", Opt_dirdata),
883 fsparam_flag ("warn_on_error", Opt_warn_on_error),
884 fsparam_flag ("nowarn_on_error", Opt_nowarn_on_error),
885 fsparam_u32 ("debug_want_extra_isize",
886 @@ -1823,6 +1824,7 @@ static const struct mount_opts {
887 MOPT_CLEAR | MOPT_Q},
888 {Opt_usrjquota, 0, MOPT_Q},
889 {Opt_grpjquota, 0, MOPT_Q},
890 + {Opt_dirdata, EXT4_MOUNT_DIRDATA, MOPT_SET},
891 {Opt_jqfmt, 0, MOPT_QFMT},
892 {Opt_nombcache, EXT4_MOUNT_NO_MBCACHE, MOPT_SET},
893 {Opt_no_prefetch_block_bitmaps, EXT4_MOUNT_NO_PREFETCH_BLOCK_BITMAPS,
894 @@ -3563,6 +3565,14 @@ int ext4_feature_set_ok(struct super_block *sb, int readonly)
898 + if ((ext4_has_feature_casefold(sb) || ext4_has_feature_encrypt(sb)) &&
899 + ext4_has_feature_dirdata(sb)) {
900 + ext4_msg(sb, KERN_ERR,
901 + "Filesystem with casefold and encrypt are incompatible "