2 * punch.c --- deallocate blocks allocated to an inode
4 * Copyright (C) 2010 Theodore Ts'o.
7 * This file may be redistributed under the terms of the GNU Library
8 * General Public License, version 2.
/*
 * check_zero_block() -- predicate over one raw block buffer.
 *   buf:       bytes of the block to examine
 *   blocksize: number of bytes to examine; the visible caller passes
 *              fs->blocksize
 * NOTE(review): only the signature is visible in this excerpt, so the scan
 * itself cannot be verified here; the note below is the stated contract.
 */
26 * This function returns 1 if the specified block is all zeros
28 static int check_zero_block(char *buf, int blocksize)
/*
 * ind_punch() -- free the mapped blocks referenced by one array of block
 * numbers, recursing into indirect blocks.
 *
 *   fs        filesystem handle passed through to the ext2fs_* helpers
 *   inode     inode whose block count is reduced by the number freed
 *   block_buf scratch space; an indirect block is read into it and the
 *             recursive call is handed block_buf + fs->blocksize
 *   p         first entry of the array of block numbers to walk
 *   level     indirection depth of the entries (the recursion passes
 *             level - 1 for the contents of an indirect block)
 *   start     first logical block to punch, relative to entry 0 of p
 *   count     length of the punch range
 *   max       number of entries in p
 *
 * Returns whatever ext2fs_iblk_sub_blocks() returns for the freed total.
 *
 * NOTE(review): several control-flow lines (early returns, break/continue,
 * braces) are not visible in this excerpt, so the actions taken on the
 * tests below are deliberately not described.
 */
42 * This clever recursive function handles i_blocks[] as well as
43 * indirect, double indirect, and triple indirect blocks. It iterates
44 * over the entries in the i_blocks array or indirect blocks, and for
45 * each one, will recursively handle any indirect blocks and then
46 * frees and deallocates the blocks.
48 static errcode_t ind_punch(ext2_filsys fs, struct ext2_inode *inode,
49 char *block_buf, blk_t *p, int level,
50 blk64_t start, blk64_t count, int max)
59 printf("Entering ind_punch, level %d, start %llu, count %llu, "
60 "max %d\n", level, start, count, max);
/* Logical blocks spanned by one entry at this level; 1 when level is 0. */
62 incr = 1ULL << ((EXT2_BLOCK_SIZE_BITS(fs->super) - 2) * level);
/* offset tracks the logical block at which entry i begins. */
63 for (i = 0, offset = 0; i < max; i++, p++, offset += incr) {
/* Entry begins at or after the end of the punch range. */
64 if (offset >= start + count)
/* Entry is unmapped (zero) or ends at or before the start of the range. */
66 if (*p == 0 || (offset+incr) <= start)
72 printf("Reading indirect block %u\n", b);
74 retval = ext2fs_read_ind_block(fs, b, block_buf);
/* Rebase start so it is relative to this entry; clamp at 0. */
77 start2 = (start > offset) ? start - offset : 0;
78 retval = ind_punch(fs, inode, block_buf + fs->blocksize,
79 (blk_t *) block_buf, level - 1,
80 start2, count - offset,
/* Write the indirect block back after the lower level has processed it. */
84 retval = ext2fs_write_ind_block(fs, b, block_buf);
/*
 * NOTE(review): presumably an indirect block that is not all zeros is kept
 * rather than freed -- the branch body is not visible here; confirm.
 */
87 if (!check_zero_block(block_buf, fs->blocksize))
91 printf("Freeing block %u (offset %llu)\n", b, offset);
/* Adjust the allocation statistics for block b by -1. */
93 ext2fs_block_alloc_stats(fs, b, -1);
98 printf("Freed %d blocks\n", freed);
/* Subtract the freed total from the inode block count. */
100 return ext2fs_iblk_sub_blocks(fs, inode, freed);
/*
 * BLK_T_MAX is ~0ULL converted to blk_t, i.e. the all-ones blk_t value.
 *
 * ext2fs_punch_ind() -- punch logical blocks start..end (inclusive) out of
 * an inode that uses the i_block[] / indirect block map.
 *
 *   fs        filesystem handle
 *   inode     inode being modified; its i_block array is the level 0 table
 *   block_buf scratch buffer handed to ind_punch()
 *   start     first logical block to punch
 *   end       last logical block to punch
 *
 * The visible code walks levels 0..3 and calls ind_punch() for a level.
 * NOTE(review): a 3 * blocksize array is also allocated into buf and
 * released with ext2fs_free_mem(); how buf relates to block_buf, and the
 * per-level conditions and return paths, are not visible in this excerpt.
 */
103 #define BLK_T_MAX ((blk_t)~0ULL)
104 static errcode_t ext2fs_punch_ind(ext2_filsys fs, struct ext2_inode *inode,
105 char *block_buf, blk64_t start, blk64_t end)
/* Level 0 is the EXT2_NDIR_BLOCKS direct entries held in inode->i_block. */
110 int num = EXT2_NDIR_BLOCKS;
111 blk_t *bp = inode->i_block;
112 blk_t addr_per_block;
113 blk64_t max = EXT2_NDIR_BLOCKS;
116 /* Check start/end don't overflow the 2^32-1 indirect block limit */
117 if (start > BLK_T_MAX)
/* Clamp the range so that start + count stays within BLK_T_MAX. */
119 if (end >= BLK_T_MAX || end - start + 1 >= BLK_T_MAX)
120 count = BLK_T_MAX - start;
/* Otherwise the inclusive range start..end holds end - start + 1 blocks. */
122 count = end - start + 1;
/* Scratch space: three buffers of fs->blocksize bytes each. */
125 retval = ext2fs_get_array(3, fs->blocksize, &buf);
/* Block numbers per indirect block: blocksize / 4. */
131 addr_per_block = (blk_t)fs->blocksize >> 2;
/* Levels 0..3; max is multiplied by addr_per_block after each level. */
133 for (level = 0; level < 4; level++, max *= (blk64_t)addr_per_block) {
135 printf("Main loop level %d, start %llu count %u "
136 "max %llu num %d\n", level, start, count, max, num);
139 retval = ind_punch(fs, inode, block_buf, bp, level,
/*
 * NOTE(review): the statements surrounding this adjustment are not visible;
 * it reduces count by the distance from start to max -- confirm the guard.
 */
144 count -= max - start;
159 ext2fs_free_mem(&buf);
/*
 * Debug helpers. Two alternative sets of definitions appear below: one that
 * prints via printf/fputs, and one that expands to empty statements.
 * NOTE(review): the preprocessor conditionals that select between the two
 * sets are not visible in this excerpt.
 */
/* Printing variant: dbg_printf forwards its format and arguments to printf. */
166 #define dbg_printf(f, a...) printf(f, ## a)
/*
 * dbg_print_extent() -- print one extent to stdout: the desc label, the
 * logical range e_lblk .. e_lblk + e_len - 1, the length, the physical
 * start block e_pblk, and a word for each flag that is set.
 */
168 static void dbg_print_extent(char *desc, struct ext2fs_extent *extent)
171 printf("%s: ", desc);
172 printf("extent: lblk %llu--%llu, len %u, pblk %llu, flags: ",
173 extent->e_lblk, extent->e_lblk + extent->e_len - 1,
174 extent->e_len, extent->e_pblk);
175 if (extent->e_flags & EXT2_EXTENT_FLAGS_LEAF)
176 fputs("LEAF ", stdout);
177 if (extent->e_flags & EXT2_EXTENT_FLAGS_UNINIT)
178 fputs("UNINIT ", stdout);
179 if (extent->e_flags & EXT2_EXTENT_FLAGS_SECOND_VISIT)
180 fputs("2ND_VISIT ", stdout);
/* No flag bits set at all. */
181 if (!extent->e_flags)
182 fputs("(none)", stdout);
/* Silent variant: both helpers expand to an empty statement. */
187 #define dbg_print_extent(desc, ex) do { } while (0)
188 #define dbg_printf(f, a...) do { } while (0)
/*
 * punch_extent_blocks() -- release a run of physical blocks that backed a
 * punched part of an extent.
 *
 *   fs           filesystem handle
 *   ino, inode   owner of the blocks; passed to ext2fs_map_cluster_block()
 *   lfree_start  logical block number matching free_start
 *   free_start   first physical block to release
 *   free_count   number of blocks in the run
 *   freed        running total updated by this function
 *
 * When the cluster ratio is 1 every block is released individually and
 * free_count is added to *freed. Otherwise the run is handled in three
 * phases: the partial cluster at the front, whole clusters in the middle,
 * and the partial cluster at the end.
 *
 * NOTE(review): the arguments and result handling of the
 * ext2fs_map_cluster_block() calls, the updates of *freed in the cluster
 * phases, and the return statements are not visible in this excerpt.
 */
191 /* Free a range of blocks, respecting cluster boundaries */
192 static errcode_t punch_extent_blocks(ext2_filsys fs, ext2_ino_t ino,
193 struct ext2_inode *inode,
194 blk64_t lfree_start, blk64_t free_start,
195 __u32 free_count, int *freed)
200 errcode_t retval = 0;
202 /* No bigalloc? Just free each block. */
203 if (EXT2FS_CLUSTER_RATIO(fs) == 1) {
204 *freed += free_count;
205 while (free_count-- > 0)
206 ext2fs_block_alloc_stats2(fs, free_start++, -1);
211 * Try to free up to the next cluster boundary. We assume that all
212 * blocks in a logical cluster map to blocks from the same physical
213 * cluster, and that the offsets within the [pl]clusters match.
/* Non-zero mask bits mean free_start is not on a cluster boundary. */
215 if (free_start & EXT2FS_CLUSTER_MASK(fs)) {
216 retval = ext2fs_map_cluster_block(fs, ino, inode,
221 ext2fs_block_alloc_stats2(fs, free_start, -1);
/* Blocks from free_start to the end of its cluster, capped at free_count. */
224 cluster_freed = EXT2FS_CLUSTER_RATIO(fs) -
225 (free_start & EXT2FS_CLUSTER_MASK(fs));
226 if (cluster_freed > free_count)
227 cluster_freed = free_count;
/* Advance all three cursors past the portion just handled. */
228 free_count -= cluster_freed;
229 free_start += cluster_freed;
230 lfree_start += cluster_freed;
233 /* Free whole clusters from the middle of the range. */
234 while (free_count > 0 && free_count >= EXT2FS_CLUSTER_RATIO(fs)) {
235 ext2fs_block_alloc_stats2(fs, free_start, -1);
237 cluster_freed = EXT2FS_CLUSTER_RATIO(fs);
238 free_count -= cluster_freed;
239 free_start += cluster_freed;
240 lfree_start += cluster_freed;
243 /* Try to free the last cluster. */
/* Fewer than a full cluster of blocks remains at this point. */
244 if (free_count > 0) {
245 retval = ext2fs_map_cluster_block(fs, ino, inode,
250 ext2fs_block_alloc_stats2(fs, free_start, -1);
/*
 * ext2fs_punch_extent() -- punch logical blocks start..end out of an
 * extent-mapped inode.
 *
 * Visible flow:
 *   1. Open an extent handle for the inode and seek towards start.
 *   2. For each extent reached, one of three cases applies:
 *        Case 1: start <= extent.e_lblk -- blocks are removed from the
 *                front of the extent (e_lblk and e_pblk move forward by
 *                free_count and e_len shrinks by the same amount).
 *        Case 2: end >= next - 1 -- the extent is shortened to
 *                newlen = start - e_lblk and the remainder is freed.
 *        Case 3: the range lies inside the extent -- a new extent newex
 *                covering end + 1 .. next - 1 is inserted after the current
 *                one, and the current one is cut so it stops before start.
 *   3. The adjusted extent is either written back with
 *      ext2fs_extent_replace() or removed with ext2fs_extent_delete().
 *   4. The physical blocks are released through punch_extent_blocks(),
 *      which accumulates into freed.
 *   5. After the loop, freed is subtracted from the inode block count via
 *      ext2fs_iblk_sub_blocks() and the handle is released.
 *
 * NOTE(review): the loop construct, error checks, gotos/returns and several
 * branch conditions are not visible in this excerpt; statements about which
 * branch runs when are limited to what the remaining lines show.
 */
260 static errcode_t ext2fs_punch_extent(ext2_filsys fs, ext2_ino_t ino,
261 struct ext2_inode *inode,
262 blk64_t start, blk64_t end)
264 ext2_extent_handle_t handle = 0;
265 struct ext2fs_extent extent;
267 blk64_t free_start, next, lfree_start;
268 __u32 free_count, newlen;
272 retval = ext2fs_extent_open2(fs, ino, inode, &handle);
276 * Find the extent closest to the start of the punch range. We don't
277 * check the return value because _goto() sets the current node to the
278 * next-lowest extent if 'start' is in a hole, and doesn't set a
279 * current node if there was a real error reading the extent tree.
280 * In that case, _get() will error out.
282 * Note: If _get() returns 'no current node', that simply means that
283 * there aren't any blocks mapped past this point in the file, so we're
286 ext2fs_extent_goto(handle, start);
287 retval = ext2fs_extent_get(handle, EXT2_EXTENT_CURRENT, &extent);
288 if (retval == EXT2_ET_NO_CURRENT_NODE) {
/*
 * Default way to advance at the bottom of the loop; the delete path below
 * switches op to EXT2_EXTENT_CURRENT after repositioning the handle itself.
 */
294 op = EXT2_EXTENT_NEXT_LEAF;
295 dbg_print_extent("main loop", &extent);
/* next is the first logical block after the current extent. */
296 next = extent.e_lblk + extent.e_len;
297 dbg_printf("start %llu, end %llu, next %llu\n",
298 (unsigned long long) start,
299 (unsigned long long) end,
300 (unsigned long long) next);
301 if (start <= extent.e_lblk) {
303 * Have we iterated past the end of the punch region?
304 * If so, we can stop.
306 if (end < extent.e_lblk)
308 dbg_printf("Case #%d\n", 1);
309 /* Start of deleted region before extent;
310 adjust beginning of extent */
311 free_start = extent.e_pblk;
312 lfree_start = extent.e_lblk;
314 free_count = end - extent.e_lblk + 1;
316 free_count = extent.e_len;
317 extent.e_len -= free_count;
318 extent.e_lblk += free_count;
319 extent.e_pblk += free_count;
320 } else if (end >= next-1) {
322 * Is the punch region beyond this extent? This can
323 * happen if start is already inside a hole. Try to
324 * advance to the next extent if this is the case.
328 /* End of deleted region after extent;
329 adjust end of extent */
330 dbg_printf("Case #%d\n", 2);
331 newlen = start - extent.e_lblk;
332 free_start = extent.e_pblk + newlen;
333 lfree_start = extent.e_lblk + newlen;
334 free_count = extent.e_len - newlen;
335 extent.e_len = newlen;
337 struct ext2fs_extent newex;
339 dbg_printf("Case #%d\n", 3);
340 /* The hard case; we need to split the extent */
/* newex is the surviving tail: logical end + 1 .. next - 1. */
341 newex.e_pblk = extent.e_pblk +
342 (end + 1 - extent.e_lblk);
343 newex.e_lblk = end + 1;
344 newex.e_len = next - end - 1;
345 newex.e_flags = extent.e_flags;
/* The current extent keeps only the blocks before start. */
347 extent.e_len = start - extent.e_lblk;
348 free_start = extent.e_pblk + extent.e_len;
349 lfree_start = extent.e_lblk + extent.e_len;
350 free_count = end - start + 1;
352 dbg_print_extent("inserting", &newex);
353 retval = ext2fs_extent_insert(handle,
354 EXT2_EXTENT_INSERT_AFTER, &newex);
357 retval = ext2fs_extent_fix_parents(handle);
361 * Now pointing at inserted extent; so go back.
363 * We cannot use EXT2_EXTENT_PREV to go back; note the
364 * subtlety in the comment for fix_parents().
366 retval = ext2fs_extent_goto(handle, extent.e_lblk);
/*
 * Replace path: write the adjusted extent over the current node, then call
 * ext2fs_extent_fix_parents().
 */
371 dbg_print_extent("replacing", &extent);
372 retval = ext2fs_extent_replace(handle, 0, &extent);
375 retval = ext2fs_extent_fix_parents(handle);
/*
 * Delete path.
 * NOTE(review): presumably taken when the adjusted extent has no blocks
 * left; the selecting condition is not visible here -- confirm.
 */
377 struct ext2fs_extent newex;
378 blk64_t old_lblk, next_lblk;
379 dbg_printf("deleting current extent%s\n", "");
382 * Save the location of the next leaf, then slip
383 * back to the current extent.
385 retval = ext2fs_extent_get(handle, EXT2_EXTENT_CURRENT,
389 old_lblk = newex.e_lblk;
391 retval = ext2fs_extent_get(handle,
392 EXT2_EXTENT_NEXT_LEAF,
/* With no next leaf, fall back to the current position. */
394 if (retval == EXT2_ET_EXTENT_NO_NEXT)
395 next_lblk = old_lblk;
399 next_lblk = newex.e_lblk;
401 retval = ext2fs_extent_goto(handle, old_lblk);
405 /* Now delete the extent. */
406 retval = ext2fs_extent_delete(handle, 0);
410 retval = ext2fs_extent_fix_parents(handle);
/* EXT2_ET_NO_CURRENT_NODE from fix_parents is excluded from this test. */
411 if (retval && retval != EXT2_ET_NO_CURRENT_NODE)
415 /* Jump forward to the next extent. */
416 ext2fs_extent_goto(handle, next_lblk);
417 op = EXT2_EXTENT_CURRENT;
421 dbg_printf("Free start %llu, free count = %u\n",
422 free_start, free_count);
/* Release the physical blocks selected by the case handling above. */
423 retval = punch_extent_blocks(fs, ino, inode, lfree_start,
424 free_start, free_count, &freed);
/* Fetch the extent to examine next, as selected by op. */
428 retval = ext2fs_extent_get(handle, op,
430 if (retval == EXT2_ET_EXTENT_NO_NEXT ||
431 retval == EXT2_ET_NO_CURRENT_NODE)
436 dbg_printf("Freed %d blocks\n", freed);
/* Subtract the freed total from the inode block count. */
437 retval = ext2fs_iblk_sub_blocks(fs, inode, freed);
439 ext2fs_extent_free(handle);
/*
 * ext2fs_punch() -- entry point for punching a range of logical blocks out
 * of an inode.
 *
 *   fs         filesystem handle
 *   ino        inode number; used to read and to write back the inode
 *   inode      inode structure to operate on
 *   block_buf  scratch buffer forwarded to the indirect-block path
 *   start,end  inclusive logical block range (see the note below)
 *
 * Inodes with EXT4_EXTENTS_FL set go through ext2fs_punch_extent(); all
 * others go through ext2fs_punch_ind(). The function returns the result of
 * ext2fs_write_inode() on the path that reaches the final line.
 *
 * NOTE(review): the end of the parameter list, the condition guarding the
 * ext2fs_read_inode() call into inode_buf, and the error checks are not
 * visible in this excerpt.
 */
444 * Deallocate all logical _blocks_ starting at start to end, inclusive.
445 * If end is ~0ULL, then this is effectively truncate.
447 errcode_t ext2fs_punch(ext2_filsys fs, ext2_ino_t ino,
448 struct ext2_inode *inode,
449 char *block_buf, blk64_t start,
453 struct ext2_inode inode_buf;
458 /* Read inode structure if necessary */
460 retval = ext2fs_read_inode(fs, ino, &inode_buf);
/* Dispatch on the mapping scheme used by the inode. */
465 if (inode->i_flags & EXT4_EXTENTS_FL)
466 retval = ext2fs_punch_extent(fs, ino, inode, start, end);
468 retval = ext2fs_punch_ind(fs, inode, block_buf, start, end);
473 printf("%u: write inode size now %u blocks %u\n",
474 ino, inode->i_size, inode->i_blocks);
/* Persist the updated inode. */
476 return ext2fs_write_inode(fs, ino, inode);