2 * punch.c --- deallocate blocks allocated to an inode
4 * Copyright (C) 2010 Theodore Ts'o.
7 * This file may be redistributed under the terms of the GNU Library
8 * General Public License, version 2.
27 * This function returns 1 if the specified block is all zeros
29 static int check_zero_block(char *buf, int blocksize)
43 * This clever recursive function handles i_block[] as well as
44 * indirect, double indirect, and triple indirect blocks. It iterates
45 * over the entries in the i_block array or indirect blocks, and for
46 * each one, recursively handles any indirect blocks and then
47 * frees and deallocates the blocks.
49 static errcode_t ind_punch(ext2_filsys fs, struct ext2_inode *inode,
50 char *block_buf, blk_t *p, int level,
51 blk_t start, blk_t count, int max)
60 printf("Entering ind_punch, level %d, start %u, count %u, "
61 "max %d\n", level, start, count, max);
63 incr = 1ULL << ((EXT2_BLOCK_SIZE_BITS(fs->super)-2)*level);
64 for (i=0, offset=0; i < max; i++, p++, offset += incr) {
65 if (offset >= start + count)
67 if (*p == 0 || (offset+incr) <= start)
73 printf("Reading indirect block %u\n", b);
75 retval = ext2fs_read_ind_block(fs, b, block_buf);
78 start2 = (start > offset) ? start - offset : 0;
79 retval = ind_punch(fs, inode, block_buf + fs->blocksize,
80 (blk_t *) block_buf, level - 1,
81 start2, count - offset,
85 retval = ext2fs_write_ind_block(fs, b, block_buf);
88 if (!check_zero_block(block_buf, fs->blocksize))
92 printf("Freeing block %u (offset %llu)\n", b, offset);
94 ext2fs_block_alloc_stats(fs, b, -1);
99 printf("Freed %d blocks\n", freed);
101 return ext2fs_iblk_sub_blocks(fs, inode, freed);
104 static errcode_t ext2fs_punch_ind(ext2_filsys fs, struct ext2_inode *inode,
105 char *block_buf, blk_t start, blk_t count)
110 int num = EXT2_NDIR_BLOCKS;
111 blk_t *bp = inode->i_block;
112 blk_t addr_per_block;
113 blk64_t max = EXT2_NDIR_BLOCKS;
116 retval = ext2fs_get_array(3, fs->blocksize, &buf);
122 addr_per_block = (blk_t) fs->blocksize >> 2;
124 for (level = 0; level < 4; level++, max *= (blk64_t)addr_per_block) {
126 printf("Main loop level %d, start %u count %u "
127 "max %llu num %d\n", level, start, count, max, num);
130 retval = ind_punch(fs, inode, block_buf, bp, level,
135 count -= max - start;
150 ext2fs_free_mem(&buf);
156 #define dbg_printf(f, a...) printf(f, ## a)
158 static void dbg_print_extent(char *desc, struct ext2fs_extent *extent)
161 printf("%s: ", desc);
162 printf("extent: lblk %llu--%llu, len %u, pblk %llu, flags: ",
163 extent->e_lblk, extent->e_lblk + extent->e_len - 1,
164 extent->e_len, extent->e_pblk);
165 if (extent->e_flags & EXT2_EXTENT_FLAGS_LEAF)
166 fputs("LEAF ", stdout);
167 if (extent->e_flags & EXT2_EXTENT_FLAGS_UNINIT)
168 fputs("UNINIT ", stdout);
169 if (extent->e_flags & EXT2_EXTENT_FLAGS_SECOND_VISIT)
170 fputs("2ND_VISIT ", stdout);
171 if (!extent->e_flags)
172 fputs("(none)", stdout);
177 #define dbg_print_extent(desc, ex) do { } while (0)
178 #define dbg_printf(f, a...) do { } while (0)
181 /* Free a range of blocks, respecting cluster boundaries */
182 static errcode_t punch_extent_blocks(ext2_filsys fs, ext2_ino_t ino,
183 struct ext2_inode *inode,
184 blk64_t lfree_start, blk64_t free_start,
185 __u32 free_count, int *freed)
190 errcode_t retval = 0;
192 /* No bigalloc? Just free each block. */
193 if (EXT2FS_CLUSTER_RATIO(fs) == 1) {
194 *freed += free_count;
195 while (free_count-- > 0)
196 ext2fs_block_alloc_stats2(fs, free_start++, -1);
201 * Try to free up to the next cluster boundary. We assume that all
202 * blocks in a logical cluster map to blocks from the same physical
203 * cluster, and that the offsets within the [pl]clusters match.
205 if (free_start & EXT2FS_CLUSTER_MASK(fs)) {
206 retval = ext2fs_map_cluster_block(fs, ino, inode,
211 ext2fs_block_alloc_stats2(fs, free_start, -1);
214 cluster_freed = EXT2FS_CLUSTER_RATIO(fs) -
215 (free_start & EXT2FS_CLUSTER_MASK(fs));
216 if (cluster_freed > free_count)
217 cluster_freed = free_count;
218 free_count -= cluster_freed;
219 free_start += cluster_freed;
220 lfree_start += cluster_freed;
223 /* Free whole clusters from the middle of the range. */
224 while (free_count > 0 && free_count >= EXT2FS_CLUSTER_RATIO(fs)) {
225 ext2fs_block_alloc_stats2(fs, free_start, -1);
227 cluster_freed = EXT2FS_CLUSTER_RATIO(fs);
228 free_count -= cluster_freed;
229 free_start += cluster_freed;
230 lfree_start += cluster_freed;
233 /* Try to free the last cluster. */
234 if (free_count > 0) {
235 retval = ext2fs_map_cluster_block(fs, ino, inode,
240 ext2fs_block_alloc_stats2(fs, free_start, -1);
250 static errcode_t ext2fs_punch_extent(ext2_filsys fs, ext2_ino_t ino,
251 struct ext2_inode *inode,
252 blk64_t start, blk64_t end)
254 ext2_extent_handle_t handle = 0;
255 struct ext2fs_extent extent;
257 blk64_t free_start, next, lfree_start;
258 __u32 free_count, newlen;
262 retval = ext2fs_extent_open2(fs, ino, inode, &handle);
266 * Find the extent closest to the start of the punch range. We don't
267 * check the return value because _goto() sets the current node to the
268 * next-lowest extent if 'start' is in a hole, and doesn't set a
269 * current node if there was a real error reading the extent tree.
270 * In that case, _get() will error out.
272 * Note: If _get() returns 'no current node', that simply means that
273 * there aren't any blocks mapped past this point in the file, so we're
276 ext2fs_extent_goto(handle, start);
277 retval = ext2fs_extent_get(handle, EXT2_EXTENT_CURRENT, &extent);
278 if (retval == EXT2_ET_NO_CURRENT_NODE) {
284 op = EXT2_EXTENT_NEXT_LEAF;
285 dbg_print_extent("main loop", &extent);
286 next = extent.e_lblk + extent.e_len;
287 dbg_printf("start %llu, end %llu, next %llu\n",
288 (unsigned long long) start,
289 (unsigned long long) end,
290 (unsigned long long) next);
291 if (start <= extent.e_lblk) {
293 * Have we iterated past the end of the punch region?
294 * If so, we can stop.
296 if (end < extent.e_lblk)
298 dbg_printf("Case #%d\n", 1);
299 /* Start of deleted region before extent;
300 adjust beginning of extent */
301 free_start = extent.e_pblk;
302 lfree_start = extent.e_lblk;
304 free_count = end - extent.e_lblk + 1;
306 free_count = extent.e_len;
307 extent.e_len -= free_count;
308 extent.e_lblk += free_count;
309 extent.e_pblk += free_count;
310 } else if (end >= next-1) {
312 * Is the punch region beyond this extent? This can
313 * happen if start is already inside a hole. Try to
314 * advance to the next extent if this is the case.
318 /* End of deleted region after extent;
319 adjust end of extent */
320 dbg_printf("Case #%d\n", 2);
321 newlen = start - extent.e_lblk;
322 free_start = extent.e_pblk + newlen;
323 lfree_start = extent.e_lblk + newlen;
324 free_count = extent.e_len - newlen;
325 extent.e_len = newlen;
327 struct ext2fs_extent newex;
329 dbg_printf("Case #%d\n", 3);
330 /* The hard case; we need to split the extent */
331 newex.e_pblk = extent.e_pblk +
332 (end + 1 - extent.e_lblk);
333 newex.e_lblk = end + 1;
334 newex.e_len = next - end - 1;
335 newex.e_flags = extent.e_flags;
337 extent.e_len = start - extent.e_lblk;
338 free_start = extent.e_pblk + extent.e_len;
339 lfree_start = extent.e_lblk + extent.e_len;
340 free_count = end - start + 1;
342 dbg_print_extent("inserting", &newex);
343 retval = ext2fs_extent_insert(handle,
344 EXT2_EXTENT_INSERT_AFTER, &newex);
347 retval = ext2fs_extent_fix_parents(handle);
351 * Now pointing at inserted extent; so go back.
353 * We cannot use EXT2_EXTENT_PREV to go back; note the
354 * subtlety in the comment for fix_parents().
356 retval = ext2fs_extent_goto(handle, extent.e_lblk);
361 dbg_print_extent("replacing", &extent);
362 retval = ext2fs_extent_replace(handle, 0, &extent);
365 retval = ext2fs_extent_fix_parents(handle);
367 struct ext2fs_extent newex;
368 blk64_t old_lblk, next_lblk;
369 dbg_printf("deleting current extent%s\n", "");
372 * Save the location of the next leaf, then slip
373 * back to the current extent.
375 retval = ext2fs_extent_get(handle, EXT2_EXTENT_CURRENT,
379 old_lblk = newex.e_lblk;
381 retval = ext2fs_extent_get(handle,
382 EXT2_EXTENT_NEXT_LEAF,
384 if (retval == EXT2_ET_EXTENT_NO_NEXT)
385 next_lblk = old_lblk;
389 next_lblk = newex.e_lblk;
391 retval = ext2fs_extent_goto(handle, old_lblk);
395 /* Now delete the extent. */
396 retval = ext2fs_extent_delete(handle, 0);
400 retval = ext2fs_extent_fix_parents(handle);
401 if (retval && retval != EXT2_ET_NO_CURRENT_NODE)
405 /* Jump forward to the next extent. */
406 ext2fs_extent_goto(handle, next_lblk);
407 op = EXT2_EXTENT_CURRENT;
411 dbg_printf("Free start %llu, free count = %u\n",
412 free_start, free_count);
413 retval = punch_extent_blocks(fs, ino, inode, lfree_start,
414 free_start, free_count, &freed);
418 retval = ext2fs_extent_get(handle, op,
420 if (retval == EXT2_ET_EXTENT_NO_NEXT ||
421 retval == EXT2_ET_NO_CURRENT_NODE)
426 dbg_printf("Freed %d blocks\n", freed);
427 retval = ext2fs_iblk_sub_blocks(fs, inode, freed);
429 ext2fs_extent_free(handle);
433 static errcode_t ext2fs_punch_inline_data(ext2_filsys fs, ext2_ino_t ino,
434 struct ext2_inode *inode,
435 blk64_t start, blk64_t end)
440 * In libext2fs, ext2fs_punch operates in units of blocks. That
441 * means that if start > 0 we don't need to do anything. Due
442 * to this we will remove all inline data in ext2fs_punch()
448 memset((char *)inode->i_block, 0, EXT4_MIN_INLINE_DATA_SIZE);
450 retval = ext2fs_write_inode(fs, ino, inode);
454 return ext2fs_inline_data_ea_remove(fs, ino);
458 * Deallocate all logical blocks from start to end, inclusive.
459 * If end is ~0, then this is effectively a truncate.
461 errcode_t ext2fs_punch(ext2_filsys fs, ext2_ino_t ino,
462 struct ext2_inode *inode,
463 char *block_buf, blk64_t start,
467 struct ext2_inode inode_buf;
472 /* Read inode structure if necessary */
474 retval = ext2fs_read_inode(fs, ino, &inode_buf);
479 if (inode->i_flags & EXT4_INLINE_DATA_FL)
480 return ext2fs_punch_inline_data(fs, ino, inode, start, end);
481 else if (inode->i_flags & EXT4_EXTENTS_FL)
482 retval = ext2fs_punch_extent(fs, ino, inode, start, end);
490 count = ((end - start + 1) < ~0U) ? (end - start + 1) : ~0U;
491 retval = ext2fs_punch_ind(fs, inode, block_buf,
492 (blk_t) start, count);
497 return ext2fs_write_inode(fs, ino, inode);