lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-Id: <8B852D41-28F6-4280-9DF0-7A370ADC5B2D@dilger.ca>
Date:	Fri, 4 Dec 2015 15:06:04 -0700
From:	Andreas Dilger <adilger@...ger.ca>
To:	"Darrick J. Wong" <darrick.wong@...cle.com>
Cc:	Theodore Ts'o <tytso@....edu>, linux-ext4@...r.kernel.org
Subject: Re: [PATCH v2] filefrag: accommodate holes when calculating expected values

On Dec 3, 2015, at 1:37 PM, Darrick J. Wong <darrick.wong@...cle.com> wrote:
> 
> Currently, filefrag's "expected physical block" column expects extent
> records to be physically adjacent regardless of the amount of logical
> block space between the two records.  This means that if we punch a
> hole in a file, we get reports like this:
> 
> ext:   logical_offset:   physical_offset: length:  expected: flags:
> 4:     4096..    8343:   57376..  61623:   4248:
> 5:     8345..   10313:   61625..  63593:   1969:   61624:
> 
> Notice how it expects 8345 to map to 61624, and scores this against
> the fragmentation of the file.  Flagging this as "unexpected" is
> incorrect because the gap in the logical mapping is exactly the same
> size as the gap in the physical extents.
> 
> Furthermore, this particular mapping leaves the door open to the
> optimal mapping -- if a write to block 8344 causes it to be mapped to
> 61624, the entire range 4096-10313 can be mapped with a single extent.
> Until that happens, there's no way to combine extents 4 and 5 because
> of the gap in the logical mapping at block 8344.
> 
> Therefore, tweak the extent report to account for holes.
> 
> v2: Make it work for extents crossing FIEMAP calls, and clean up the
> FIBMAP version to report correct expected values.
> 
> Signed-off-by: Darrick J. Wong <darrick.wong@...cle.com>
> ---
> misc/filefrag.c |   74 +++++++++++++++++++++++++++++++++----------------------
> 1 file changed, 45 insertions(+), 29 deletions(-)
> 
> diff --git a/misc/filefrag.c b/misc/filefrag.c
> index 5bcde91..5ad6ee0 100644
> --- a/misc/filefrag.c
> +++ b/misc/filefrag.c
> @@ -208,6 +208,7 @@ static int filefrag_fiemap(int fd, int blk_shift, int *num_extents,
> 	__u64 buf[2048];	/* __u64 for proper field alignment */
> 	struct fiemap *fiemap = (struct fiemap *)buf;
> 	struct fiemap_extent *fm_ext = &fiemap->fm_extents[0];
> +	struct fiemap_extent fm_last;
> 	int count = (sizeof(buf) - sizeof(*fiemap)) /
> 			sizeof(struct fiemap_extent);
> 	unsigned long long expected = 0;
> @@ -219,6 +220,7 @@ static int filefrag_fiemap(int fd, int blk_shift, int *num_extents,
> 	int rc;
> 
> 	memset(fiemap, 0, sizeof(struct fiemap));
> +	memset(&fm_last, 0, sizeof(struct fiemap_extent));

This could just be an initializer at declaration time?

> 	if (sync_file)
> 		flags |= FIEMAP_FLAG_SYNC;
> @@ -254,6 +256,8 @@ static int filefrag_fiemap(int fd, int blk_shift, int *num_extents,
> 		}
> 
> 		for (i = 0; i < fiemap->fm_mapped_extents; i++) {
> +			expected = fm_last.fe_physical +
> +				   fm_ext[i].fe_logical - fm_last.fe_logical;

Does it make sense to allow two "expected" values? Either the sparse one that
leaves a gap for the block, or the dense one that packs physical blocks adjacent
to each other seem acceptable, depending on the application.  It doesn't make
sense to preserve holes in files that are never going to be modified in-place
(e.g. core dump or something).  Something like:

			expected_dense = fm_last.fe_physical + fm_last.fe_length;
			expected_sparse = fm_last.fe_physical +
				   fm_ext[i].fe_logical - fm_last.fe_logical;

			if (fm_ext[i].fe_logical != 0 &&
			    fm_ext[i].fe_physical != expected_dense &&
			    fm_ext[i].fe_physical != expected_sparse) {
				tot_extents++;

Cheers, Andreas

> @@ -265,10 +269,9 @@ static int filefrag_fiemap(int fd, int blk_shift, int *num_extents,
> 			if (verbose)
> 				print_extent_info(&fm_ext[i], n, expected,
> 						  blk_shift, st);
> -
> -			expected = fm_ext[i].fe_physical + fm_ext[i].fe_length;
> 			if (fm_ext[i].fe_flags & FIEMAP_EXTENT_LAST)
> 				last = 1;
> +			fm_last = fm_ext[i];
> 			n++;
> 		}
> 
> @@ -287,14 +290,15 @@ static int filefrag_fibmap(int fd, int blk_shift, int *num_extents,
> 			   ext2fs_struct_stat *st,
> 			   unsigned long numblocks, int is_ext2)
> {
> -	struct fiemap_extent	fm_ext;
> +	struct fiemap_extent	fm_ext, fm_last;
> 	unsigned long		i, last_block;
> -	unsigned long long	logical;
> +	unsigned long long	logical, expected = 0;
> 				/* Blocks per indirect block */
> 	const long		bpib = st->st_blksize / 4;
> 	int			count;
> 
> 	memset(&fm_ext, 0, sizeof(fm_ext));
> +	memset(&fm_last, 0, sizeof(fm_last));

These could be declaration initializers.

> 	if (force_extent) {
> 		fm_ext.fe_flags = FIEMAP_EXTENT_MERGED;
> 	}
> @@ -322,40 +326,52 @@ static int filefrag_fibmap(int fd, int blk_shift, int *num_extents,
> 			return rc;
> 		if (block == 0)
> 			continue;
> -		if (*num_extents == 0) {
> -			(*num_extents)++;
> -			if (force_extent) {
> +
> +		if (*num_extents == 0 || block != last_block + 1 ||
> +		    fm_ext.fe_logical + fm_ext.fe_length != logical) {
> +			/*
> +			 * This is the start of a new extent; figure out where
> +			 * we expected it to be and report the extent.
> +			 */
> +			if (*num_extents != 0 && fm_last.fe_length) {
> +				expected = fm_last.fe_physical +
> +					(fm_ext.fe_logical - fm_last.fe_logical);
> +				if (expected == fm_ext.fe_physical)
> +					expected = 0;
> +			}
> +			if (force_extent && *num_extents == 0)
> 				print_extent_header();
> -				fm_ext.fe_physical = block * st->st_blksize;
> +			if (force_extent && *num_extents != 0) {
> +				print_extent_info(&fm_ext, *num_extents - 1,
> +						  expected, blk_shift, st);
> 			}
> -		}
> -		count++;
> -		if (force_extent && last_block != 0 &&
> -		    (block != last_block + 1 ||
> -		     fm_ext.fe_logical + fm_ext.fe_length != logical)) {
> -			print_extent_info(&fm_ext, *num_extents - 1,
> -					  (last_block + 1) * st->st_blksize,
> -					  blk_shift, st);
> -			fm_ext.fe_length = 0;
> +			if (verbose && expected != 0) {
> +				printf("Discontinuity: Block %llu is at %llu "
> +				       "(was %llu)\n",
> +					fm_ext.fe_logical / st->st_blksize,
> +					fm_ext.fe_physical / st->st_blksize,
> +					expected / st->st_blksize);
> +			}
> +			/* create the new extent */
> +			fm_last = fm_ext;
> 			(*num_extents)++;
> -			fm_ext.fe_logical = logical;
> 			fm_ext.fe_physical = block * st->st_blksize;
> -		} else if (last_block && (block != last_block + 1)) {
> -			if (verbose)
> -				printf("Discontinuity: Block %ld is at %lu (was "
> -				       "%lu)\n", i, block, last_block + 1);
> -			fm_ext.fe_length = 0;
> -			(*num_extents)++;
> 			fm_ext.fe_logical = logical;
> -			fm_ext.fe_physical = block * st->st_blksize;
> +			fm_ext.fe_length = 0;
> 		}
> 		fm_ext.fe_length += st->st_blksize;
> 		last_block = block;
> 	}
> -
> -	if (force_extent)
> -		print_extent_info(&fm_ext, *num_extents - 1,
> -				  last_block * st->st_blksize, blk_shift, st);
> +	if (force_extent && *num_extents != 0) {
> +		if (fm_last.fe_length) {
> +			expected = fm_last.fe_physical +
> +				   (fm_ext.fe_logical - fm_last.fe_logical);
> +			if (expected == fm_ext.fe_physical)
> +				expected = 0;
> +		}
> +		print_extent_info(&fm_ext, *num_extents - 1, expected,
> +				  blk_shift, st);
> +	}
> 
> 	return count;
> }
> --
> To unsubscribe from this list: send the line "unsubscribe linux-ext4" in
> the body of a message to majordomo@...r.kernel.org
> More majordomo info at  http://vger.kernel.org/majordomo-info.html


Cheers, Andreas






Download attachment "signature.asc" of type "application/pgp-signature" (834 bytes)

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ