lzx_compress: fix corruption with long literal run

author Eric Biggers <ebiggers3@gmail.com>
Sat, 14 Jan 2017 08:56:39 +0000 (00:56 -0800)
committer Eric Biggers <ebiggers3@gmail.com>
Sat, 14 Jan 2017 09:19:41 +0000 (01:19 -0800)
diff --git a/NEWS b/NEWS

index d519010a9e69ea2399455843eb0ae933f5a9a59d..46cd676c561dc3065330a159376fda58b90b3007 100644 (file)
--- a/NEWS
+++ b/NEWS
@@ -1,4 +1,13 @@
  Version 1.11.0-BETA5:
+       Fixed a data corruption bug (incorrect compression) when storing an
+       already highly-compressed file in an LZX-compressed WIM with a chunk
+       size greater than or equal to 64K.  Note that this is not the default
+       setting and such WIMs are not supported by Microsoft's WIM software, so
+       only users who used the --chunk-size option to wimlib-imagex or the
+       wimlib_set_output_chunk_size() API function may have been affected.
+       This bug was introduced in wimlib v1.10.0.  See
+       https://wimlib.net/forums/viewtopic.php?f=1&t=300 for more details.
+
         On all platforms, sparse files are now extracted as sparse.
  
         Sparse files captured from UNIX-style filesystems are now marked as
diff --git a/src/lzx_compress.c b/src/lzx_compress.c

index ca25d92f2ae9e35416765577e59e5726bbf201c5..b4930ee0df7c4ac16c2a371e086b264fe55b0427 100644 (file)
--- a/src/lzx_compress.c
+++ b/src/lzx_compress.c
@@ -266,11 +266,11 @@ struct lzx_sequence {
         /* The number of literals in the run.  This may be 0.  The literals are
          * not stored explicitly in this structure; instead, they are read
          * directly from the uncompressed data.  */
-       u16 litrunlen;
+       u32 litrunlen : 24;
  
         /* If the next field doesn't indicate end-of-block, then this is the
          * match length minus LZX_MIN_MATCH_LEN.  */
-       u16 adjusted_length;
+       u32 adjusted_length : 8;
  
         /* If bit 31 is clear, then this field contains the match header in bits
          * 0-8, and either the match offset plus LZX_OFFSET_ADJUSTMENT or a
author	Eric Biggers <ebiggers3@gmail.com>
	Sat, 14 Jan 2017 08:56:39 +0000 (00:56 -0800)
committer	Eric Biggers <ebiggers3@gmail.com>
	Sat, 14 Jan 2017 09:19:41 +0000 (01:19 -0800)
NEWS		patch | blob | history
src/lzx_compress.c		patch | blob | history