New compression/decompression API

author Eric Biggers <ebiggers3@gmail.com>

Wed, 25 Dec 2013 04:53:18 +0000 (22:53 -0600)

committer Eric Biggers <ebiggers3@gmail.com>

Wed, 25 Dec 2013 05:40:16 +0000 (23:40 -0600)
author Eric Biggers <ebiggers3@gmail.com>
Wed, 25 Dec 2013 04:53:18 +0000 (22:53 -0600)
committer Eric Biggers <ebiggers3@gmail.com>
Wed, 25 Dec 2013 05:40:16 +0000 (23:40 -0600)
diff --git a/Makefile.am b/Makefile.am

index 7b20b58a9bda9790b66bdc04c827e28f81207c43..4ebcf64b2f8eaa86d067afaff8c5f6c1632aa437 100644 (file)
--- a/Makefile.am
+++ b/Makefile.am
@@ -21,10 +21,11 @@ libwim_la_SOURCES =         \
         src/add_image.c         \
         src/capture_common.c    \
         src/compress.c          \
-       src/compress_chunk.c    \
+       src/compress_common.c   \
         src/compress_parallel.c \
         src/compress_serial.c   \
         src/decompress.c        \
+       src/decompress_common.c \
         src/delete_image.c      \
         src/dentry.c            \
         src/encoding.c          \
@@ -36,6 +37,7 @@ libwim_la_SOURCES =           \
         src/integrity.c         \
         src/join.c              \
         src/lookup_table.c      \
+       src/lzms-compress.c     \
         src/lzms-decompress.c   \
         src/lz77.c              \
         src/divsufsort/divsufsort.c             \
@@ -69,9 +71,11 @@ libwim_la_SOURCES =          \
         include/wimlib/callback.h       \
         include/wimlib/capture.h        \
         include/wimlib/compiler.h       \
-       include/wimlib/compress.h       \
-       include/wimlib/compress_chunks.h \
-       include/wimlib/decompress.h     \
+       include/wimlib/compressor_ops.h \
+       include/wimlib/compress_common.h        \
+       include/wimlib/chunk_compressor.h       \
+       include/wimlib/decompressor_ops.h       \
+       include/wimlib/decompress_common.h      \
         include/wimlib/dentry.h         \
         include/wimlib/encoding.h       \
         include/wimlib/endianness.h     \
diff --git a/include/wimlib.h b/include/wimlib.h

index afed2af1147b62ad37376af53cb150938e568ff8..e5efcdfa30cfa4c94cff5b4247bec7f819b05991 100644 (file)
--- a/include/wimlib.h
+++ b/include/wimlib.h
@@ -330,12 +330,6 @@
   * specialized function (wimlib_split()) is needed to create a split WIM.
   */
  
-/** @defgroup G_compression Compression and decompression functions
- *
- * @brief Functions for LZX and XPRESS compression and decompression, exported
- * for convenience only.  These functions normally do not need to be used.
- */
-
  #ifndef _WIMLIB_H
  #define _WIMLIB_H
  
@@ -1717,97 +1711,6 @@ struct wimlib_extract_command {
         int extract_flags;
  };
  
-/** @} */
-/** @ingroup G_compression
- * @{ */
-
-/** LZX compression parameters to pass to wimlib_lzx_alloc_context().  */
-struct wimlib_lzx_params {
-       /** Must be set to the size of this structure, in bytes.  */
-       uint32_t size_of_this;
-
-       /** Relatively fast LZX compression algorithm with a decent compression
-        * ratio; the suggested default.  */
-#define WIMLIB_LZX_ALGORITHM_FAST 0
-
-       /** Slower LZX compression algorithm that provides a better compression
-        * ratio.  */
-#define WIMLIB_LZX_ALGORITHM_SLOW 1
-
-       /** Algorithm to use to perform the compression: either
-        * ::WIMLIB_LZX_ALGORITHM_FAST or ::WIMLIB_LZX_ALGORITHM_SLOW.  The
-        * format is still LZX; this refers to the method the code will use to
-        * perform LZX-compatible compression.  */
-       uint32_t algorithm : 3;
-
-       /** If set to 1, the default parameters for the specified algorithm are
-        * used rather than the ones specified in the following union.  */
-       uint32_t use_defaults : 1;
-
-       union {
-               /** Parameters for the fast algorithm.  */
-               struct wimlib_lzx_fast_params {
-                       uint32_t fast_reserved1[10];
-               } fast;
-
-               /** Parameters for the slow algorithm.  */
-               struct wimlib_lzx_slow_params {
-                       /** If set to 1, the compressor can output length 2
-                        * matches.  If set 0, the compressor only outputs
-                        * matches of length 3 or greater.  Suggested value: 1
-                        */
-                       uint32_t use_len2_matches : 1;
-
-                       uint32_t slow_reserved1 : 31;
-
-                       /** Matches with length (in bytes) longer than this
-                        * value are immediately taken without spending time on
-                        * minimum-cost measurements.  Suggested value: 32.  */
-                       uint32_t num_fast_bytes;
-
-                       /** Number of passes to compute a match/literal sequence
-                        * for each LZX block.  This is for an iterative
-                        * algorithm that attempts to minimize the cost of the
-                        * match/literal sequence by using a cost model provided
-                        * by the previous iteration.  Must be at least 1.
-                        * Suggested value: 2.  */
-                       uint32_t num_optim_passes;
-
-                       /** Reserved; set to 0.  */
-                       uint32_t slow_reserved_blocksplit;
-
-                       /** Maximum depth to search for matches at each
-                        * position.  Suggested value: 50.  */
-                       uint32_t max_search_depth;
-
-                       /** Maximum number of potentially good matches to
-                        * consider for each position.  Suggested value: 3.  */
-                       uint32_t max_matches_per_pos;
-
-                       uint32_t slow_reserved2[2];
-
-                       /** Assumed cost of a main symbol with zero frequency.
-                        * Must be at least 1 and no more than 16.  Suggested
-                        * value: 15.  */
-                       uint8_t main_nostat_cost;
-
-                       /** Assumed cost of a length symbol with zero frequency.
-                        * Must be at least 1 and no more than 16.  Suggested
-                        * value: 15.  */
-                       uint8_t len_nostat_cost;
-
-                       /** Assumed cost of an aligned symbol with zero
-                        * frequency.  Must be at least 1 and no more than 8.
-                        * Suggested value: 7.  */
-                       uint8_t aligned_nostat_cost;
-
-                       uint8_t slow_reserved3[5];
-               } slow;
-       } alg_params;
-};
-
-/** Opaque LZX compression context.  */
-struct wimlib_lzx_context;
  
  /** @} */
  /** @ingroup G_general
@@ -2787,198 +2690,6 @@ wimlib_join(const wimlib_tchar * const *swms,
             int wim_write_flags,
             wimlib_progress_func_t progress_func);
  
-/**
- * @ingroup G_compression
- *
- * Decompresses a block of LZMS-compressed data.
- *
- * This function is exported for convenience only and should only be used by
- * library clients looking to make use of wimlib's compression code for another
- * purpose.
- *
- * This decompressor only implements "raw" decompression, which decompresses a
- * single LZMS-compressed block.  This behavior is the same as that of
- * Decompress() in the Windows 8 compression API when using a compression handle
- * created with CreateDecompressor() with the Algorithm parameter specified as
- * COMPRESS_ALGORITHM_LZMS | COMPRESS_RAW.  Presumably, non-raw LZMS data
- * is a container format from which the locations and sizes (both compressed and
- * uncompressed) of the constituent blocks can be determined.
- *
- * This function should not be called for blocks with compressed size equal to
- * uncompressed size, since such blocks are actually stored uncompressed.
- *
- * @param compressed_data
- *     Pointer to the compressed data.
- *
- * @param compressed_len
- *     Length of the compressed data, in bytes.
- *
- * @param uncompressed_data
- *     Pointer to the buffer into which to write the uncompressed data.
- *
- * @param uncompressed_len
- *     Length of the uncompressed data.
- *
- * @return
- *     0 on success; non-zero on failure.
- */
-extern int
-wimlib_lzms_decompress(const void *compressed_data, unsigned compressed_len,
-                      void *uncompressed_data, unsigned uncompressed_len);
-
-/**
- * @ingroup G_compression
- *
- * Compress a chunk of a WIM resource using LZX compression.
- *
- * This function is exported for convenience only and should only be used by
- * library clients looking to make use of wimlib's compression code for another
- * purpose.
- *
- * @param chunk
- *     Uncompressed data of the chunk.
- * @param chunk_size
- *     Size of the uncompressed chunk, in bytes.
- * @param out
- *     Pointer to output buffer of size at least (@p chunk_size - 1) bytes.
- *
- * @return
- *     The size of the compressed data written to @p out in bytes, or 0 if the
- *     data could not be compressed to (@p chunk_size - 1) bytes or fewer.
- *
- * As a special requirement, the compression code is optimized for the WIM
- * format and therefore requires (@p chunk_size <= 32768).
- */
-extern unsigned
-wimlib_lzx_compress(const void *chunk, unsigned chunk_size, void *out)
-                       _wimlib_deprecated;
-
-/**
- * @ingroup G_compression
- *
- * Equivalent to wimlib_lzx_compress(), but uses the specified compression
- * context, allocated by wimlib_lzx_alloc_context().
- */
-extern unsigned
-wimlib_lzx_compress2(const void *chunk, unsigned chunk_size, void *out,
-                    struct wimlib_lzx_context *ctx);
-
-/**
- * @ingroup G_compression
- *
- * Allocate a LZX compression context using the specified parameters.
- *
- * This function is exported for convenience only and should only be used by
- * library clients looking to make use of wimlib's compression code for another
- * purpose.
- *
- * @param window_size
- *     Size of the LZX window.  Must be a power of 2 between 2^15 and 2^21,
- *     inclusively.
- *
- * @param params
- *     Compression parameters to use, or @c NULL to use the default parameters.
- *
- * @param ctx_ret
- *     A pointer to either @c NULL or an existing ::wimlib_lzx_context.  If
- *     <code>*ctx_ret == NULL</code>, the new context is allocated.  If
- *     <code>*ctx_ret != NULL</code>, the existing context is re-used if
- *     possible.  Alternatively, this argument can itself be @c NULL to
- *     indicate that only parameter validation is to be performed.
- *
- * @return 0 on success; nonzero on error.
- *
- * @retval ::WIMLIB_ERR_INVALID_PARAM
- *     The window size or compression parameters were invalid.
- * @retval ::WIMLIB_ERR_NOMEM
- *     Not enough memory to allocate the compression context.
- */
-extern int
-wimlib_lzx_alloc_context(uint32_t window_size,
-                        const struct wimlib_lzx_params *params,
-                        struct wimlib_lzx_context **ctx_pp);
-
-/**
- * @ingroup G_compression
- *
- * Decompresses a block of LZX-compressed data as used in the WIM file format.
- *
- * Note that this will NOT work unmodified for LZX as used in the cabinet
- * format, which is not the same as in the WIM format!
- *
- * This function is exported for convenience only and should only be used by
- * library clients looking to make use of wimlib's compression code for another
- * purpose.
- *
- * @param compressed_data
- *     Pointer to the compressed data.
- *
- * @param compressed_len
- *     Length of the compressed data, in bytes.
- *
- * @param uncompressed_data
- *     Pointer to the buffer into which to write the uncompressed data.
- *
- * @param uncompressed_len
- *     Length of the uncompressed data.  It must be 32768 bytes or less.
- *
- * @return
- *     0 on success; non-zero on failure.
- */
-extern int
-wimlib_lzx_decompress(const void *compressed_data, unsigned compressed_len,
-                     void *uncompressed_data, unsigned uncompressed_len);
-
-/**
- * @ingroup G_compression
- *
- * Equivalent to wimlib_lzx_decompress(), except the window size is specified in
- * @p max_window_size as any power of 2 between 2^15 and 2^21, inclusively, and
- * @p uncompressed_len may be any size less than or equal to @p max_window_size.
- */
-extern int
-wimlib_lzx_decompress2(const void *compressed_data, unsigned compressed_len,
-                      void *uncompressed_data, unsigned uncompressed_len,
-                      uint32_t max_window_size);
-
-/**
- * @ingroup G_compression
- *
- * Free the specified LZX compression context, allocated with
- * wimlib_lzx_alloc_context().
- */
-extern void
-wimlib_lzx_free_context(struct wimlib_lzx_context *ctx);
-
-/**
- * @ingroup G_compression
- *
- * Set the global default LZX compression parameters.
- *
- * @param params
- *     The LZX compression parameters to set.  These default parameters will be
- *     used by any calls to wimlib_lzx_alloc_context() with @c NULL LZX
- *     parameters specified, as well as by any future compression performed by
- *     the library itself.  Passing @p NULL here resets the default LZX
- *     parameters to their original value.
- *
- * @return 0 on success; nonzero on error.
- *
- * @retval ::WIMLIB_ERR_INVALID_PARAM
- *     The compression parameters were invalid.
- */
-extern int
-wimlib_lzx_set_default_params(const struct wimlib_lzx_params *params);
-
-/**
- * @ingroup G_compression
- *
- * Free the specified LZX compression context, allocated with
- * wimlib_lzx_alloc_context().
- */
-extern void
-wimlib_lzx_free_context(struct wimlib_lzx_context *ctx);
-
  
  /**
   * @ingroup G_mounting_wim_images
@@ -4032,62 +3743,322 @@ wimlib_write_to_fd(WIMStruct *wim,
                    unsigned num_threads,
                    wimlib_progress_func_t progress_func);
  
+/**
+ * @defgroup G_compression Compression and decompression functions
+ *
+ * @brief Functions for LZX, XPRESS, and LZMS compression and decompression,
+ * exported for convenience only, as they are already used by wimlib internally
+ * when appropriate.
+ *
+ * These functions can be used for general-purpose lossless data compression,
+ * but some limitations apply; for example, none of the compressors or
+ * decompressors currently support sliding windows, and there also exist
+ * slightly different variants of these formats that are not supported
+ * unmodified.
+ *
+ * @{
+ */
+
+/** Header for compression parameters to pass to wimlib_create_compressor() or
+ * wimlib_set_default_compressor_params().  */
+struct wimlib_compressor_params_header {
+       /** Size of the parameters, in bytes.  */
+       uint32_t size;
+
+       uint32_t reserved;
+};
+
+/** Header for decompression parameters to pass to wimlib_create_decompressor()
+ * or wimlib_set_default_decompressor_params() */
+struct wimlib_decompressor_params_header {
+       /** Size of the parameters, in bytes.  */
+       uint32_t size;
+
+       uint32_t reserved;
+};
+
+/** LZX compression parameters that can optionally be passed to
+ * wimlib_create_compressor() with the compression type
+ * ::WIMLIB_COMPRESSION_TYPE_LZX.  */
+struct wimlib_lzx_compressor_params {
+       /** hdr.size Must be set to the size of this structure, in bytes.  */
+       struct wimlib_compressor_params_header hdr;
+
+       /** Relatively fast LZX compression algorithm with a decent compression
+        * ratio; the suggested default.  */
+#define WIMLIB_LZX_ALGORITHM_FAST 0
+
+       /** Slower LZX compression algorithm that provides a better compression
+        * ratio.  */
+#define WIMLIB_LZX_ALGORITHM_SLOW 1
+
+       /** Algorithm to use to perform the compression: either
+        * ::WIMLIB_LZX_ALGORITHM_FAST or ::WIMLIB_LZX_ALGORITHM_SLOW.  The
+        * format is still LZX; this refers to the method the code will use to
+        * perform LZX-compatible compression.  */
+       uint32_t algorithm : 3;
+
+       /** If set to 1, the default parameters for the specified algorithm are
+        * used rather than the ones specified in the following union.  */
+       uint32_t use_defaults : 1;
+
+       union {
+               /** Parameters for the fast algorithm.  */
+               struct wimlib_lzx_fast_params {
+                       uint32_t fast_reserved1[10];
+               } fast;
+
+               /** Parameters for the slow algorithm.  */
+               struct wimlib_lzx_slow_params {
+                       /** If set to 1, the compressor can output length 2
+                        * matches.  If set 0, the compressor only outputs
+                        * matches of length 3 or greater.  Suggested value: 1
+                        */
+                       uint32_t use_len2_matches : 1;
+
+                       uint32_t slow_reserved1 : 31;
+
+                       /** Matches with length (in bytes) longer than this
+                        * value are immediately taken without spending time on
+                        * minimum-cost measurements.  Suggested value: 32.  */
+                       uint32_t num_fast_bytes;
+
+                       /** Number of passes to compute a match/literal sequence
+                        * for each LZX block.  This is for an iterative
+                        * algorithm that attempts to minimize the cost of the
+                        * match/literal sequence by using a cost model provided
+                        * by the previous iteration.  Must be at least 1.
+                        * Suggested value: 2.  */
+                       uint32_t num_optim_passes;
+
+                       /** Reserved; set to 0.  */
+                       uint32_t slow_reserved_blocksplit;
+
+                       /** Maximum depth to search for matches at each
+                        * position.  Suggested value: 50.  */
+                       uint32_t max_search_depth;
+
+                       /** Maximum number of potentially good matches to
+                        * consider for each position.  Suggested value: 3.  */
+                       uint32_t max_matches_per_pos;
+
+                       uint32_t slow_reserved2[2];
+
+                       /** Assumed cost of a main symbol with zero frequency.
+                        * Must be at least 1 and no more than 16.  Suggested
+                        * value: 15.  */
+                       uint8_t main_nostat_cost;
+
+                       /** Assumed cost of a length symbol with zero frequency.
+                        * Must be at least 1 and no more than 16.  Suggested
+                        * value: 15.  */
+                       uint8_t len_nostat_cost;
+
+                       /** Assumed cost of an aligned symbol with zero
+                        * frequency.  Must be at least 1 and no more than 8.
+                        * Suggested value: 7.  */
+                       uint8_t aligned_nostat_cost;
+
+                       uint8_t slow_reserved3[5];
+               } slow;
+       } alg_params;
+};
+
+/** Opaque compressor handle.  */
+struct wimlib_compressor;
+
+/** Opaque decompressor handle.  */
+struct wimlib_decompressor;
+
+/**
+ * @ingroup G_compression
+ *
+ * Set the default compression parameters for the specified compression type.
+ * This will affect both explicit and wimlib-internal calls to
+ * wimlib_create_compressor().
+ *
+ * @param ctype
+ *     Compression type for which to set the default compression parameters.
+ * @param params
+ *     Compression-type specific parameters.  This may be @ NULL, in which case
+ *     the "default default" parameters are restored.
+ *
+ * @return 0 on success; nonzero on error.
+ *
+ * @retval ::WIMLIB_ERR_INVALID_COMPRESSION_TYPE
+ *     @p ctype was not a supported compression type.
+ */
+extern int
+wimlib_set_default_compressor_params(enum wimlib_compression_type ctype,
+                                    const struct wimlib_compressor_params_header *params);
+
  /**
   * @ingroup G_compression
   *
- * Compress a chunk of data using XPRESS compression.
+ * Allocate a compressor for the specified compression type using the specified
+ * parameters.
   *
- * This function is exported for convenience only and should only be used by
- * library clients looking to make use of wimlib's compression code for another
- * purpose.
+ * @param ctype
+ *     Compression type for which to create the compressor.
+ * @param max_block_size
+ *     Maximum block size to support.  The exact meaning and allowed values for
+ *     this parameter depend on the compression type, but it at least specifies
+ *     the maximum allowed value for @p uncompressed_size to wimlib_compress().
+ * @param extra_params
+ *     An optional pointer to extra compressor parameters for the specified
+ *     compression type.  For LZX, a pointer to ::wimlib_lzx_compressor_params
+ *     may be specified here.  If left @c NULL, the default parameters are
+ *     used.
+ * @param compressor_ret
+ *     A location into which to return the pointer to the allocated compressor,
+ *     which can be used for any number of calls to wimlib_compress() before
+ *     being freed with wimlib_free_compressor().
+ *
+ * @return 0 on success; nonzero on error.
+ *
+ * @retval ::WIMLIB_ERR_INVALID_COMPRESSION_TYPE
+ *     @p ctype was not a supported compression type.
+ * @retval ::WIMLIB_ERR_INVALID_PARAM
+ *     The compression parameters were invalid.
+ * @retval ::WIMLIB_ERR_NOMEM
+ *     Insufficient memory to allocate the compressor.
+ */
+extern int
+wimlib_create_compressor(enum wimlib_compression_type ctype,
+                        size_t max_block_size,
+                        const struct wimlib_compressor_params_header *extra_params,
+                        struct wimlib_compressor **compressor_ret);
+
+/**
+ * @ingroup G_compression
   *
- * As of wimlib v1.6.0, this function can be used with @p chunk_size greater
- * than 32768 bytes and is only limited by available memory.  However, the
- * XPRESS format itself still caps match offsets to 65535, so if a larger chunk
- * size is chosen, then the matching will effectively occur in a sliding window
- * over it.
+ * Losslessly compress a block of data using a compressor previously created
+ * with wimlib_create_compressor().
   *
- * @param chunk
- *     Uncompressed data of the chunk.
- * @param chunk_size
- *     Size of the uncompressed chunk, in bytes.
- * @param out
- *     Pointer to output buffer of size at least (@p chunk_size - 1) bytes.
+ * @param uncompressed_data
+ *     Buffer containing the data to compress.
+ * @param uncompressed_size
+ *     Size, in bytes, of the data to compress.
+ * @param compressed_data
+ *     Buffer into which to write the compressed data.
+ * @param compressed_size_avail
+ *     Number of bytes available in @compressed_data.
+ * @param compressor
+ *     A compressor previously allocated with wimlib_create_compressor().
   *
   * @return
- *     The size of the compressed data written to @p out in bytes, or 0 if the
- *     data could not be compressed to (@p chunk_size - 1) bytes or fewer.
+ *     The size of the compressed data, in bytes, or 0 if the input data could
+ *     not be compressed to @compressed_size_avail or fewer bytes.
   */
-extern unsigned
-wimlib_xpress_compress(const void *chunk, unsigned chunk_size, void *out);
+extern size_t
+wimlib_compress(const void *uncompressed_data, size_t uncompressed_size,
+               void *compressed_data, size_t compressed_size_avail,
+               struct wimlib_compressor *compressor);
  
  /**
   * @ingroup G_compression
   *
- * Decompresses a chunk of XPRESS-compressed data.
+ * Free a compressor previously allocated with wimlib_create_compressor().
   *
- * This function is exported for convenience only and should only be used by
- * library clients looking to make use of wimlib's compression code for another
- * purpose.
+ * @param compressor
+ *     The compressor to free.
+ */
+extern void
+wimlib_free_compressor(struct wimlib_compressor *compressor);
+
+/**
+ * @ingroup G_compression
   *
- * @param compressed_data
- *     Pointer to the compressed data.
+ * Set the default decompression parameters for the specified compression type.
+ * This will affect both explicit and wimlib-internal calls to
+ * wimlib_create_decompressor().
   *
- * @param compressed_len
- *     Length of the compressed data, in bytes.
+ * @param ctype
+ *     Compression type for which to set the default decompression parameters.
+ * @param params
+ *     Compression-type specific parameters.  This may be @ NULL, in which case
+ *     the "default default" parameters are restored.
   *
- * @param uncompressed_data
- *     Pointer to the buffer into which to write the uncompressed data.
+ * @return 0 on success; nonzero on error.
+ *
+ * @retval ::WIMLIB_ERR_INVALID_COMPRESSION_TYPE
+ *     @p ctype was not a supported compression type.
+ */
+extern int
+wimlib_set_default_decompressor_params(enum wimlib_compression_type ctype,
+                                      const struct wimlib_decompressor_params_header *params);
+
+/**
+ * @ingroup G_compression
   *
- * @param uncompressed_len
- *     Length of the uncompressed data.
+ * Allocate a decompressor for the specified compression type using the
+ * specified parameters.
   *
- * @return
- *     0 on success; non-zero on failure.
+ * @param ctype
+ *     Compression type for which to create the decompressor.
+ * @param max_block_size
+ *     Maximum block size to support.  The exact meaning and allowed values for
+ *     this parameter depend on the compression type, but it at least specifies
+ *     the maximum allowed value for @p uncompressed_size to
+ *     wimlib_decompress().
+ * @param extra_params
+ *     An optional pointer to extra decompressor parameters for the specified
+ *     compression type.  If @c NULL, the default parameters are used.
+ * @param decompressor_ret
+ *     A location into which to return the pointer to the allocated
+ *     decompressor, which can be used for any number of calls to
+ *     wimlib_decompress() before being freed with wimlib_free_decompressor().
+ *
+ * @return 0 on success; nonzero on error.
+ *
+ * @retval ::WIMLIB_ERR_INVALID_COMPRESSION_TYPE
+ *     @p ctype was not a supported compression type.
+ * @retval ::WIMLIB_ERR_INVALID_PARAM
+ *     The decompression parameters were invalid.
+ * @retval ::WIMLIB_ERR_NOMEM
+ *     Insufficient memory to allocate the decompressor.
   */
  extern int
-wimlib_xpress_decompress(const void *compressed_data, unsigned compressed_len,
-                        void *uncompressed_data, unsigned uncompressed_len);
+wimlib_create_decompressor(enum wimlib_compression_type ctype,
+                          size_t max_block_size,
+                          const struct wimlib_decompressor_params_header *extra_params,
+                          struct wimlib_decompressor **decompressor_ret);
+
+/**
+ * @ingroup G_compression
+ *
+ * Decompress a block of data using a decompressor previously created with
+ * wimlib_create_decompressor().
+ *
+ * @param compressed_data
+ *     Buffer containing the data to decompress.
+ * @param compressed_size
+ *     Size, in bytes, of the data to decompress.
+ * @param uncompressed_data
+ *     Buffer into which to write the uncompressed data.
+ * @param uncompressed_size
+ *     Size, in bytes, of the data when uncompressed.
+ * @param decompressor
+ *     A decompressor previously allocated with wimlib_create_decompressor().
+ *
+ * @return 0 on success; nonzero on error.
+ */
+extern int
+wimlib_decompress(const void *compressed_data, size_t compressed_size,
+                 void *uncompressed_data, size_t uncompressed_size,
+                 struct wimlib_decompressor *decompressor);
+
+/**
+ * @ingroup G_compression
+ *
+ * Free a decompressor previously allocated with wimlib_create_decompressor().
+ *
+ * @param decompressor
+ *     The decompressor to free.
+ */
+extern void
+wimlib_free_decompressor(struct wimlib_decompressor *decompressor);
+
  
  #ifdef __cplusplus
  }
diff --git a/include/wimlib/compress_chunks.h b/include/wimlib/chunk_compressor.h

similarity index 87%

rename from include/wimlib/compress_chunks.h

rename to include/wimlib/chunk_compressor.h

index cfd733360ecdc173c653eadca7e531735935bd93..176dc531710d8e82a5b10db7f6ae6af6e4c4689b 100644 (file)
--- a/include/wimlib/compress_chunks.h
+++ b/include/wimlib/chunk_compressor.h
@@ -1,16 +1,13 @@
-#ifndef _WIMLIB_COMPRESS_CHUNK_H
-#define _WIMLIB_COMPRESS_CHUNK_H
+/*
+ * chunk_compressor.h
+ *
+ * Interface for serial/parallel chunk compression.
+ */
  
-#include <wimlib/types.h>
-
-struct wimlib_lzx_context;
+#ifndef _WIMLIB_CHUNK_COMPRESSOR_H
+#define _WIMLIB_CHUNK_COMPRESSOR_H
  
-unsigned
-compress_chunk(const void * uncompressed_data,
-              unsigned uncompressed_len,
-              void *compressed_data,
-              int out_ctype,
-              struct wimlib_lzx_context *comp_ctx);
+#include <wimlib/types.h>
  
  /* Interface for chunk compression.  Users can submit chunks of data to be
   * compressed, then retrieve them later in order.  This interface can be
@@ -69,7 +66,6 @@ new_parallel_chunk_compressor(int out_ctype, u32 out_chunk_size,
  
  int
  new_serial_chunk_compressor(int out_ctype, u32 out_chunk_size,
-                           struct wimlib_lzx_context *comp_ctx,
                             struct chunk_compressor **compressor_ret);
  
-#endif
+#endif /* _WIMLIB_CHUNK_COMPRESSOR_H  */
diff --git a/include/wimlib/compress.h b/include/wimlib/compress_common.h

similarity index 96%

rename from include/wimlib/compress.h

rename to include/wimlib/compress_common.h

index fcd3c4119f16c9e37298a87760ddbd99b56186b3..14b32f488b488a0084e4a4ac31a72f4769932c5f 100644 (file)
--- a/include/wimlib/compress.h
+++ b/include/wimlib/compress_common.h
@@ -1,11 +1,11 @@
  /*
- * compress.h
+ * compress_common.h
   *
   * Header for compression code shared by multiple compression formats.
   */
  
-#ifndef _WIMLIB_COMPRESS_H
-#define _WIMLIB_COMPRESS_H
+#ifndef _WIMLIB_COMPRESS_COMMON_H
+#define _WIMLIB_COMPRESS_COMMON_H
  
  #include "wimlib/types.h"
  
diff --git a/include/wimlib/compressor_ops.h b/include/wimlib/compressor_ops.h

new file mode 100644 (file)

index 0000000..4c36bb3
--- /dev/null
+++ b/include/wimlib/compressor_ops.h
@@ -0,0 +1,34 @@
+/*
+ * compressor_ops.h
+ *
+ * Interface implemented by compressors for specific formats.
+ */
+
+#ifndef _WIMLIB_COMPRESSOR_OPS_H
+#define _WIMLIB_COMPRESSOR_OPS_H
+
+#include <stddef.h>
+
+struct compressor_ops {
+
+       int (*create_compressor)(size_t max_block_size,
+                                const struct wimlib_compressor_params_header *extra_params,
+                                void **private_ret);
+
+       size_t (*compress)(const void *uncompressed_data,
+                          size_t uncompressed_size,
+                          void *compressed_data,
+                          size_t compressed_size_avail,
+                          void *private);
+
+       void (*free_compressor)(void *private);
+};
+
+extern const struct compressor_ops lzx_compressor_ops;
+extern const struct compressor_ops xpress_compressor_ops;
+extern const struct compressor_ops lzms_compressor_ops;
+
+extern void
+cleanup_compressor_params(void);
+
+#endif /* _WIMLIB_COMPRESSOR_OPS_H */
diff --git a/include/wimlib/decompress.h b/include/wimlib/decompress_common.h

similarity index 98%

rename from include/wimlib/decompress.h

rename to include/wimlib/decompress_common.h

index ec8804e67f530ceab940349106c62070a8549381..4b5a7e3cdf89a34c407ab123ad7e603bf90d9acd 100644 (file)
--- a/include/wimlib/decompress.h
+++ b/include/wimlib/decompress_common.h
@@ -1,11 +1,11 @@
  /*
- * decompress.h
+ * decompress_common.h
   *
   * Header for decompression code shared by multiple compression formats.
   */
  
-#ifndef _WIMLIB_DECOMPRESS_H
-#define _WIMLIB_DECOMPRESS_H
+#ifndef _WIMLIB_DECOMPRESS_COMMON_H
+#define _WIMLIB_DECOMPRESS_COMMON_H
  
  #include "wimlib/assert.h"
  #include "wimlib/compiler.h"
diff --git a/include/wimlib/decompressor_ops.h b/include/wimlib/decompressor_ops.h

new file mode 100644 (file)

index 0000000..9e64285
--- /dev/null
+++ b/include/wimlib/decompressor_ops.h
@@ -0,0 +1,34 @@
+/*
+ * decompressor_ops.h
+ *
+ * Interface implemented by decompressors for specific formats.
+ */
+
+#ifndef _WIMLIB_DECOMPRESSOR_OPS_H
+#define _WIMLIB_DECOMPRESSOR_OPS_H
+
+#include <stddef.h>
+
+struct decompressor_ops {
+
+       int (*create_decompressor)(size_t max_block_size,
+                                  const struct wimlib_decompressor_params_header *extra_params,
+                                  void **private_ret);
+
+       int (*decompress)(const void *compressed_data,
+                         size_t compressed_size,
+                         void *uncompressed_data,
+                         size_t uncompressed_size,
+                         void *private);
+
+       void (*free_decompressor)(void *private);
+};
+
+extern const struct decompressor_ops lzx_decompressor_ops;
+extern const struct decompressor_ops xpress_decompressor_ops;
+extern const struct decompressor_ops lzms_decompressor_ops;
+
+extern void
+cleanup_decompressor_params(void);
+
+#endif /* _WIMLIB_DECOMPRESSOR_OPS_H */
diff --git a/include/wimlib/lookup_table.h b/include/wimlib/lookup_table.h

index f99f38d40a7b67e81610233d44ef45aa8120660d..c96373859dd17ced425683fcb603b432493d4453 100644 (file)
--- a/include/wimlib/lookup_table.h
+++ b/include/wimlib/lookup_table.h
@@ -303,8 +303,7 @@ write_wim_lookup_table_from_stream_list(struct list_head *stream_list,
                                         struct filedes *out_fd,
                                         u16 part_number,
                                         struct wim_reshdr *out_reshdr,
-                                       int write_resource_flags,
-                                       struct wimlib_lzx_context **comp_ctx);
+                                       int write_resource_flags);
  
  extern void
  free_lookup_table(struct wim_lookup_table *table);
diff --git a/include/wimlib/lzx.h b/include/wimlib/lzx.h

index 1332645f10274b3e22d17c184a25e9ec64f47c27..28408b328dc56695746aff83954c596618d4e923 100644 (file)
--- a/include/wimlib/lzx.h
+++ b/include/wimlib/lzx.h
@@ -134,7 +134,7 @@ lzx_get_position_slot_raw(unsigned formatted_offset)
         }
  }
  
-extern bool lzx_window_size_valid(u32 window_size);
+extern bool lzx_window_size_valid(size_t window_size);
  extern unsigned lzx_get_num_main_syms(u32 window_size);
  
  #define LZX_NUM_RECENT_OFFSETS 3
diff --git a/include/wimlib/wim.h b/include/wimlib/wim.h

index 83b1dbcb359e3587ccfc1ef0cbfde3133a5fff1e..99a37362eefd6420d0e7a0b15b2b0733edc7e750 100644 (file)
--- a/include/wimlib/wim.h
+++ b/include/wimlib/wim.h
@@ -42,8 +42,9 @@ struct WIMStruct {
         /* Temporary field */
         void *private;
  
-       /* LZX compression context for default thread  */
-       struct wimlib_lzx_context *lzx_context;
+       struct wimlib_decompressor *decompressor;
+       enum wimlib_compression_type decompressor_ctype;
+       u32 decompressor_max_block_size;
  
         struct list_head subwims;
  
diff --git a/include/wimlib/write.h b/include/wimlib/write.h

index 9857fc03d7bfdb13f009ab714a94335fc24b5c53..3665eea44fdc71be8004d07604dab26021699ef9 100644 (file)
--- a/include/wimlib/write.h
+++ b/include/wimlib/write.h
@@ -47,7 +47,6 @@ write_wim_resource_from_buffer(const void *buf, size_t buf_size,
                                u32 out_chunk_size,
                                struct wim_reshdr *out_reshdr,
                                u8 *hash,
-                              int write_resource_flags,
-                              struct wimlib_lzx_context **comp_ctx);
+                              int write_resource_flags);
  
  #endif /* _WIMLIB_WRITE_H */
diff --git a/programs/imagex.c b/programs/imagex.c

index b2164402749e57b8b6f94a6804ef7a1909fb33fd..33274616d6604700058f396c5d9f239aea898cec 100644 (file)
--- a/programs/imagex.c
+++ b/programs/imagex.c
@@ -434,8 +434,10 @@ static int
  set_compress_slow(void)
  {
         int ret;
-       static const struct wimlib_lzx_params slow_params = {
-               .size_of_this = sizeof(struct wimlib_lzx_params),
+       static const struct wimlib_lzx_compressor_params slow_params = {
+               .hdr = {
+                       .size = sizeof(struct wimlib_lzx_compressor_params),
+               },
                 .algorithm = WIMLIB_LZX_ALGORITHM_SLOW,
                 .alg_params = {
                         .slow = {
@@ -450,7 +452,8 @@ set_compress_slow(void)
                         },
                 },
         };
-       ret = wimlib_lzx_set_default_params(&slow_params);
+       ret = wimlib_set_default_compressor_params(WIMLIB_COMPRESSION_TYPE_LZX,
+                                                  &slow_params.hdr);
         if (ret)
                 imagex_error(T("Couldn't set slow compression parameters.!"));
         return ret;
@@ -1866,13 +1869,14 @@ imagex_capture_or_append(int argc, tchar **argv, int cmd)
  
         /* Set default compression type.  */
         if (compression_type == WIMLIB_COMPRESSION_TYPE_INVALID) {
-               struct wimlib_lzx_params params;
+               struct wimlib_lzx_compressor_params params;
                 memset(&params, 0, sizeof(params));
-               params.size_of_this = sizeof(params);
+               params.hdr.size = sizeof(params);
                 params.algorithm = WIMLIB_LZX_ALGORITHM_FAST;
                 params.use_defaults = 1;
  
-               wimlib_lzx_set_default_params(&params);
+               wimlib_set_default_compressor_params(WIMLIB_COMPRESSION_TYPE_LZX,
+                                                    &params.hdr);
                 compression_type = WIMLIB_COMPRESSION_TYPE_LZX;
         }
  
diff --git a/src/compress.c b/src/compress.c

index 79fe4ddf54e320aeeac7da13e8110a6ada23944c..32d5fb49fc28b0885ef261dfeece9bc3231d82f5 100644 (file)
--- a/src/compress.c
+++ b/src/compress.c
@@ -1,11 +1,12 @@
  /*
   * compress.c
   *
- * Functions used for compression.
+ * Generic functions for compression, wrapping around actual compression
+ * implementations.
   */
  
  /*
- * Copyright (C) 2012, 2013 Eric Biggers
+ * Copyright (C) 2013 Eric Biggers
   *
   * This file is part of wimlib, a library for working with WIM files.
   *
@@ -27,445 +28,120 @@
  #  include "config.h"
  #endif
  
-#include "wimlib/assert.h"
-#include "wimlib/endianness.h"
-#include "wimlib/compiler.h"
-#include "wimlib/compress.h"
+#include "wimlib.h"
+#include "wimlib/compressor_ops.h"
  #include "wimlib/util.h"
  
-#include <stdlib.h>
-#include <string.h>
-
-/* Writes @num_bits bits, given by the @num_bits least significant bits of
- * @bits, to the output @ostream. */
-void
-bitstream_put_bits(struct output_bitstream *ostream, u32 bits,
-                  unsigned num_bits)
+struct wimlib_compressor {
+       const struct compressor_ops *ops;
+       void *private;
+};
+
+static const struct compressor_ops *compressor_ops[] = {
+       [WIMLIB_COMPRESSION_TYPE_LZX]    = &lzx_compressor_ops,
+       [WIMLIB_COMPRESSION_TYPE_XPRESS] = &xpress_compressor_ops,
+       [WIMLIB_COMPRESSION_TYPE_LZMS]   = &lzms_compressor_ops,
+};
+
+static struct wimlib_compressor_params_header *
+compressor_default_params[ARRAY_LEN(compressor_ops)] = {
+       [WIMLIB_COMPRESSION_TYPE_LZX]    = NULL,
+       [WIMLIB_COMPRESSION_TYPE_XPRESS] = NULL,
+       [WIMLIB_COMPRESSION_TYPE_LZMS]   = NULL,
+};
+
+static bool
+compressor_ctype_valid(int ctype)
  {
-       bits &= (1U << num_bits) - 1;
-       while (num_bits > ostream->free_bits) {
-               /* Buffer variable does not have space for the new bits.  It
-                * needs to be flushed as a 16-bit integer.  Bits in the second
-                * byte logically precede those in the first byte
-                * (little-endian), but within each byte the bits are ordered
-                * from high to low.  This is true for both XPRESS and LZX
-                * compression.  */
-
-               /* There must be at least 2 bytes of space remaining.  */
-               if (unlikely(ostream->bytes_remaining < 2)) {
-                       ostream->overrun = true;
-                       return;
-               }
-
-               /* Fill the buffer with as many bits that fit.  */
-               unsigned fill_bits = ostream->free_bits;
-
-               ostream->bitbuf <<= fill_bits;
-               ostream->bitbuf |= bits >> (num_bits - fill_bits);
-
-               *(le16*)ostream->bit_output = cpu_to_le16(ostream->bitbuf);
-               ostream->bit_output = ostream->next_bit_output;
-               ostream->next_bit_output = ostream->output;
-               ostream->output += 2;
-               ostream->bytes_remaining -= 2;
-
-               ostream->free_bits = 16;
-               num_bits -= fill_bits;
-               bits &= (1U << num_bits) - 1;
-       }
-
-       /* Buffer variable has space for the new bits.  */
-       ostream->bitbuf = (ostream->bitbuf << num_bits) | bits;
-       ostream->free_bits -= num_bits;
+       return (ctype >= 0 &&
+               ctype < ARRAY_LEN(compressor_ops) &&
+               compressor_ops[ctype] != NULL);
  }
  
-void
-bitstream_put_byte(struct output_bitstream *ostream, u8 n)
+WIMLIBAPI int
+wimlib_set_default_compressor_params(enum wimlib_compression_type ctype,
+                                    const struct wimlib_compressor_params_header *params)
  {
-       if (unlikely(ostream->bytes_remaining < 1)) {
-               ostream->overrun = true;
-               return;
-       }
-       *ostream->output++ = n;
-       ostream->bytes_remaining--;
-}
+       struct wimlib_compressor_params_header *dup;
  
-/* Flushes any remaining bits to the output bitstream.
- *
- * Returns -1 if the stream has overrun; otherwise returns the total number of
- * bytes in the output.  */
-input_idx_t
-flush_output_bitstream(struct output_bitstream *ostream)
-{
-       if (unlikely(ostream->overrun))
-               return ~(input_idx_t)0;
+       if (!compressor_ctype_valid(ctype))
+               return WIMLIB_ERR_INVALID_COMPRESSION_TYPE;
  
-       *(le16*)ostream->bit_output =
-               cpu_to_le16((u16)((u32)ostream->bitbuf << ostream->free_bits));
-       *(le16*)ostream->next_bit_output =
-               cpu_to_le16(0);
+       dup = NULL;
+       if (params) {
+               dup = memdup(params, params->size);
+               if (dup == NULL)
+                       return WIMLIB_ERR_NOMEM;
+       }
  
-       return ostream->output - ostream->output_start;
+       FREE(compressor_default_params[ctype]);
+       compressor_default_params[ctype] = dup;
+       return 0;
  }
  
-/* Initializes an output bit buffer to write its output to the memory location
- * pointer to by @data. */
  void
-init_output_bitstream(struct output_bitstream *ostream,
-                     void *data, unsigned num_bytes)
-{
-       wimlib_assert(num_bytes >= 4);
-
-       ostream->bitbuf              = 0;
-       ostream->free_bits           = 16;
-       ostream->output_start        = data;
-       ostream->bit_output          = data;
-       ostream->next_bit_output     = data + 2;
-       ostream->output              = data + 4;
-       ostream->bytes_remaining     = num_bytes - 4;
-       ostream->overrun             = false;
-}
-
-typedef struct {
-       input_idx_t freq;
-       u16 sym;
-       union {
-               u16 path_len;
-               u16 height;
-       };
-} HuffmanNode;
-
-typedef struct HuffmanIntermediateNode {
-       HuffmanNode node_base;
-       HuffmanNode *left_child;
-       HuffmanNode *right_child;
-} HuffmanIntermediateNode;
-
-
-/* Comparator function for HuffmanNodes.  Sorts primarily by symbol
- * frequency and secondarily by symbol value. */
-static int
-cmp_nodes_by_freq(const void *_leaf1, const void *_leaf2)
+cleanup_compressor_params(void)
  {
-       const HuffmanNode *leaf1 = _leaf1;
-       const HuffmanNode *leaf2 = _leaf2;
-
-       if (leaf1->freq > leaf2->freq)
-               return 1;
-       else if (leaf1->freq < leaf2->freq)
-               return -1;
-       else
-               return (int)leaf1->sym - (int)leaf2->sym;
+       for (size_t i = 0; i < ARRAY_LEN(compressor_default_params); i++) {
+               FREE(compressor_default_params[i]);
+               compressor_default_params[i] = NULL;
+       }
  }
  
-/* Comparator function for HuffmanNodes.  Sorts primarily by code length and
- * secondarily by symbol value. */
-static int
-cmp_nodes_by_code_len(const void *_leaf1, const void *_leaf2)
+WIMLIBAPI int
+wimlib_create_compressor(enum wimlib_compression_type ctype,
+                        size_t max_block_size,
+                        const struct wimlib_compressor_params_header *extra_params,
+                        struct wimlib_compressor **c_ret)
  {
-       const HuffmanNode *leaf1 = _leaf1;
-       const HuffmanNode *leaf2 = _leaf2;
-
-       int code_len_diff = (int)leaf1->path_len - (int)leaf2->path_len;
-
-       if (code_len_diff == 0)
-               return (int)leaf1->sym - (int)leaf2->sym;
-       else
-               return code_len_diff;
+       struct wimlib_compressor *c;
+
+       if (c_ret == NULL)
+               return WIMLIB_ERR_INVALID_PARAM;
+
+       if (!compressor_ctype_valid(ctype))
+               return WIMLIB_ERR_INVALID_COMPRESSION_TYPE;
+
+       c = MALLOC(sizeof(*c));
+       if (c == NULL)
+               return WIMLIB_ERR_NOMEM;
+       c->ops = compressor_ops[ctype];
+       c->private = NULL;
+       if (c->ops->create_compressor) {
+               const struct wimlib_compressor_params_header *params;
+               int ret;
+
+               if (extra_params)
+                       params = extra_params;
+               else
+                       params = compressor_default_params[ctype];
+               ret = c->ops->create_compressor(max_block_size,
+                                               params, &c->private);
+               if (ret) {
+                       FREE(c);
+                       return ret;
+               }
+       }
+       *c_ret = c;
+       return 0;
  }
  
-#define INVALID_SYMBOL 0xffff
-
-/* Recursive function to calculate the depth of the leaves in a Huffman tree.
- * */
-static void
-huffman_tree_compute_path_lengths(HuffmanNode *base_node, u16 cur_len)
+WIMLIBAPI size_t
+wimlib_compress(const void *uncompressed_data, size_t uncompressed_size,
+               void *compressed_data, size_t compressed_size_avail,
+               struct wimlib_compressor *c)
  {
-       if (base_node->sym == INVALID_SYMBOL) {
-               /* Intermediate node. */
-               HuffmanIntermediateNode *node = (HuffmanIntermediateNode*)base_node;
-               huffman_tree_compute_path_lengths(node->left_child, cur_len + 1);
-               huffman_tree_compute_path_lengths(node->right_child, cur_len + 1);
-       } else {
-               /* Leaf node. */
-               base_node->path_len = cur_len;
-       }
+       return c->ops->compress(uncompressed_data, uncompressed_size,
+                               compressed_data, compressed_size_avail,
+                               c->private);
  }
  
-/* make_canonical_huffman_code: - Creates a canonical Huffman code from an array
- *                               of symbol frequencies.
- *
- * The algorithm used is similar to the well-known algorithm that builds a
- * Huffman tree using a minheap.  In that algorithm, the leaf nodes are
- * initialized and inserted into the minheap with the frequency as the key.
- * Repeatedly, the top two nodes (nodes with the lowest frequency) are taken out
- * of the heap and made the children of a new node that has a frequency equal to
- * the sum of the two frequencies of its children.  This new node is inserted
- * into the heap.  When all the nodes have been removed from the heap, what
- * remains is the Huffman tree. The Huffman code for a symbol is given by the
- * path to it in the tree, where each left pointer is mapped to a 0 bit and each
- * right pointer is mapped to a 1 bit.
- *
- * The algorithm used here uses an optimization that removes the need to
- * actually use a heap.  The leaf nodes are first sorted by frequency, as
- * opposed to being made into a heap.  Note that this sorting step takes O(n log
- * n) time vs.  O(n) time for heapifying the array, where n is the number of
- * symbols.  However, the heapless method is probably faster overall, due to the
- * time saved later.  In the heapless method, whenever an intermediate node is
- * created, it is not inserted into the sorted array.  Instead, the intermediate
- * nodes are kept in a separate array, which is easily kept sorted because every
- * time an intermediate node is initialized, it will have a frequency at least
- * as high as that of the previous intermediate node that was initialized.  So
- * whenever we want the 2 nodes, leaf or intermediate, that have the lowest
- * frequency, we check the low-frequency ends of both arrays, which is an O(1)
- * operation.
- *
- * The function builds a canonical Huffman code, not just any Huffman code.  A
- * Huffman code is canonical if the codeword for each symbol numerically
- * precedes the codeword for all other symbols of the same length that are
- * numbered higher than the symbol, and additionally, all shorter codewords,
- * 0-extended, numerically precede longer codewords.  A canonical Huffman code
- * is useful because it can be reconstructed by only knowing the path lengths in
- * the tree.  See the make_huffman_decode_table() function to see how to
- * reconstruct a canonical Huffman code from only the lengths of the codes.
- *
- * @num_syms:  The number of symbols in the alphabet.
- *
- * @max_codeword_len:  The maximum allowed length of a codeword in the code.
- *                     Note that if the code being created runs up against
- *                     this restriction, the code ultimately created will be
- *                     suboptimal, although there are some advantages for
- *                     limiting the length of the codewords.
- *
- * @freq_tab:  An array of length @num_syms that contains the frequencies
- *                     of each symbol in the uncompressed data.
- *
- * @lens:         An array of length @num_syms into which the lengths of the
- *                     codewords for each symbol will be written.
- *
- * @codewords:    An array of @num_syms short integers into which the
- *                     codewords for each symbol will be written.  The first
- *                     lens[i] bits of codewords[i] will contain the codeword
- *                     for symbol i.
- */
-void
-make_canonical_huffman_code(unsigned num_syms,
-                           unsigned max_codeword_len,
-                           const input_idx_t freq_tab[restrict],
-                           u8 lens[restrict],
-                           u16 codewords[restrict])
+WIMLIBAPI void
+wimlib_free_compressor(struct wimlib_compressor *c)
  {
-       /* We require at least 2 possible symbols in the alphabet to produce a
-        * valid Huffman decoding table. It is allowed that fewer than 2 symbols
-        * are actually used, though. */
-       wimlib_assert(num_syms >= 2 && num_syms < INVALID_SYMBOL);
-
-       /* Initialize the lengths and codewords to 0 */
-       memset(lens, 0, num_syms * sizeof(lens[0]));
-       memset(codewords, 0, num_syms * sizeof(codewords[0]));
-
-       /* Calculate how many symbols have non-zero frequency.  These are the
-        * symbols that actually appeared in the input. */
-       unsigned num_used_symbols = 0;
-       for (unsigned i = 0; i < num_syms; i++)
-               if (freq_tab[i] != 0)
-                       num_used_symbols++;
-
-
-       /* It is impossible to make a code for num_used_symbols symbols if there
-        * aren't enough code bits to uniquely represent all of them. */
-       wimlib_assert((1 << max_codeword_len) > num_used_symbols);
-
-       /* Initialize the array of leaf nodes with the symbols and their
-        * frequencies. */
-       HuffmanNode leaves[num_used_symbols];
-       unsigned leaf_idx = 0;
-       for (unsigned i = 0; i < num_syms; i++) {
-               if (freq_tab[i] != 0) {
-                       leaves[leaf_idx].freq = freq_tab[i];
-                       leaves[leaf_idx].sym  = i;
-                       leaves[leaf_idx].height = 0;
-                       leaf_idx++;
-               }
-       }
-
-       /* Deal with the special cases where num_used_symbols < 2. */
-       if (num_used_symbols < 2) {
-               if (num_used_symbols == 0) {
-                       /* If num_used_symbols is 0, there are no symbols in the
-                        * input, so it must be empty.  This should be an error,
-                        * but the LZX format expects this case to succeed.  All
-                        * the codeword lengths are simply marked as 0 (which
-                        * was already done.) */
-               } else {
-                       /* If only one symbol is present, the LZX format
-                        * requires that the Huffman code include two codewords.
-                        * One is not used.  Note that this doesn't make the
-                        * encoded data take up more room anyway, since binary
-                        * data itself has 2 symbols. */
-
-                       unsigned sym = leaves[0].sym;
-
-                       codewords[0] = 0;
-                       lens[0]      = 1;
-                       if (sym == 0) {
-                               /* dummy symbol is 1, real symbol is 0 */
-                               codewords[1] = 1;
-                               lens[1]      = 1;
-                       } else {
-                               /* dummy symbol is 0, real symbol is sym */
-                               codewords[sym] = 1;
-                               lens[sym]      = 1;
-                       }
-               }
-               return;
-       }
-
-       /* Otherwise, there are at least 2 symbols in the input, so we need to
-        * find a real Huffman code. */
-
-
-       /* Declare the array of intermediate nodes.  An intermediate node is not
-        * associated with a symbol. Instead, it represents some binary code
-        * prefix that is shared between at least 2 codewords.  There can be at
-        * most num_used_symbols - 1 intermediate nodes when creating a Huffman
-        * code.  This is because if there were at least num_used_symbols nodes,
-        * the code would be suboptimal because there would be at least one
-        * unnecessary intermediate node.
-        *
-        * The worst case (greatest number of intermediate nodes) would be if
-        * all the intermediate nodes were chained together.  This results in
-        * num_used_symbols - 1 intermediate nodes.  If num_used_symbols is at
-        * least 17, this configuration would not be allowed because the LZX
-        * format constrains codes to 16 bits or less each.  However, it is
-        * still possible for there to be more than 16 intermediate nodes, as
-        * long as no leaf has a depth of more than 16.  */
-       HuffmanIntermediateNode inodes[num_used_symbols - 1];
-
-
-       /* Pointer to the leaf node of lowest frequency that hasn't already been
-        * added as the child of some intermediate note. */
-       HuffmanNode *cur_leaf;
-
-       /* Pointer past the end of the array of leaves. */
-       HuffmanNode *end_leaf = &leaves[num_used_symbols];
-
-       /* Pointer to the intermediate node of lowest frequency. */
-       HuffmanIntermediateNode     *cur_inode;
-
-       /* Pointer to the next unallocated intermediate node. */
-       HuffmanIntermediateNode     *next_inode;
-
-       /* Only jump back to here if the maximum length of the codewords allowed
-        * by the LZX format (16 bits) is exceeded. */
-try_building_tree_again:
-
-       /* Sort the leaves from those that correspond to the least frequent
-        * symbol, to those that correspond to the most frequent symbol.  If two
-        * leaves have the same frequency, they are sorted by symbol. */
-       qsort(leaves, num_used_symbols, sizeof(leaves[0]), cmp_nodes_by_freq);
-
-       cur_leaf   = &leaves[0];
-       cur_inode  = &inodes[0];
-       next_inode = &inodes[0];
-
-       /* The following loop takes the two lowest frequency nodes of those
-        * remaining and makes them the children of the next available
-        * intermediate node.  It continues until all the leaf nodes and
-        * intermediate nodes have been used up, or the maximum allowed length
-        * for the codewords is exceeded.  For the latter case, we must adjust
-        * the frequencies to be more equal and then execute this loop again. */
-       while (1) {
-
-               /* Lowest frequency node. */
-               HuffmanNode *f1;
-
-               /* Second lowest frequency node. */
-               HuffmanNode *f2;
-
-               /* Get the lowest and second lowest frequency nodes from the
-                * remaining leaves or from the intermediate nodes. */
-
-               if (cur_leaf != end_leaf && (cur_inode == next_inode ||
-                                       cur_leaf->freq <= cur_inode->node_base.freq)) {
-                       f1 = cur_leaf++;
-               } else if (cur_inode != next_inode) {
-                       f1 = (HuffmanNode*)cur_inode++;
-               }
-
-               if (cur_leaf != end_leaf && (cur_inode == next_inode ||
-                                       cur_leaf->freq <= cur_inode->node_base.freq)) {
-                       f2 = cur_leaf++;
-               } else if (cur_inode != next_inode) {
-                       f2 = (HuffmanNode*)cur_inode++;
-               } else {
-                       /* All nodes used up! */
-                       break;
-               }
-
-               /* next_inode becomes the parent of f1 and f2. */
-
-               next_inode->node_base.freq = f1->freq + f2->freq;
-               next_inode->node_base.sym  = INVALID_SYMBOL;
-               next_inode->left_child     = f1;
-               next_inode->right_child    = f2;
-
-               /* We need to keep track of the height so that we can detect if
-                * the length of a codeword has execeed max_codeword_len.   The
-                * parent node has a height one higher than the maximum height
-                * of its children. */
-               next_inode->node_base.height = max(f1->height, f2->height) + 1;
-
-               /* Check to see if the code length of the leaf farthest away
-                * from next_inode has exceeded the maximum code length. */
-               if (next_inode->node_base.height > max_codeword_len) {
-                       /* The code lengths can be made more uniform by making
-                        * the frequencies more uniform.  Divide all the
-                        * frequencies by 2, leaving 1 as the minimum frequency.
-                        * If this keeps happening, the symbol frequencies will
-                        * approach equality, which makes their Huffman
-                        * codewords approach the length
-                        * log_2(num_used_symbols).
-                        * */
-                       for (unsigned i = 0; i < num_used_symbols; i++)
-                               leaves[i].freq = (leaves[i].freq + 1) >> 1;
-
-                       goto try_building_tree_again;
-               }
-               next_inode++;
-       }
-
-       /* The Huffman tree is now complete, and its height is no more than
-        * max_codeword_len.  */
-
-       HuffmanIntermediateNode *root = next_inode - 1;
-       wimlib_assert(root->node_base.height <= max_codeword_len);
-
-       /* Compute the path lengths for the leaf nodes. */
-       huffman_tree_compute_path_lengths(&root->node_base, 0);
-
-       /* Sort the leaf nodes primarily by code length and secondarily by
-        * symbol.  */
-       qsort(leaves, num_used_symbols, sizeof(leaves[0]), cmp_nodes_by_code_len);
-
-       u16 cur_codeword = 0;
-       unsigned cur_codeword_len = 0;
-       for (unsigned i = 0; i < num_used_symbols; i++) {
-
-               /* Each time a codeword becomes one longer, the current codeword
-                * is left shifted by one place.  This is part of the procedure
-                * for enumerating the canonical Huffman code.  Additionally,
-                * whenever a codeword is used, 1 is added to the current
-                * codeword.  */
-
-               unsigned len_diff = leaves[i].path_len - cur_codeword_len;
-               cur_codeword <<= len_diff;
-               cur_codeword_len += len_diff;
-
-               u16 sym = leaves[i].sym;
-               codewords[sym] = cur_codeword;
-               lens[sym] = cur_codeword_len;
-
-               cur_codeword++;
+       if (c) {
+               if (c->ops->free_compressor)
+                       c->ops->free_compressor(c->private);
+               FREE(c);
         }
  }
diff --git a/src/compress_chunk.c b/src/compress_chunk.c

deleted file mode 100644 (file)

index bd92cd6..0000000
--- a/src/compress_chunk.c
+++ /dev/null
@@ -1,35 +0,0 @@
-#ifdef HAVE_CONFIG_H
-#  include "config.h"
-#endif
-
-#include "wimlib.h"
-#include "wimlib/compress_chunks.h"
-#include "wimlib/error.h"
-#include "wimlib/assert.h"
-
-unsigned
-compress_chunk(const void * uncompressed_data,
-              unsigned uncompressed_len,
-              void *compressed_data,
-              int out_ctype,
-              struct wimlib_lzx_context *comp_ctx)
-{
-       switch (out_ctype) {
-       case WIMLIB_COMPRESSION_TYPE_XPRESS:
-               return wimlib_xpress_compress(uncompressed_data,
-                                             uncompressed_len,
-                                             compressed_data);
-       case WIMLIB_COMPRESSION_TYPE_LZX:
-               return wimlib_lzx_compress2(uncompressed_data,
-                                           uncompressed_len,
-                                           compressed_data,
-                                           comp_ctx);
-       case WIMLIB_COMPRESSION_TYPE_LZMS:
-               return 0;
-
-       default:
-               wimlib_assert(0);
-               WARNING("Unknown compression type!");
-               return 0;
-       }
-}
diff --git a/src/compress_common.c b/src/compress_common.c

new file mode 100644 (file)

index 0000000..9659d07
--- /dev/null
+++ b/src/compress_common.c
@@ -0,0 +1,471 @@
+/*
+ * compress_common.c
+ *
+ * Code for compression shared among multiple compression formats.
+ */
+
+/*
+ * Copyright (C) 2012, 2013 Eric Biggers
+ *
+ * This file is part of wimlib, a library for working with WIM files.
+ *
+ * wimlib is free software; you can redistribute it and/or modify it under the
+ * terms of the GNU General Public License as published by the Free
+ * Software Foundation; either version 3 of the License, or (at your option)
+ * any later version.
+ *
+ * wimlib is distributed in the hope that it will be useful, but WITHOUT ANY
+ * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
+ * A PARTICULAR PURPOSE. See the GNU General Public License for more
+ * details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with wimlib; if not, see http://www.gnu.org/licenses/.
+ */
+
+#ifdef HAVE_CONFIG_H
+#  include "config.h"
+#endif
+
+#include "wimlib/assert.h"
+#include "wimlib/endianness.h"
+#include "wimlib/compiler.h"
+#include "wimlib/compress_common.h"
+#include "wimlib/util.h"
+
+#include <stdlib.h>
+#include <string.h>
+
+/* Writes @num_bits bits, given by the @num_bits least significant bits of
+ * @bits, to the output @ostream. */
+void
+bitstream_put_bits(struct output_bitstream *ostream, u32 bits,
+                  unsigned num_bits)
+{
+       bits &= (1U << num_bits) - 1;
+       while (num_bits > ostream->free_bits) {
+               /* Buffer variable does not have space for the new bits.  It
+                * needs to be flushed as a 16-bit integer.  Bits in the second
+                * byte logically precede those in the first byte
+                * (little-endian), but within each byte the bits are ordered
+                * from high to low.  This is true for both XPRESS and LZX
+                * compression.  */
+
+               /* There must be at least 2 bytes of space remaining.  */
+               if (unlikely(ostream->bytes_remaining < 2)) {
+                       ostream->overrun = true;
+                       return;
+               }
+
+               /* Fill the buffer with as many bits that fit.  */
+               unsigned fill_bits = ostream->free_bits;
+
+               ostream->bitbuf <<= fill_bits;
+               ostream->bitbuf |= bits >> (num_bits - fill_bits);
+
+               *(le16*)ostream->bit_output = cpu_to_le16(ostream->bitbuf);
+               ostream->bit_output = ostream->next_bit_output;
+               ostream->next_bit_output = ostream->output;
+               ostream->output += 2;
+               ostream->bytes_remaining -= 2;
+
+               ostream->free_bits = 16;
+               num_bits -= fill_bits;
+               bits &= (1U << num_bits) - 1;
+       }
+
+       /* Buffer variable has space for the new bits.  */
+       ostream->bitbuf = (ostream->bitbuf << num_bits) | bits;
+       ostream->free_bits -= num_bits;
+}
+
+void
+bitstream_put_byte(struct output_bitstream *ostream, u8 n)
+{
+       if (unlikely(ostream->bytes_remaining < 1)) {
+               ostream->overrun = true;
+               return;
+       }
+       *ostream->output++ = n;
+       ostream->bytes_remaining--;
+}
+
+/* Flushes any remaining bits to the output bitstream.
+ *
+ * Returns -1 if the stream has overrun; otherwise returns the total number of
+ * bytes in the output.  */
+input_idx_t
+flush_output_bitstream(struct output_bitstream *ostream)
+{
+       if (unlikely(ostream->overrun))
+               return ~(input_idx_t)0;
+
+       *(le16*)ostream->bit_output =
+               cpu_to_le16((u16)((u32)ostream->bitbuf << ostream->free_bits));
+       *(le16*)ostream->next_bit_output =
+               cpu_to_le16(0);
+
+       return ostream->output - ostream->output_start;
+}
+
+/* Initializes an output bit buffer to write its output to the memory location
+ * pointer to by @data. */
+void
+init_output_bitstream(struct output_bitstream *ostream,
+                     void *data, unsigned num_bytes)
+{
+       wimlib_assert(num_bytes >= 4);
+
+       ostream->bitbuf              = 0;
+       ostream->free_bits           = 16;
+       ostream->output_start        = data;
+       ostream->bit_output          = data;
+       ostream->next_bit_output     = data + 2;
+       ostream->output              = data + 4;
+       ostream->bytes_remaining     = num_bytes - 4;
+       ostream->overrun             = false;
+}
+
+typedef struct {
+       input_idx_t freq;
+       u16 sym;
+       union {
+               u16 path_len;
+               u16 height;
+       };
+} HuffmanNode;
+
+typedef struct HuffmanIntermediateNode {
+       HuffmanNode node_base;
+       HuffmanNode *left_child;
+       HuffmanNode *right_child;
+} HuffmanIntermediateNode;
+
+
+/* Comparator function for HuffmanNodes.  Sorts primarily by symbol
+ * frequency and secondarily by symbol value. */
+static int
+cmp_nodes_by_freq(const void *_leaf1, const void *_leaf2)
+{
+       const HuffmanNode *leaf1 = _leaf1;
+       const HuffmanNode *leaf2 = _leaf2;
+
+       if (leaf1->freq > leaf2->freq)
+               return 1;
+       else if (leaf1->freq < leaf2->freq)
+               return -1;
+       else
+               return (int)leaf1->sym - (int)leaf2->sym;
+}
+
+/* Comparator function for HuffmanNodes.  Sorts primarily by code length and
+ * secondarily by symbol value. */
+static int
+cmp_nodes_by_code_len(const void *_leaf1, const void *_leaf2)
+{
+       const HuffmanNode *leaf1 = _leaf1;
+       const HuffmanNode *leaf2 = _leaf2;
+
+       int code_len_diff = (int)leaf1->path_len - (int)leaf2->path_len;
+
+       if (code_len_diff == 0)
+               return (int)leaf1->sym - (int)leaf2->sym;
+       else
+               return code_len_diff;
+}
+
+#define INVALID_SYMBOL 0xffff
+
+/* Recursive function to calculate the depth of the leaves in a Huffman tree.
+ * */
+static void
+huffman_tree_compute_path_lengths(HuffmanNode *base_node, u16 cur_len)
+{
+       if (base_node->sym == INVALID_SYMBOL) {
+               /* Intermediate node. */
+               HuffmanIntermediateNode *node = (HuffmanIntermediateNode*)base_node;
+               huffman_tree_compute_path_lengths(node->left_child, cur_len + 1);
+               huffman_tree_compute_path_lengths(node->right_child, cur_len + 1);
+       } else {
+               /* Leaf node. */
+               base_node->path_len = cur_len;
+       }
+}
+
+/* make_canonical_huffman_code: - Creates a canonical Huffman code from an array
+ *                               of symbol frequencies.
+ *
+ * The algorithm used is similar to the well-known algorithm that builds a
+ * Huffman tree using a minheap.  In that algorithm, the leaf nodes are
+ * initialized and inserted into the minheap with the frequency as the key.
+ * Repeatedly, the top two nodes (nodes with the lowest frequency) are taken out
+ * of the heap and made the children of a new node that has a frequency equal to
+ * the sum of the two frequencies of its children.  This new node is inserted
+ * into the heap.  When all the nodes have been removed from the heap, what
+ * remains is the Huffman tree. The Huffman code for a symbol is given by the
+ * path to it in the tree, where each left pointer is mapped to a 0 bit and each
+ * right pointer is mapped to a 1 bit.
+ *
+ * The algorithm used here uses an optimization that removes the need to
+ * actually use a heap.  The leaf nodes are first sorted by frequency, as
+ * opposed to being made into a heap.  Note that this sorting step takes O(n log
+ * n) time vs.  O(n) time for heapifying the array, where n is the number of
+ * symbols.  However, the heapless method is probably faster overall, due to the
+ * time saved later.  In the heapless method, whenever an intermediate node is
+ * created, it is not inserted into the sorted array.  Instead, the intermediate
+ * nodes are kept in a separate array, which is easily kept sorted because every
+ * time an intermediate node is initialized, it will have a frequency at least
+ * as high as that of the previous intermediate node that was initialized.  So
+ * whenever we want the 2 nodes, leaf or intermediate, that have the lowest
+ * frequency, we check the low-frequency ends of both arrays, which is an O(1)
+ * operation.
+ *
+ * The function builds a canonical Huffman code, not just any Huffman code.  A
+ * Huffman code is canonical if the codeword for each symbol numerically
+ * precedes the codeword for all other symbols of the same length that are
+ * numbered higher than the symbol, and additionally, all shorter codewords,
+ * 0-extended, numerically precede longer codewords.  A canonical Huffman code
+ * is useful because it can be reconstructed by only knowing the path lengths in
+ * the tree.  See the make_huffman_decode_table() function to see how to
+ * reconstruct a canonical Huffman code from only the lengths of the codes.
+ *
+ * @num_syms:  The number of symbols in the alphabet.
+ *
+ * @max_codeword_len:  The maximum allowed length of a codeword in the code.
+ *                     Note that if the code being created runs up against
+ *                     this restriction, the code ultimately created will be
+ *                     suboptimal, although there are some advantages for
+ *                     limiting the length of the codewords.
+ *
+ * @freq_tab:  An array of length @num_syms that contains the frequencies
+ *                     of each symbol in the uncompressed data.
+ *
+ * @lens:         An array of length @num_syms into which the lengths of the
+ *                     codewords for each symbol will be written.
+ *
+ * @codewords:    An array of @num_syms short integers into which the
+ *                     codewords for each symbol will be written.  The first
+ *                     lens[i] bits of codewords[i] will contain the codeword
+ *                     for symbol i.
+ */
+void
+make_canonical_huffman_code(unsigned num_syms,
+                           unsigned max_codeword_len,
+                           const input_idx_t freq_tab[restrict],
+                           u8 lens[restrict],
+                           u16 codewords[restrict])
+{
+       /* We require at least 2 possible symbols in the alphabet to produce a
+        * valid Huffman decoding table. It is allowed that fewer than 2 symbols
+        * are actually used, though. */
+       wimlib_assert(num_syms >= 2 && num_syms < INVALID_SYMBOL);
+
+       /* Initialize the lengths and codewords to 0 */
+       memset(lens, 0, num_syms * sizeof(lens[0]));
+       memset(codewords, 0, num_syms * sizeof(codewords[0]));
+
+       /* Calculate how many symbols have non-zero frequency.  These are the
+        * symbols that actually appeared in the input. */
+       unsigned num_used_symbols = 0;
+       for (unsigned i = 0; i < num_syms; i++)
+               if (freq_tab[i] != 0)
+                       num_used_symbols++;
+
+
+       /* It is impossible to make a code for num_used_symbols symbols if there
+        * aren't enough code bits to uniquely represent all of them. */
+       wimlib_assert((1 << max_codeword_len) > num_used_symbols);
+
+       /* Initialize the array of leaf nodes with the symbols and their
+        * frequencies. */
+       HuffmanNode leaves[num_used_symbols];
+       unsigned leaf_idx = 0;
+       for (unsigned i = 0; i < num_syms; i++) {
+               if (freq_tab[i] != 0) {
+                       leaves[leaf_idx].freq = freq_tab[i];
+                       leaves[leaf_idx].sym  = i;
+                       leaves[leaf_idx].height = 0;
+                       leaf_idx++;
+               }
+       }
+
+       /* Deal with the special cases where num_used_symbols < 2. */
+       if (num_used_symbols < 2) {
+               if (num_used_symbols == 0) {
+                       /* If num_used_symbols is 0, there are no symbols in the
+                        * input, so it must be empty.  This should be an error,
+                        * but the LZX format expects this case to succeed.  All
+                        * the codeword lengths are simply marked as 0 (which
+                        * was already done.) */
+               } else {
+                       /* If only one symbol is present, the LZX format
+                        * requires that the Huffman code include two codewords.
+                        * One is not used.  Note that this doesn't make the
+                        * encoded data take up more room anyway, since binary
+                        * data itself has 2 symbols. */
+
+                       unsigned sym = leaves[0].sym;
+
+                       codewords[0] = 0;
+                       lens[0]      = 1;
+                       if (sym == 0) {
+                               /* dummy symbol is 1, real symbol is 0 */
+                               codewords[1] = 1;
+                               lens[1]      = 1;
+                       } else {
+                               /* dummy symbol is 0, real symbol is sym */
+                               codewords[sym] = 1;
+                               lens[sym]      = 1;
+                       }
+               }
+               return;
+       }
+
+       /* Otherwise, there are at least 2 symbols in the input, so we need to
+        * find a real Huffman code. */
+
+
+       /* Declare the array of intermediate nodes.  An intermediate node is not
+        * associated with a symbol. Instead, it represents some binary code
+        * prefix that is shared between at least 2 codewords.  There can be at
+        * most num_used_symbols - 1 intermediate nodes when creating a Huffman
+        * code.  This is because if there were at least num_used_symbols nodes,
+        * the code would be suboptimal because there would be at least one
+        * unnecessary intermediate node.
+        *
+        * The worst case (greatest number of intermediate nodes) would be if
+        * all the intermediate nodes were chained together.  This results in
+        * num_used_symbols - 1 intermediate nodes.  If num_used_symbols is at
+        * least 17, this configuration would not be allowed because the LZX
+        * format constrains codes to 16 bits or less each.  However, it is
+        * still possible for there to be more than 16 intermediate nodes, as
+        * long as no leaf has a depth of more than 16.  */
+       HuffmanIntermediateNode inodes[num_used_symbols - 1];
+
+
+       /* Pointer to the leaf node of lowest frequency that hasn't already been
+        * added as the child of some intermediate note. */
+       HuffmanNode *cur_leaf;
+
+       /* Pointer past the end of the array of leaves. */
+       HuffmanNode *end_leaf = &leaves[num_used_symbols];
+
+       /* Pointer to the intermediate node of lowest frequency. */
+       HuffmanIntermediateNode     *cur_inode;
+
+       /* Pointer to the next unallocated intermediate node. */
+       HuffmanIntermediateNode     *next_inode;
+
+       /* Only jump back to here if the maximum length of the codewords allowed
+        * by the LZX format (16 bits) is exceeded. */
+try_building_tree_again:
+
+       /* Sort the leaves from those that correspond to the least frequent
+        * symbol, to those that correspond to the most frequent symbol.  If two
+        * leaves have the same frequency, they are sorted by symbol. */
+       qsort(leaves, num_used_symbols, sizeof(leaves[0]), cmp_nodes_by_freq);
+
+       cur_leaf   = &leaves[0];
+       cur_inode  = &inodes[0];
+       next_inode = &inodes[0];
+
+       /* The following loop takes the two lowest frequency nodes of those
+        * remaining and makes them the children of the next available
+        * intermediate node.  It continues until all the leaf nodes and
+        * intermediate nodes have been used up, or the maximum allowed length
+        * for the codewords is exceeded.  For the latter case, we must adjust
+        * the frequencies to be more equal and then execute this loop again. */
+       while (1) {
+
+               /* Lowest frequency node. */
+               HuffmanNode *f1;
+
+               /* Second lowest frequency node. */
+               HuffmanNode *f2;
+
+               /* Get the lowest and second lowest frequency nodes from the
+                * remaining leaves or from the intermediate nodes. */
+
+               if (cur_leaf != end_leaf && (cur_inode == next_inode ||
+                                       cur_leaf->freq <= cur_inode->node_base.freq)) {
+                       f1 = cur_leaf++;
+               } else if (cur_inode != next_inode) {
+                       f1 = (HuffmanNode*)cur_inode++;
+               }
+
+               if (cur_leaf != end_leaf && (cur_inode == next_inode ||
+                                       cur_leaf->freq <= cur_inode->node_base.freq)) {
+                       f2 = cur_leaf++;
+               } else if (cur_inode != next_inode) {
+                       f2 = (HuffmanNode*)cur_inode++;
+               } else {
+                       /* All nodes used up! */
+                       break;
+               }
+
+               /* next_inode becomes the parent of f1 and f2. */
+
+               next_inode->node_base.freq = f1->freq + f2->freq;
+               next_inode->node_base.sym  = INVALID_SYMBOL;
+               next_inode->left_child     = f1;
+               next_inode->right_child    = f2;
+
+               /* We need to keep track of the height so that we can detect if
+                * the length of a codeword has execeed max_codeword_len.   The
+                * parent node has a height one higher than the maximum height
+                * of its children. */
+               next_inode->node_base.height = max(f1->height, f2->height) + 1;
+
+               /* Check to see if the code length of the leaf farthest away
+                * from next_inode has exceeded the maximum code length. */
+               if (next_inode->node_base.height > max_codeword_len) {
+                       /* The code lengths can be made more uniform by making
+                        * the frequencies more uniform.  Divide all the
+                        * frequencies by 2, leaving 1 as the minimum frequency.
+                        * If this keeps happening, the symbol frequencies will
+                        * approach equality, which makes their Huffman
+                        * codewords approach the length
+                        * log_2(num_used_symbols).
+                        * */
+                       for (unsigned i = 0; i < num_used_symbols; i++)
+                               leaves[i].freq = (leaves[i].freq + 1) >> 1;
+
+                       goto try_building_tree_again;
+               }
+               next_inode++;
+       }
+
+       /* The Huffman tree is now complete, and its height is no more than
+        * max_codeword_len.  */
+
+       HuffmanIntermediateNode *root = next_inode - 1;
+       wimlib_assert(root->node_base.height <= max_codeword_len);
+
+       /* Compute the path lengths for the leaf nodes. */
+       huffman_tree_compute_path_lengths(&root->node_base, 0);
+
+       /* Sort the leaf nodes primarily by code length and secondarily by
+        * symbol.  */
+       qsort(leaves, num_used_symbols, sizeof(leaves[0]), cmp_nodes_by_code_len);
+
+       u16 cur_codeword = 0;
+       unsigned cur_codeword_len = 0;
+       for (unsigned i = 0; i < num_used_symbols; i++) {
+
+               /* Each time a codeword becomes one longer, the current codeword
+                * is left shifted by one place.  This is part of the procedure
+                * for enumerating the canonical Huffman code.  Additionally,
+                * whenever a codeword is used, 1 is added to the current
+                * codeword.  */
+
+               unsigned len_diff = leaves[i].path_len - cur_codeword_len;
+               cur_codeword <<= len_diff;
+               cur_codeword_len += len_diff;
+
+               u16 sym = leaves[i].sym;
+               codewords[sym] = cur_codeword;
+               lens[sym] = cur_codeword_len;
+
+               cur_codeword++;
+       }
+}
diff --git a/src/compress_parallel.c b/src/compress_parallel.c

index 25403423bd35af84f516908336cee520fa1193d6..d0ce5266464cb4021797cbd2a81c4ed5c5c652c3 100644 (file)
--- a/src/compress_parallel.c
+++ b/src/compress_parallel.c
@@ -27,7 +27,7 @@
  #endif
  
  #include "wimlib/assert.h"
-#include "wimlib/compress_chunks.h"
+#include "wimlib/chunk_compressor.h"
  #include "wimlib/error.h"
  #include "wimlib/list.h"
  #include "wimlib/util.h"
@@ -54,9 +54,7 @@ struct compressor_thread_data {
         pthread_t thread;
         struct message_queue *chunks_to_compress_queue;
         struct message_queue *compressed_chunks_queue;
-       int out_ctype;
-       u32 out_chunk_size;
-       struct wimlib_lzx_context *comp_ctx;
+       struct wimlib_compressor *compressor;
  };
  
  #define MAX_CHUNKS_PER_MSG 2
@@ -251,17 +249,17 @@ allocate_messages(size_t count, size_t chunks_per_msg, u32 out_chunk_size)
  }
  
  static void
-compress_chunks(struct message *msg, int out_ctype,
-               struct wimlib_lzx_context *comp_ctx)
+compress_chunks(struct message *msg, struct wimlib_compressor *compressor)
  {
  
         for (size_t i = 0; i < msg->num_filled_chunks; i++) {
+               wimlib_assert(msg->uncompressed_chunk_sizes[i] != 0);
                 msg->compressed_chunk_sizes[i] =
-                       compress_chunk(msg->uncompressed_chunks[i],
-                                      msg->uncompressed_chunk_sizes[i],
-                                      msg->compressed_chunks[i],
-                                      out_ctype,
-                                      comp_ctx);
+                       wimlib_compress(msg->uncompressed_chunks[i],
+                                       msg->uncompressed_chunk_sizes[i],
+                                       msg->compressed_chunks[i],
+                                       msg->uncompressed_chunk_sizes[i] - 1,
+                                       compressor);
         }
  }
  
@@ -272,7 +270,7 @@ compressor_thread_proc(void *arg)
         struct message *msg;
  
         while ((msg = message_queue_get(params->chunks_to_compress_queue)) != NULL) {
-               compress_chunks(msg, params->out_ctype, params->comp_ctx);
+               compress_chunks(msg, params->compressor);
                 message_queue_put(params->compressed_chunks_queue, msg);
         }
         return NULL;
@@ -298,10 +296,9 @@ parallel_chunk_compressor_destroy(struct chunk_compressor *_ctx)
         message_queue_destroy(&ctx->chunks_to_compress_queue);
         message_queue_destroy(&ctx->compressed_chunks_queue);
  
-       if (ctx->base.out_ctype == WIMLIB_COMPRESSION_TYPE_LZX &&
-           ctx->thread_data != NULL)
+       if (ctx->thread_data != NULL)
                 for (i = 0; i < ctx->num_threads; i++)
-                       wimlib_lzx_free_context(ctx->thread_data[i].comp_ctx);
+                       wimlib_free_compressor(ctx->thread_data[i].compressor);
  
         FREE(ctx->thread_data);
  
@@ -493,14 +490,10 @@ new_parallel_chunk_compressor(int out_ctype, u32 out_chunk_size,
  
                 dat->chunks_to_compress_queue = &ctx->chunks_to_compress_queue;
                 dat->compressed_chunks_queue = &ctx->compressed_chunks_queue;
-               dat->out_ctype = out_ctype;
-               dat->out_chunk_size = out_chunk_size;
-               if (out_ctype == WIMLIB_COMPRESSION_TYPE_LZX) {
-                       ret = wimlib_lzx_alloc_context(out_chunk_size, NULL,
-                                                      &dat->comp_ctx);
-                       if (ret)
-                               goto err;
-               }
+               ret = wimlib_create_compressor(out_ctype, out_chunk_size,
+                                              NULL, &dat->compressor);
+               if (ret)
+                       goto err;
         }
  
         for (ctx->num_started_threads = 0;
diff --git a/src/compress_serial.c b/src/compress_serial.c

index b3c6293eef95019aec730229f4e8aab3c5b0c14e..0ae354834286b8e84db6987e7391df262f2df89e 100644 (file)
--- a/src/compress_serial.c
+++ b/src/compress_serial.c
@@ -28,14 +28,14 @@
  
  #include "wimlib.h"
  #include "wimlib/assert.h"
-#include "wimlib/compress_chunks.h"
+#include "wimlib/chunk_compressor.h"
  #include "wimlib/util.h"
  
  #include <string.h>
  
  struct serial_chunk_compressor {
         struct chunk_compressor base;
-       struct wimlib_lzx_context *comp_ctx;
+       struct wimlib_compressor *compressor;
         u8 *udata;
         u8 *cdata;
         unsigned ulen;
@@ -50,6 +50,7 @@ serial_chunk_compressor_destroy(struct chunk_compressor *_ctx)
         if (ctx == NULL)
                 return;
  
+       wimlib_free_compressor(ctx->compressor);
         FREE(ctx->udata);
         FREE(ctx->cdata);
         FREE(ctx);
@@ -82,9 +83,9 @@ serial_chunk_compressor_get_chunk(struct chunk_compressor *_ctx,
         if (ctx->ulen == 0)
                 return false;
  
-       ctx->clen = compress_chunk(ctx->udata, ctx->ulen,
-                                  ctx->cdata, ctx->base.out_ctype,
-                                  ctx->comp_ctx);
+       ctx->clen = wimlib_compress(ctx->udata, ctx->ulen,
+                                   ctx->cdata, ctx->ulen - 1,
+                                   ctx->compressor);
  
         if (ctx->clen) {
                 *cdata_ret = ctx->cdata;
@@ -101,14 +102,14 @@ serial_chunk_compressor_get_chunk(struct chunk_compressor *_ctx,
  
  int
  new_serial_chunk_compressor(int out_ctype, u32 out_chunk_size,
-                           struct wimlib_lzx_context *comp_ctx,
                             struct chunk_compressor **compressor_ret)
  {
         struct serial_chunk_compressor *ctx;
+       int ret;
  
         ctx = CALLOC(1, sizeof(*ctx));
         if (ctx == NULL)
-               goto err;
+               return WIMLIB_ERR_NOMEM;
  
         ctx->base.out_ctype = out_ctype;
         ctx->base.out_chunk_size = out_chunk_size;
@@ -117,17 +118,24 @@ new_serial_chunk_compressor(int out_ctype, u32 out_chunk_size,
         ctx->base.submit_chunk = serial_chunk_compressor_submit_chunk;
         ctx->base.get_chunk = serial_chunk_compressor_get_chunk;
  
-       ctx->comp_ctx = comp_ctx;
+
+       ret = wimlib_create_compressor(out_ctype, out_chunk_size,
+                                      NULL, &ctx->compressor);
+       if (ret)
+               goto err;
+
         ctx->udata = MALLOC(out_chunk_size);
         ctx->cdata = MALLOC(out_chunk_size - 1);
         ctx->ulen = 0;
-       if (ctx->udata == NULL || ctx->cdata == NULL)
+       if (ctx->udata == NULL || ctx->cdata == NULL) {
+               ret = WIMLIB_ERR_NOMEM;
                 goto err;
+       }
  
         *compressor_ret = &ctx->base;
         return 0;
  
  err:
         serial_chunk_compressor_destroy(&ctx->base);
-       return WIMLIB_ERR_NOMEM;
+       return ret;
  }
diff --git a/src/decompress.c b/src/decompress.c

index c94696ddf3cd68ebb380cb4db6874d38f09459a5..4ea066f0d4a86a628c70941330554d8a5c745e3e 100644 (file)
--- a/src/decompress.c
+++ b/src/decompress.c
@@ -1,11 +1,12 @@
  /*
   * decompress.c
   *
- * Functions used for decompression.
+ * Generic functions for decompression, wrapping around actual decompression
+ * implementations.
   */
  
  /*
- * Copyright (C) 2012, 2013 Eric Biggers
+ * Copyright (C) 2013 Eric Biggers
   *
   * This file is part of wimlib, a library for working with WIM files.
   *
@@ -27,406 +28,121 @@
  #  include "config.h"
  #endif
  
-#include "wimlib/decompress.h"
-#include "wimlib/error.h"
+#include "wimlib.h"
+#include "wimlib/decompressor_ops.h"
  #include "wimlib/util.h"
  
-#include <string.h>
-
-#ifdef __GNUC__
-#  ifdef __SSE2__
-#    define USE_SSE2_FILL
-#    include <emmintrin.h>
-#  else
-#    define USE_LONG_FILL
-#  endif
-#endif
-
-/*
- * make_huffman_decode_table: - Builds a fast huffman decoding table from an
- * array that gives the length of the codeword for each symbol in the alphabet.
- * Originally based on code written by David Tritscher (taken the original LZX
- * decompression code); also heavily modified to add some optimizations used in
- * the zlib code, as well as more comments; also added some optimizations to
- * make filling in the decode table entries faster (may not help significantly
- * though).
- *
- * @decode_table:      The array in which to create the fast huffman decoding
- *                     table.  It must have a length of at least
- *                     (2**table_bits) + 2 * num_syms to guarantee
- *                     that there is enough space.  Also must be 16-byte
- *                     aligned (at least when USE_SSE2_FILL gets defined).
- *
- * @num_syms:          Number of symbols in the alphabet, including symbols
- *                     that do not appear in this particular input chunk.
- *
- * @table_bits:                Any symbols with a code length of table_bits or less can
- *                     be decoded in one lookup of the table.  2**table_bits
- *                     must be greater than or equal to @num_syms if there are
- *                     any Huffman codes longer than @table_bits.
- *
- * @lens:              An array of length @num_syms, indexable by symbol, that
- *                     gives the length of the Huffman codeword for that
- *                     symbol.  Because the Huffman tree is in canonical form,
- *                     it can be reconstructed by only knowing the length of
- *                     the codeword for each symbol.  It is assumed, but not
- *                     checked, that every length is less than
- *                     @max_codeword_len.
- *
- * @max_codeword_len:  The longest codeword length allowed in the compression
- *                     format.
- *
- * Returns 0 on success; returns -1 if the length values do not correspond to a
- * valid Huffman tree.
- *
- * The format of the Huffamn decoding table is as follows.  The first (1 <<
- * table_bits) entries of the table are indexed by chunks of the input of size
- * @table_bits.  If the next Huffman codeword in the input happens to have a
- * length of exactly @table_bits, the symbol is simply read directly from the
- * decoding table.  Alternatively, if the next Huffman codeword has length _less
- * than_ @table_bits, the symbol is also read directly from the decode table;
- * this is possible because every entry in the table that is indexed by an
- * integer that has the shorter codeword as a binary prefix is filled in with
- * the appropriate symbol.  If a codeword has length n <= table_bits, it will
- * have 2**(table_bits - n) possible suffixes, and thus that many entries in the
- * decoding table.
- *
- * It's a bit more complicated if the next Huffman codeword has length of more
- * than @table_bits.  The table entry indexed by the first @table_bits of that
- * codeword cannot give the appropriate symbol directly, because that entry is
- * guaranteed to be referenced by the Huffman codewords of multiple symbols.
- * And while the LZX compression format does not allow codes longer than 16
- * bits, a table of size (2 ** 16) = 65536 entries would be too slow to create.
- *
- * There are several different ways to make it possible to look up the symbols
- * for codewords longer than @table_bits.  One way is to make the entries for
- * the prefixes of length @table_bits of those entries be pointers to additional
- * decoding tables that are indexed by some number of additional bits of the
- * codeword.  The technique used here is a bit simpler, however: just store the
- * needed subtrees of the Huffman tree in the decoding table after the lookup
- * entries, beginning at index (2**table_bits).  Real pointers are replaced by
- * indices into the decoding table, and symbol entries are distinguished from
- * pointers by the fact that values less than @num_syms must be symbol values.
- */
-int
-make_huffman_decode_table(u16 *decode_table,  unsigned num_syms,
-                         unsigned table_bits, const u8 *lens,
-                         unsigned max_codeword_len)
+struct wimlib_decompressor {
+       const struct decompressor_ops *ops;
+       void *private;
+};
+
+static const struct decompressor_ops *decompressor_ops[] = {
+       [WIMLIB_COMPRESSION_TYPE_LZX]    = &lzx_decompressor_ops,
+       [WIMLIB_COMPRESSION_TYPE_XPRESS] = &xpress_decompressor_ops,
+       [WIMLIB_COMPRESSION_TYPE_LZMS]   = &lzms_decompressor_ops,
+};
+
+static struct wimlib_decompressor_params_header *
+decompressor_default_params[ARRAY_LEN(decompressor_ops)] = {
+       [WIMLIB_COMPRESSION_TYPE_LZX]    = NULL,
+       [WIMLIB_COMPRESSION_TYPE_XPRESS] = NULL,
+       [WIMLIB_COMPRESSION_TYPE_LZMS]   = NULL,
+};
+
+static bool
+decompressor_ctype_valid(int ctype)
  {
-       unsigned len_counts[max_codeword_len + 1];
-       u16 sorted_syms[num_syms];
-       unsigned offsets[max_codeword_len + 1];
-       const unsigned table_num_entries = 1 << table_bits;
-       int left;
-       unsigned decode_table_pos;
-       void *decode_table_ptr;
-       unsigned sym_idx;
-       unsigned codeword_len;
-       unsigned stores_per_loop;
-
-#ifdef USE_LONG_FILL
-       const unsigned entries_per_long = sizeof(unsigned long) / sizeof(decode_table[0]);
-#endif
-
-#ifdef USE_SSE2_FILL
-       const unsigned entries_per_xmm = sizeof(__m128i) / sizeof(decode_table[0]);
-#endif
-
-       wimlib_assert2((uintptr_t)decode_table % DECODE_TABLE_ALIGNMENT == 0);
-
-       /* accumulate lengths for codes */
-       for (unsigned i = 0; i <= max_codeword_len; i++)
-               len_counts[i] = 0;
-
-       for (unsigned sym = 0; sym < num_syms; sym++) {
-               wimlib_assert2(lens[sym] <= max_codeword_len);
-               len_counts[lens[sym]]++;
-       }
-
-       /* check for an over-subscribed or incomplete set of lengths */
-       left = 1;
-       for (unsigned len = 1; len <= max_codeword_len; len++) {
-               left <<= 1;
-               left -= len_counts[len];
-               if (unlikely(left < 0)) { /* over-subscribed */
-                       DEBUG("Invalid Huffman code (over-subscribed)");
-                       return -1;
-               }
-       }
-
-       if (unlikely(left != 0)) /* incomplete set */{
-               if (left == 1 << max_codeword_len) {
-                       /* Empty code--- okay in XPRESS and LZX */
-                       memset(decode_table, 0,
-                              table_num_entries * sizeof(decode_table[0]));
-                       return 0;
-               } else {
-                       DEBUG("Invalid Huffman code (incomplete set)");
-                       return -1;
-               }
-       }
-
-       /* Generate offsets into symbol table for each length for sorting */
-       offsets[1] = 0;
-       for (unsigned len = 1; len < max_codeword_len; len++)
-               offsets[len + 1] = offsets[len] + len_counts[len];
-
-       /* Sort symbols primarily by length and secondarily by symbol order.
-        * This is basically a count-sort over the codeword lengths. */
-       for (unsigned sym = 0; sym < num_syms; sym++)
-               if (lens[sym] != 0)
-                       sorted_syms[offsets[lens[sym]]++] = sym;
-
-       /* Fill entries for codewords short enough for a direct mapping.  We can
-        * take advantage of the ordering of the codewords, since the Huffman
-        * code is canonical.  It must be the case that all the codewords of
-        * some length L numerically precede all the codewords of length L + 1.
-        * Furthermore, if we have 2 symbols A and B with the same codeword
-        * length but symbol A is sorted before symbol B, then then we know that
-        * the codeword for A numerically precedes the codeword for B. */
-       decode_table_ptr = decode_table;
-       sym_idx = 0;
-       codeword_len = 1;
-#ifdef USE_SSE2_FILL
-       /* Fill in the Huffman decode table entries one 128-bit vector at a
-        * time.  This is 8 entries per store. */
-       stores_per_loop = (1 << (table_bits - codeword_len)) / entries_per_xmm;
-       for (; stores_per_loop != 0; codeword_len++, stores_per_loop >>= 1) {
-               unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
-               for (; sym_idx < end_sym_idx; sym_idx++) {
-                       /* Note: unlike in the 'long' version below, the __m128i
-                        * type already has __attribute__((may_alias)), so using
-                        * it to access the decode table, which is an array of
-                        * unsigned shorts, will not violate strict aliasing. */
-                       u16 sym;
-                       __m128i v;
-                       __m128i *p;
-                       unsigned n;
-
-                       sym = sorted_syms[sym_idx];
-
-                       v = _mm_set1_epi16(sym);
-                       p = (__m128i*)decode_table_ptr;
-                       n = stores_per_loop;
-                       do {
-                               *p++ = v;
-                       } while (--n);
-                       decode_table_ptr = p;
-               }
-       }
-#endif /* USE_SSE2_FILL */
-
-#ifdef USE_LONG_FILL
-       /* Fill in the Huffman decode table entries one 'unsigned long' at a
-        * time.  On 32-bit systems this is 2 entries per store, while on 64-bit
-        * systems this is 4 entries per store. */
-       stores_per_loop = (1 << (table_bits - codeword_len)) / entries_per_long;
-       for (; stores_per_loop != 0; codeword_len++, stores_per_loop >>= 1) {
-               unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
-               for (; sym_idx < end_sym_idx; sym_idx++) {
-
-                       /* Accessing the array of unsigned shorts as unsigned
-                        * longs would violate strict aliasing and would require
-                        * compiling the code with -fno-strict-aliasing to
-                        * guarantee correctness.  To work around this problem,
-                        * use the gcc 'may_alias' extension to define a special
-                        * unsigned long type that may alias any other in-memory
-                        * variable.  */
-                       typedef unsigned long __attribute__((may_alias)) aliased_long_t;
-
-                       u16 sym;
-                       aliased_long_t *p;
-                       aliased_long_t v;
-                       unsigned n;
-
-                       sym = sorted_syms[sym_idx];
-
-                       BUILD_BUG_ON(sizeof(aliased_long_t) != 4 &&
-                                    sizeof(aliased_long_t) != 8);
+       return (ctype >= 0 &&
+               ctype < ARRAY_LEN(decompressor_ops) &&
+               decompressor_ops[ctype] != NULL);
+}
  
-                       v = sym;
-                       if (sizeof(aliased_long_t) >= 4)
-                               v |= v << 16;
-                       if (sizeof(aliased_long_t) >= 8) {
-                               /* This may produce a compiler warning if an
-                                * aliased_long_t is 32 bits, but this won't be
-                                * executed unless an aliased_long_t is at least
-                                * 64 bits anyway. */
-                               v |= v << 32;
-                       }
+WIMLIBAPI int
+wimlib_set_default_decompressor_params(enum wimlib_compression_type ctype,
+                                      const struct wimlib_decompressor_params_header *params)
+{
+       struct wimlib_decompressor_params_header *dup;
  
-                       p = (aliased_long_t *)decode_table_ptr;
-                       n = stores_per_loop;
+       if (!decompressor_ctype_valid(ctype))
+               return WIMLIB_ERR_INVALID_COMPRESSION_TYPE;
  
-                       do {
-                               *p++ = v;
-                       } while (--n);
-                       decode_table_ptr = p;
-               }
+       dup = NULL;
+       if (params) {
+               dup = memdup(params, params->size);
+               if (dup == NULL)
+                       return WIMLIB_ERR_NOMEM;
         }
-#endif /* USE_LONG_FILL */
-
-       /* Fill in the Huffman decode table entries one 16-bit integer at a
-        * time. */
-       stores_per_loop = (1 << (table_bits - codeword_len));
-       for (; stores_per_loop != 0; codeword_len++, stores_per_loop >>= 1) {
-               unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
-               for (; sym_idx < end_sym_idx; sym_idx++) {
-                       u16 sym;
-                       u16 *p;
-                       unsigned n;
-
-                       sym = sorted_syms[sym_idx];
  
-                       p = (u16*)decode_table_ptr;
-                       n = stores_per_loop;
-
-                       do {
-                               *p++ = sym;
-                       } while (--n);
+       FREE(decompressor_default_params[ctype]);
+       decompressor_default_params[ctype] = dup;
+       return 0;
+}
  
-                       decode_table_ptr = p;
-               }
+void
+cleanup_decompressor_params(void)
+{
+       for (size_t i = 0; i < ARRAY_LEN(decompressor_default_params); i++) {
+               FREE(decompressor_default_params[i]);
+               decompressor_default_params[i] = NULL;
         }
+}
  
-       /* If we've filled in the entire table, we are done.  Otherwise, there
-        * are codes longer than table bits that we need to store in the
-        * tree-like structure at the end of the table rather than directly in
-        * the main decode table itself. */
-
-       decode_table_pos = (u16*)decode_table_ptr - decode_table;
-       if (decode_table_pos != table_num_entries) {
-               unsigned j;
-               unsigned next_free_tree_slot;
-               unsigned cur_codeword;
-
-               wimlib_assert2(decode_table_pos < table_num_entries);
-
-               /* Fill in the remaining entries, which correspond to codes
-                * longer than @table_bits.
-                *
-                * First, zero out the rest of the entries.  This is necessary
-                * so that the entries appear as "unallocated" in the next part.
-                * */
-               j = decode_table_pos;
-               do {
-                       decode_table[j] = 0;
-               } while (++j != table_num_entries);
-
-               /* Assert that 2**table_bits is at least num_syms.  If this
-                * wasn't the case, we wouldn't be able to distinguish pointer
-                * entries from symbol entries. */
-               wimlib_assert2(table_num_entries >= num_syms);
-
-
-               /* The tree nodes are allocated starting at decode_table[1 <<
-                * table_bits].  Remember that the full size of the table,
-                * including the extra space for the tree nodes, is actually
-                * 2**table_bits + 2 * num_syms slots, while table_num_entries
-                * is only 2**table_bits. */
-               next_free_tree_slot = table_num_entries;
-
-               /* The current Huffman codeword  */
-               cur_codeword = decode_table_pos << 1;
-
-               /* Go through every codeword of length greater than @table_bits,
-                * primarily in order of codeword length and secondarily in
-                * order of symbol. */
-               wimlib_assert2(codeword_len == table_bits + 1);
-               for (; codeword_len <= max_codeword_len; codeword_len++, cur_codeword <<= 1)
-               {
-                       unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
-                       for (; sym_idx < end_sym_idx; sym_idx++, cur_codeword++) {
-                               unsigned sym = sorted_syms[sym_idx];
-                               unsigned extra_bits = codeword_len - table_bits;
-
-                               /* index of the current node; find it from the
-                                * prefix of the current Huffman codeword. */
-                               unsigned node_idx = cur_codeword >> extra_bits;
-                               wimlib_assert2(node_idx < table_num_entries);
-
-                               /* Go through each bit of the current Huffman
-                                * codeword beyond the prefix of length
-                                * @table_bits and walk the tree, allocating any
-                                * slots that have not yet been allocated. */
-                               do {
-
-                                       /* If the current tree node points to
-                                        * nowhere but we need to follow it,
-                                        * allocate a new node for it to point
-                                        * to. */
-                                       if (decode_table[node_idx] == 0) {
-                                               decode_table[node_idx] = next_free_tree_slot;
-                                               decode_table[next_free_tree_slot++] = 0;
-                                               decode_table[next_free_tree_slot++] = 0;
-                                               wimlib_assert2(next_free_tree_slot <=
-                                                              table_num_entries + 2 * num_syms);
-                                       }
-
-                                       /* Set node_idx to left child */
-                                       node_idx = decode_table[node_idx];
-
-                                       /* Is the next bit 0 or 1? If 0, go left
-                                        * (already done).  If 1, go right by
-                                        * incrementing node_idx. */
-                                       --extra_bits;
-                                       node_idx += (cur_codeword >> extra_bits) & 1;
-                               } while (extra_bits != 0);
-
-                               /* node_idx is now the index of the leaf entry
-                                * into which the actual symbol will go. */
-                               decode_table[node_idx] = sym;
-
-                               /* Note: cur_codeword is always incremented at
-                                * the end of this loop because this is how
-                                * canonical Huffman codes are generated (add 1
-                                * for each code, then left shift whenever the
-                                * code length increases) */
-                       }
+WIMLIBAPI int
+wimlib_create_decompressor(enum wimlib_compression_type ctype,
+                          size_t max_block_size,
+                          const struct wimlib_decompressor_params_header *extra_params,
+                          struct wimlib_decompressor **dec_ret)
+{
+       struct wimlib_decompressor *dec;
+
+       if (dec_ret == NULL)
+               return WIMLIB_ERR_INVALID_PARAM;
+
+       if (!decompressor_ctype_valid(ctype))
+               return WIMLIB_ERR_INVALID_COMPRESSION_TYPE;
+
+       dec = MALLOC(sizeof(*dec));
+       if (dec == NULL)
+               return WIMLIB_ERR_NOMEM;
+       dec->ops = decompressor_ops[ctype];
+       dec->private = NULL;
+       if (dec->ops->create_decompressor) {
+               const struct wimlib_decompressor_params_header *params;
+               int ret;
+
+               if (extra_params)
+                       params = extra_params;
+               else
+                       params = decompressor_default_params[ctype];
+               ret = dec->ops->create_decompressor(max_block_size,
+                                                   params,
+                                                   &dec->private);
+               if (ret) {
+                       FREE(dec);
+                       return ret;
                 }
         }
+       *dec_ret = dec;
         return 0;
  }
  
-/* Reads a Huffman-encoded symbol from the bistream when the number of remaining
- * bits is less than the maximum codeword length. */
-int
-read_huffsym_near_end_of_input(struct input_bitstream *istream,
-                              const u16 decode_table[],
-                              const u8 lens[],
-                              unsigned num_syms,
-                              unsigned table_bits,
-                              unsigned *n)
+WIMLIBAPI int
+wimlib_decompress(const void *compressed_data, size_t compressed_size,
+                 void *uncompressed_data, size_t uncompressed_size,
+                 struct wimlib_decompressor *dec)
  {
-       unsigned bitsleft = istream->bitsleft;
-       unsigned key_size;
-       u16 sym;
-       u16 key_bits;
-
-       if (table_bits > bitsleft) {
-               key_size = bitsleft;
-               bitsleft = 0;
-               key_bits = bitstream_peek_bits(istream, key_size) <<
-                                               (table_bits - key_size);
-       } else {
-               key_size = table_bits;
-               bitsleft -= table_bits;
-               key_bits = bitstream_peek_bits(istream, table_bits);
-       }
+       return dec->ops->decompress(compressed_data, compressed_size,
+                                   uncompressed_data, uncompressed_size,
+                                   dec->private);
+}
  
-       sym = decode_table[key_bits];
-       if (sym >= num_syms) {
-               bitstream_remove_bits(istream, key_size);
-               do {
-                       if (bitsleft == 0)
-                               return -1;
-                       key_bits = sym + bitstream_peek_bits(istream, 1);
-                       bitstream_remove_bits(istream, 1);
-                       bitsleft--;
-               } while ((sym = decode_table[key_bits]) >= num_syms);
-       } else {
-               bitstream_remove_bits(istream, lens[sym]);
+WIMLIBAPI void
+wimlib_free_decompressor(struct wimlib_decompressor *dec)
+{
+       if (dec) {
+               if (dec->ops->free_decompressor)
+                       dec->ops->free_decompressor(dec->private);
+               FREE(dec);
         }
-       *n = sym;
-       return 0;
  }
diff --git a/src/decompress_common.c b/src/decompress_common.c

new file mode 100644 (file)

index 0000000..767527d
--- /dev/null
+++ b/src/decompress_common.c
@@ -0,0 +1,432 @@
+/*
+ * decompress_common.c
+ *
+ * Code for decompression shared among multiple compression formats.
+ */
+
+/*
+ * Copyright (C) 2012, 2013 Eric Biggers
+ *
+ * This file is part of wimlib, a library for working with WIM files.
+ *
+ * wimlib is free software; you can redistribute it and/or modify it under the
+ * terms of the GNU General Public License as published by the Free
+ * Software Foundation; either version 3 of the License, or (at your option)
+ * any later version.
+ *
+ * wimlib is distributed in the hope that it will be useful, but WITHOUT ANY
+ * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
+ * A PARTICULAR PURPOSE. See the GNU General Public License for more
+ * details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with wimlib; if not, see http://www.gnu.org/licenses/.
+ */
+
+#ifdef HAVE_CONFIG_H
+#  include "config.h"
+#endif
+
+#include "wimlib/decompress_common.h"
+#include "wimlib/error.h"
+#include "wimlib/util.h"
+
+#include <string.h>
+
+#ifdef __GNUC__
+#  ifdef __SSE2__
+#    define USE_SSE2_FILL
+#    include <emmintrin.h>
+#  else
+#    define USE_LONG_FILL
+#  endif
+#endif
+
+/*
+ * make_huffman_decode_table: - Builds a fast huffman decoding table from an
+ * array that gives the length of the codeword for each symbol in the alphabet.
+ * Originally based on code written by David Tritscher (taken the original LZX
+ * decompression code); also heavily modified to add some optimizations used in
+ * the zlib code, as well as more comments; also added some optimizations to
+ * make filling in the decode table entries faster (may not help significantly
+ * though).
+ *
+ * @decode_table:      The array in which to create the fast huffman decoding
+ *                     table.  It must have a length of at least
+ *                     (2**table_bits) + 2 * num_syms to guarantee
+ *                     that there is enough space.  Also must be 16-byte
+ *                     aligned (at least when USE_SSE2_FILL gets defined).
+ *
+ * @num_syms:          Number of symbols in the alphabet, including symbols
+ *                     that do not appear in this particular input chunk.
+ *
+ * @table_bits:                Any symbols with a code length of table_bits or less can
+ *                     be decoded in one lookup of the table.  2**table_bits
+ *                     must be greater than or equal to @num_syms if there are
+ *                     any Huffman codes longer than @table_bits.
+ *
+ * @lens:              An array of length @num_syms, indexable by symbol, that
+ *                     gives the length of the Huffman codeword for that
+ *                     symbol.  Because the Huffman tree is in canonical form,
+ *                     it can be reconstructed by only knowing the length of
+ *                     the codeword for each symbol.  It is assumed, but not
+ *                     checked, that every length is less than
+ *                     @max_codeword_len.
+ *
+ * @max_codeword_len:  The longest codeword length allowed in the compression
+ *                     format.
+ *
+ * Returns 0 on success; returns -1 if the length values do not correspond to a
+ * valid Huffman tree.
+ *
+ * The format of the Huffamn decoding table is as follows.  The first (1 <<
+ * table_bits) entries of the table are indexed by chunks of the input of size
+ * @table_bits.  If the next Huffman codeword in the input happens to have a
+ * length of exactly @table_bits, the symbol is simply read directly from the
+ * decoding table.  Alternatively, if the next Huffman codeword has length _less
+ * than_ @table_bits, the symbol is also read directly from the decode table;
+ * this is possible because every entry in the table that is indexed by an
+ * integer that has the shorter codeword as a binary prefix is filled in with
+ * the appropriate symbol.  If a codeword has length n <= table_bits, it will
+ * have 2**(table_bits - n) possible suffixes, and thus that many entries in the
+ * decoding table.
+ *
+ * It's a bit more complicated if the next Huffman codeword has length of more
+ * than @table_bits.  The table entry indexed by the first @table_bits of that
+ * codeword cannot give the appropriate symbol directly, because that entry is
+ * guaranteed to be referenced by the Huffman codewords of multiple symbols.
+ * And while the LZX compression format does not allow codes longer than 16
+ * bits, a table of size (2 ** 16) = 65536 entries would be too slow to create.
+ *
+ * There are several different ways to make it possible to look up the symbols
+ * for codewords longer than @table_bits.  One way is to make the entries for
+ * the prefixes of length @table_bits of those entries be pointers to additional
+ * decoding tables that are indexed by some number of additional bits of the
+ * codeword.  The technique used here is a bit simpler, however: just store the
+ * needed subtrees of the Huffman tree in the decoding table after the lookup
+ * entries, beginning at index (2**table_bits).  Real pointers are replaced by
+ * indices into the decoding table, and symbol entries are distinguished from
+ * pointers by the fact that values less than @num_syms must be symbol values.
+ */
+int
+make_huffman_decode_table(u16 *decode_table,  unsigned num_syms,
+                         unsigned table_bits, const u8 *lens,
+                         unsigned max_codeword_len)
+{
+       unsigned len_counts[max_codeword_len + 1];
+       u16 sorted_syms[num_syms];
+       unsigned offsets[max_codeword_len + 1];
+       const unsigned table_num_entries = 1 << table_bits;
+       int left;
+       unsigned decode_table_pos;
+       void *decode_table_ptr;
+       unsigned sym_idx;
+       unsigned codeword_len;
+       unsigned stores_per_loop;
+
+#ifdef USE_LONG_FILL
+       const unsigned entries_per_long = sizeof(unsigned long) / sizeof(decode_table[0]);
+#endif
+
+#ifdef USE_SSE2_FILL
+       const unsigned entries_per_xmm = sizeof(__m128i) / sizeof(decode_table[0]);
+#endif
+
+       wimlib_assert2((uintptr_t)decode_table % DECODE_TABLE_ALIGNMENT == 0);
+
+       /* accumulate lengths for codes */
+       for (unsigned i = 0; i <= max_codeword_len; i++)
+               len_counts[i] = 0;
+
+       for (unsigned sym = 0; sym < num_syms; sym++) {
+               wimlib_assert2(lens[sym] <= max_codeword_len);
+               len_counts[lens[sym]]++;
+       }
+
+       /* check for an over-subscribed or incomplete set of lengths */
+       left = 1;
+       for (unsigned len = 1; len <= max_codeword_len; len++) {
+               left <<= 1;
+               left -= len_counts[len];
+               if (unlikely(left < 0)) { /* over-subscribed */
+                       DEBUG("Invalid Huffman code (over-subscribed)");
+                       return -1;
+               }
+       }
+
+       if (unlikely(left != 0)) /* incomplete set */{
+               if (left == 1 << max_codeword_len) {
+                       /* Empty code--- okay in XPRESS and LZX */
+                       memset(decode_table, 0,
+                              table_num_entries * sizeof(decode_table[0]));
+                       return 0;
+               } else {
+                       DEBUG("Invalid Huffman code (incomplete set)");
+                       return -1;
+               }
+       }
+
+       /* Generate offsets into symbol table for each length for sorting */
+       offsets[1] = 0;
+       for (unsigned len = 1; len < max_codeword_len; len++)
+               offsets[len + 1] = offsets[len] + len_counts[len];
+
+       /* Sort symbols primarily by length and secondarily by symbol order.
+        * This is basically a count-sort over the codeword lengths. */
+       for (unsigned sym = 0; sym < num_syms; sym++)
+               if (lens[sym] != 0)
+                       sorted_syms[offsets[lens[sym]]++] = sym;
+
+       /* Fill entries for codewords short enough for a direct mapping.  We can
+        * take advantage of the ordering of the codewords, since the Huffman
+        * code is canonical.  It must be the case that all the codewords of
+        * some length L numerically precede all the codewords of length L + 1.
+        * Furthermore, if we have 2 symbols A and B with the same codeword
+        * length but symbol A is sorted before symbol B, then then we know that
+        * the codeword for A numerically precedes the codeword for B. */
+       decode_table_ptr = decode_table;
+       sym_idx = 0;
+       codeword_len = 1;
+#ifdef USE_SSE2_FILL
+       /* Fill in the Huffman decode table entries one 128-bit vector at a
+        * time.  This is 8 entries per store. */
+       stores_per_loop = (1 << (table_bits - codeword_len)) / entries_per_xmm;
+       for (; stores_per_loop != 0; codeword_len++, stores_per_loop >>= 1) {
+               unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
+               for (; sym_idx < end_sym_idx; sym_idx++) {
+                       /* Note: unlike in the 'long' version below, the __m128i
+                        * type already has __attribute__((may_alias)), so using
+                        * it to access the decode table, which is an array of
+                        * unsigned shorts, will not violate strict aliasing. */
+                       u16 sym;
+                       __m128i v;
+                       __m128i *p;
+                       unsigned n;
+
+                       sym = sorted_syms[sym_idx];
+
+                       v = _mm_set1_epi16(sym);
+                       p = (__m128i*)decode_table_ptr;
+                       n = stores_per_loop;
+                       do {
+                               *p++ = v;
+                       } while (--n);
+                       decode_table_ptr = p;
+               }
+       }
+#endif /* USE_SSE2_FILL */
+
+#ifdef USE_LONG_FILL
+       /* Fill in the Huffman decode table entries one 'unsigned long' at a
+        * time.  On 32-bit systems this is 2 entries per store, while on 64-bit
+        * systems this is 4 entries per store. */
+       stores_per_loop = (1 << (table_bits - codeword_len)) / entries_per_long;
+       for (; stores_per_loop != 0; codeword_len++, stores_per_loop >>= 1) {
+               unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
+               for (; sym_idx < end_sym_idx; sym_idx++) {
+
+                       /* Accessing the array of unsigned shorts as unsigned
+                        * longs would violate strict aliasing and would require
+                        * compiling the code with -fno-strict-aliasing to
+                        * guarantee correctness.  To work around this problem,
+                        * use the gcc 'may_alias' extension to define a special
+                        * unsigned long type that may alias any other in-memory
+                        * variable.  */
+                       typedef unsigned long __attribute__((may_alias)) aliased_long_t;
+
+                       u16 sym;
+                       aliased_long_t *p;
+                       aliased_long_t v;
+                       unsigned n;
+
+                       sym = sorted_syms[sym_idx];
+
+                       BUILD_BUG_ON(sizeof(aliased_long_t) != 4 &&
+                                    sizeof(aliased_long_t) != 8);
+
+                       v = sym;
+                       if (sizeof(aliased_long_t) >= 4)
+                               v |= v << 16;
+                       if (sizeof(aliased_long_t) >= 8) {
+                               /* This may produce a compiler warning if an
+                                * aliased_long_t is 32 bits, but this won't be
+                                * executed unless an aliased_long_t is at least
+                                * 64 bits anyway. */
+                               v |= v << 32;
+                       }
+
+                       p = (aliased_long_t *)decode_table_ptr;
+                       n = stores_per_loop;
+
+                       do {
+                               *p++ = v;
+                       } while (--n);
+                       decode_table_ptr = p;
+               }
+       }
+#endif /* USE_LONG_FILL */
+
+       /* Fill in the Huffman decode table entries one 16-bit integer at a
+        * time. */
+       stores_per_loop = (1 << (table_bits - codeword_len));
+       for (; stores_per_loop != 0; codeword_len++, stores_per_loop >>= 1) {
+               unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
+               for (; sym_idx < end_sym_idx; sym_idx++) {
+                       u16 sym;
+                       u16 *p;
+                       unsigned n;
+
+                       sym = sorted_syms[sym_idx];
+
+                       p = (u16*)decode_table_ptr;
+                       n = stores_per_loop;
+
+                       do {
+                               *p++ = sym;
+                       } while (--n);
+
+                       decode_table_ptr = p;
+               }
+       }
+
+       /* If we've filled in the entire table, we are done.  Otherwise, there
+        * are codes longer than table bits that we need to store in the
+        * tree-like structure at the end of the table rather than directly in
+        * the main decode table itself. */
+
+       decode_table_pos = (u16*)decode_table_ptr - decode_table;
+       if (decode_table_pos != table_num_entries) {
+               unsigned j;
+               unsigned next_free_tree_slot;
+               unsigned cur_codeword;
+
+               wimlib_assert2(decode_table_pos < table_num_entries);
+
+               /* Fill in the remaining entries, which correspond to codes
+                * longer than @table_bits.
+                *
+                * First, zero out the rest of the entries.  This is necessary
+                * so that the entries appear as "unallocated" in the next part.
+                * */
+               j = decode_table_pos;
+               do {
+                       decode_table[j] = 0;
+               } while (++j != table_num_entries);
+
+               /* Assert that 2**table_bits is at least num_syms.  If this
+                * wasn't the case, we wouldn't be able to distinguish pointer
+                * entries from symbol entries. */
+               wimlib_assert2(table_num_entries >= num_syms);
+
+
+               /* The tree nodes are allocated starting at decode_table[1 <<
+                * table_bits].  Remember that the full size of the table,
+                * including the extra space for the tree nodes, is actually
+                * 2**table_bits + 2 * num_syms slots, while table_num_entries
+                * is only 2**table_bits. */
+               next_free_tree_slot = table_num_entries;
+
+               /* The current Huffman codeword  */
+               cur_codeword = decode_table_pos << 1;
+
+               /* Go through every codeword of length greater than @table_bits,
+                * primarily in order of codeword length and secondarily in
+                * order of symbol. */
+               wimlib_assert2(codeword_len == table_bits + 1);
+               for (; codeword_len <= max_codeword_len; codeword_len++, cur_codeword <<= 1)
+               {
+                       unsigned end_sym_idx = sym_idx + len_counts[codeword_len];
+                       for (; sym_idx < end_sym_idx; sym_idx++, cur_codeword++) {
+                               unsigned sym = sorted_syms[sym_idx];
+                               unsigned extra_bits = codeword_len - table_bits;
+
+                               /* index of the current node; find it from the
+                                * prefix of the current Huffman codeword. */
+                               unsigned node_idx = cur_codeword >> extra_bits;
+                               wimlib_assert2(node_idx < table_num_entries);
+
+                               /* Go through each bit of the current Huffman
+                                * codeword beyond the prefix of length
+                                * @table_bits and walk the tree, allocating any
+                                * slots that have not yet been allocated. */
+                               do {
+
+                                       /* If the current tree node points to
+                                        * nowhere but we need to follow it,
+                                        * allocate a new node for it to point
+                                        * to. */
+                                       if (decode_table[node_idx] == 0) {
+                                               decode_table[node_idx] = next_free_tree_slot;
+                                               decode_table[next_free_tree_slot++] = 0;
+                                               decode_table[next_free_tree_slot++] = 0;
+                                               wimlib_assert2(next_free_tree_slot <=
+                                                              table_num_entries + 2 * num_syms);
+                                       }
+
+                                       /* Set node_idx to left child */
+                                       node_idx = decode_table[node_idx];
+
+                                       /* Is the next bit 0 or 1? If 0, go left
+                                        * (already done).  If 1, go right by
+                                        * incrementing node_idx. */
+                                       --extra_bits;
+                                       node_idx += (cur_codeword >> extra_bits) & 1;
+                               } while (extra_bits != 0);
+
+                               /* node_idx is now the index of the leaf entry
+                                * into which the actual symbol will go. */
+                               decode_table[node_idx] = sym;
+
+                               /* Note: cur_codeword is always incremented at
+                                * the end of this loop because this is how
+                                * canonical Huffman codes are generated (add 1
+                                * for each code, then left shift whenever the
+                                * code length increases) */
+                       }
+               }
+       }
+       return 0;
+}
+
+/* Reads a Huffman-encoded symbol from the bistream when the number of remaining
+ * bits is less than the maximum codeword length. */
+int
+read_huffsym_near_end_of_input(struct input_bitstream *istream,
+                              const u16 decode_table[],
+                              const u8 lens[],
+                              unsigned num_syms,
+                              unsigned table_bits,
+                              unsigned *n)
+{
+       unsigned bitsleft = istream->bitsleft;
+       unsigned key_size;
+       u16 sym;
+       u16 key_bits;
+
+       if (table_bits > bitsleft) {
+               key_size = bitsleft;
+               bitsleft = 0;
+               key_bits = bitstream_peek_bits(istream, key_size) <<
+                                               (table_bits - key_size);
+       } else {
+               key_size = table_bits;
+               bitsleft -= table_bits;
+               key_bits = bitstream_peek_bits(istream, table_bits);
+       }
+
+       sym = decode_table[key_bits];
+       if (sym >= num_syms) {
+               bitstream_remove_bits(istream, key_size);
+               do {
+                       if (bitsleft == 0)
+                               return -1;
+                       key_bits = sym + bitstream_peek_bits(istream, 1);
+                       bitstream_remove_bits(istream, 1);
+                       bitsleft--;
+               } while ((sym = decode_table[key_bits]) >= num_syms);
+       } else {
+               bitstream_remove_bits(istream, lens[sym]);
+       }
+       *n = sym;
+       return 0;
+}
diff --git a/src/integrity.c b/src/integrity.c

index 8e1df18911f9d1d641e675cc95d2058f2fad17cd..350b3a202fa9dd2082fa340d70bf20bbd18d17d1 100644 (file)
--- a/src/integrity.c
+++ b/src/integrity.c
@@ -366,8 +366,7 @@ write_integrity_table(WIMStruct *wim,
                                              0,
                                              &wim->hdr.integrity_table_reshdr,
                                              NULL,
-                                            0,
-                                            &wim->lzx_context);
+                                            0);
         FREE(new_table);
  out_free_old_table:
         FREE(old_table);
diff --git a/src/lookup_table.c b/src/lookup_table.c

index f54f0cc675e0de4dc3d4db1e06eaf5296b78a2ce..357d64387e995867e23b97057a29501567b39075 100644 (file)
--- a/src/lookup_table.c
+++ b/src/lookup_table.c
@@ -323,7 +323,6 @@ for_lookup_table_entry(struct wim_lookup_table *table,
                 hlist_for_each_entry_safe(lte, pos, tmp, &table->array[i],
                                           hash_list)
                 {
-                       wimlib_assert2(!(lte->resource_entry.flags & WIM_RESHDR_FLAG_METADATA));
                         ret = visitor(lte, arg);
                         if (ret)
                                 return ret;
@@ -869,8 +868,7 @@ write_wim_lookup_table_from_stream_list(struct list_head *stream_list,
                                         struct filedes *out_fd,
                                         u16 part_number,
                                         struct wim_reshdr *out_reshdr,
-                                       int write_resource_flags,
-                                       struct wimlib_lzx_context **comp_ctx)
+                                       int write_resource_flags)
  {
         size_t table_size;
         struct wim_lookup_table_entry *lte;
@@ -950,8 +948,7 @@ write_wim_lookup_table_from_stream_list(struct list_head *stream_list,
                                              0,
                                              out_reshdr,
                                              NULL,
-                                            write_resource_flags,
-                                            comp_ctx);
+                                            write_resource_flags);
         FREE(table_buf);
         DEBUG("ret=%d", ret);
         return ret;
diff --git a/src/lz77.c b/src/lz77.c

index 5729bd4ca52176c1b88e0ce84b3eb7cb71cdff56..b5495da74d1599cd59e12cc8ef65c495550eba55 100644 (file)
--- a/src/lz77.c
+++ b/src/lz77.c
@@ -30,7 +30,7 @@
  #  include <config.h>
  #endif
  
-#include "wimlib/compress.h"
+#include "wimlib/compress_common.h"
  #include "wimlib/util.h"
  
  #include <string.h>
diff --git a/src/lzms-compress.c b/src/lzms-compress.c

new file mode 100644 (file)

index 0000000..e5abf24
--- /dev/null
+++ b/src/lzms-compress.c
@@ -0,0 +1,129 @@
+/*
+ * lzms-compress.c
+ *
+ * A compressor for the LZMS compression format.
+ */
+
+/*
+ * Copyright (C) 2013 Eric Biggers
+ *
+ * This file is part of wimlib, a library for working with WIM files.
+ *
+ * wimlib is free software; you can redistribute it and/or modify it under the
+ * terms of the GNU General Public License as published by the Free
+ * Software Foundation; either version 3 of the License, or (at your option)
+ * any later version.
+ *
+ * wimlib is distributed in the hope that it will be useful, but WITHOUT ANY
+ * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
+ * A PARTICULAR PURPOSE. See the GNU General Public License for more
+ * details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with wimlib; if not, see http://www.gnu.org/licenses/.
+ */
+
+/* This a compressor for the LZMS compression format.  More details about this
+ * format can be found in lzms-decompress.c.  */
+
+#ifdef HAVE_CONFIG_H
+#  include "config.h"
+#endif
+
+#include "wimlib.h"
+#include "wimlib/assert.h"
+#include "wimlib/compressor_ops.h"
+#include "wimlib/compress_common.h"
+#include "wimlib/error.h"
+#include "wimlib/lzms.h"
+#include "wimlib/util.h"
+
+#include <string.h>
+
+struct lzms_compressor {
+       u8 *window;
+       u32 window_size;
+       u32 max_block_size;
+
+       s32 *last_target_usages;
+};
+
+static void
+lzms_preprocess_data(u8 *data, s32 size, s32 *last_target_usages)
+{
+       for (s32 i = 0; i < size - 11; i++) {
+       }
+}
+
+static size_t
+lzms_compress(const void *uncompressed_data, size_t uncompressed_size,
+             void *compressed_data, size_t compressed_size_avail, void *_ctx)
+{
+       struct lzms_compressor *ctx = _ctx;
+
+       if (uncompressed_size > ctx->max_block_size) {
+               LZMS_DEBUG("Can't compress %su bytes: LZMS context "
+                          "only supports %u bytes",
+                          uncompressed_size, ctx->max_block_size);
+               return 0;
+       }
+
+       memcpy(ctx->window, uncompressed_data, uncompressed_size);
+       ctx->window_size = uncompressed_size;
+
+       lzms_preprocess_data(ctx->window, ctx->window_size,
+                            ctx->last_target_usages);
+
+       return 0;
+}
+
+static void
+lzms_free_compressor(void *_ctx)
+{
+       struct lzms_compressor *ctx = _ctx;
+
+       if (ctx) {
+               FREE(ctx->window);
+               FREE(ctx->last_target_usages);
+               FREE(ctx);
+       }
+}
+
+static int
+lzms_create_compressor(size_t max_block_size,
+                      const struct wimlib_compressor_params_header *params,
+                      void **ctx_ret)
+{
+       struct lzms_compressor *ctx;
+
+       if (max_block_size == 0 || max_block_size > 1U << 26) {
+               LZMS_DEBUG("Invalid max_block_size (%u)", max_block_size);
+               return WIMLIB_ERR_INVALID_PARAM;
+       }
+
+       ctx = CALLOC(1, sizeof(struct lzms_compressor));
+       if (ctx == NULL)
+               goto oom;
+
+       ctx->window = MALLOC(max_block_size);
+       if (ctx->window == NULL)
+               goto oom;
+       ctx->max_block_size = max_block_size;
+
+       ctx->last_target_usages = MALLOC(65536 * sizeof(ctx->last_target_usages[0]));
+       if (ctx->last_target_usages == NULL)
+               goto oom;
+
+       *ctx_ret = ctx;
+       return 0;
+
+oom:
+       lzms_free_compressor(ctx);
+       return WIMLIB_ERR_NOMEM;
+}
+
+const struct compressor_ops lzms_compressor_ops = {
+       .create_compressor  = lzms_create_compressor,
+       .compress           = lzms_compress,
+       .free_compressor    = lzms_free_compressor,
+};
diff --git a/src/lzms-decompress.c b/src/lzms-decompress.c

index 186e88d0b9387827b78fafbf653cdedc572148ef..40d35bf6e2610e945a1034f19dc303e40ffa7d2b 100644 (file)
--- a/src/lzms-decompress.c
+++ b/src/lzms-decompress.c
@@ -193,8 +193,9 @@
  #endif
  
  #include "wimlib.h"
-#include "wimlib/compress.h"
-#include "wimlib/decompress.h"
+#include "wimlib/compress_common.h"
+#include "wimlib/decompressor_ops.h"
+#include "wimlib/decompress_common.h"
  #include "wimlib/error.h"
  #include "wimlib/lzms.h"
  #include "wimlib/util.h"
@@ -381,6 +382,9 @@ struct lzms_decompressor {
         u32 upcoming_lz_offset;
         u32 upcoming_delta_power;
         u32 upcoming_delta_offset;
+
+       /* Used for postprocessing  */
+       s32 last_target_usages[65536];
  };
  
  /* A table that maps position slots to their base values.  These are constants
@@ -1093,18 +1097,16 @@ lzms_init_decompressor(struct lzms_decompressor *ctx,
  /* Decode the series of literals and matches from the LZMS-compressed data.
   * Returns 0 on success; nonzero if the compressed data is invalid.  */
  static int
-lzms_decode_items(const u8 *cdata, size_t clen, u8 *ubuf, size_t ulen)
+lzms_decode_items(const u8 *cdata, size_t clen, u8 *ubuf, size_t ulen,
+                 struct lzms_decompressor *ctx)
  {
-       /* XXX: The context could be allocated on the heap.  */
-       struct lzms_decompressor ctx;
-
         /* Initialize the LZMS decompressor.  */
-       lzms_init_decompressor(&ctx, cdata, clen, ubuf, ulen);
+       lzms_init_decompressor(ctx, cdata, clen, ubuf, ulen);
  
         /* Decode the sequence of items.  */
-       while (ctx.out_next != ctx.out_end) {
-               LZMS_DEBUG("Position %u", ctx.out_next - ctx.out_begin);
-               if (lzms_decode_item(&ctx))
+       while (ctx->out_next != ctx->out_end) {
+               LZMS_DEBUG("Position %u", ctx->out_next - ctx->out_begin);
+               if (lzms_decode_item(ctx))
                         return -1;
         }
         return 0;
@@ -1216,17 +1218,15 @@ lzms_process_x86_translation(u8 *ubuf, s32 i, s32 *closest_target_usage_p,
   * actually needs to be done (or to plug in alternate filters, like in LZMA),
   * and the corresponding preprocessing seems to be done unconditionally.  */
  static void
-lzms_postprocess_data(u8 *ubuf, s32 ulen)
+lzms_postprocess_data(u8 *ubuf, s32 ulen, s32 *last_target_usages)
  {
         /* Offset (from beginning of buffer) of the most recent reference to a
          * seemingly valid target address.  */
         s32 closest_target_usage = -LZMS_X86_MAX_TRANSLATION_OFFSET - 1;
  
-       /* Offset (from beginning of buffer) of the most recently used target
-        * address beginning with two bytes equal to the array index.
-        *
-        * XXX: This array could be allocated on the heap.  */
-       s32 last_target_usages[65536];
+       /* Initialize the last_target_usages array.  Each entry will contain the
+        * offset (from beginning of buffer) of the most recently used target
+        * address beginning with two bytes equal to the array index.  */
         for (s32 i = 0; i < 65536; i++)
                 last_target_usages[i] = -LZMS_X86_MAX_GOOD_TARGET_OFFSET - 1;
  
@@ -1238,48 +1238,81 @@ lzms_postprocess_data(u8 *ubuf, s32 ulen)
                                                  last_target_usages);
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI int
-wimlib_lzms_decompress(const void *cdata, unsigned clen,
-                      void *ubuf, unsigned ulen)
+static int
+lzms_decompress(const void *compressed_data, size_t compressed_size,
+               void *uncompressed_data, size_t uncompressed_size, void *_ctx)
  {
+       struct lzms_decompressor *ctx = _ctx;
+
         /* The range decoder requires that a minimum of 4 bytes of compressed
          * data be initially available.  */
-       if (clen < 4) {
-               LZMS_DEBUG("Compressed length too small (got %u, expected >= 4)",
-                          clen);
+       if (compressed_size < 4) {
+               LZMS_DEBUG("Compressed size too small (got %zu, expected >= 4)",
+                          compressed_size);
                 return -1;
         }
  
         /* A LZMS-compressed data block should be evenly divisible into 16-bit
          * integers.  */
-       if (clen % 2 != 0) {
-               LZMS_DEBUG("Compressed length not divisible by 2 (got %u)", clen);
+       if (compressed_size % 2 != 0) {
+               LZMS_DEBUG("Compressed size not divisible by 2 (got %zu)",
+                          compressed_size);
                 return -1;
         }
  
         /* Handle the trivial case where nothing needs to be decompressed.
          * (Necessary because a window of size 0 does not have a valid position
          * slot.)  */
-       if (ulen == 0)
+       if (uncompressed_size == 0)
                 return 0;
  
         /* The x86 post-processor requires that the uncompressed length fit into
          * a signed 32-bit integer.  Also, the position slot table cannot be
          * searched for a position of INT32_MAX or greater.  */
-       if (ulen >= INT32_MAX) {
+       if (uncompressed_size >= INT32_MAX) {
                 LZMS_DEBUG("Uncompressed length too large "
                            "(got %u, expected < INT32_MAX)", ulen);
                 return -1;
         }
  
         /* Decode the literals and matches.  */
-       if (lzms_decode_items(cdata, clen, ubuf, ulen))
+       if (lzms_decode_items(compressed_data, compressed_size,
+                             uncompressed_data, uncompressed_size, ctx))
                 return -1;
  
         /* Postprocess the data.  */
-       lzms_postprocess_data(ubuf, ulen);
+       lzms_postprocess_data(uncompressed_data, uncompressed_size,
+                             ctx->last_target_usages);
  
         LZMS_DEBUG("Decompression successful.");
         return 0;
  }
+
+static void
+lzms_free_decompressor(void *_ctx)
+{
+       struct lzms_decompressor *ctx = _ctx;
+
+       FREE(ctx);
+}
+
+static int
+lzms_create_decompressor(size_t max_block_size,
+                        const struct wimlib_decompressor_params_header *params,
+                        void **ctx_ret)
+{
+       struct lzms_decompressor *ctx;
+
+       ctx = MALLOC(sizeof(struct lzms_decompressor));
+       if (ctx == NULL)
+               return WIMLIB_ERR_NOMEM;
+
+       *ctx_ret = ctx;
+       return 0;
+}
+
+const struct decompressor_ops lzms_decompressor_ops = {
+       .create_decompressor  = lzms_create_decompressor,
+       .decompress           = lzms_decompress,
+       .free_decompressor    = lzms_free_decompressor,
+};
diff --git a/src/lzx-common.c b/src/lzx-common.c

index 547059e7b93268c8cc9af73e635ada28ec5594fa..5f5228352381447c4a10c5d13998d71497b27134 100644 (file)
--- a/src/lzx-common.c
+++ b/src/lzx-common.c
@@ -66,11 +66,11 @@ const u8 lzx_extra_bits[LZX_MAX_POSITION_SLOTS] = {
  };
  #endif
  
-/* LZX window size can be between 2^15 and 2^21, inclusively.  */
+/* LZX window size must be a power of 2 between 2^15 and 2^21, inclusively.  */
  bool
-lzx_window_size_valid(u32 window_size)
+lzx_window_size_valid(size_t window_size)
  {
-       if (window_size == 0)
+       if (window_size == 0 || (u32)window_size != window_size)
                 return false;
         u32 order = bsr32(window_size);
         if (window_size != 1U << order)
diff --git a/src/lzx-compress.c b/src/lzx-compress.c

index c72fd460c84d47a4612fde0214499acad1d17f5c..e4676dca55612bdea066e30b4afdfc61cb7ddb14 100644 (file)
--- a/src/lzx-compress.c
+++ b/src/lzx-compress.c
@@ -189,7 +189,8 @@
  #endif
  
  #include "wimlib.h"
-#include "wimlib/compress.h"
+#include "wimlib/compressor_ops.h"
+#include "wimlib/compress_common.h"
  #include "wimlib/endianness.h"
  #include "wimlib/error.h"
  #include "wimlib/lzx.h"
@@ -199,7 +200,7 @@
  #include <string.h>
  
  #ifdef ENABLE_LZX_DEBUG
-#  include "wimlib/decompress.h"
+#  include "wimlib/decompress_common.h"
  #endif
  
  #include "divsufsort/divsufsort.h"
@@ -386,7 +387,7 @@ struct salink {
  struct lzx_compressor {
  
         /* The parameters that were used to create the compressor.  */
-       struct wimlib_lzx_params params;
+       struct wimlib_lzx_compressor_params params;
  
         /* The buffer of data to be compressed.
          *
@@ -2211,34 +2212,32 @@ do_call_insn_preprocessing(u8 data[], int size)
         }
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI unsigned
-wimlib_lzx_compress2(const void                        * const restrict uncompressed_data,
-                    unsigned                     const          uncompressed_len,
-                    void                       * const restrict compressed_data,
-                    struct wimlib_lzx_context  * const restrict lzx_ctx)
+static size_t
+lzx_compress(const void *uncompressed_data, size_t uncompressed_size,
+            void *compressed_data, size_t compressed_size_avail, void *_ctx)
  {
-       struct lzx_compressor *ctx = (struct lzx_compressor*)lzx_ctx;
+       struct lzx_compressor *ctx = _ctx;
         struct output_bitstream ostream;
-       input_idx_t compressed_len;
+       size_t compressed_size;
  
-       if (uncompressed_len < 100) {
+       if (uncompressed_size < 100) {
                 LZX_DEBUG("Too small to bother compressing.");
                 return 0;
         }
  
-       if (uncompressed_len > ctx->max_window_size) {
-               LZX_DEBUG("Can't compress %u bytes using window of %u bytes!",
-                         uncompressed_len, ctx->max_window_size);
+       if (uncompressed_size > ctx->max_window_size) {
+               LZX_DEBUG("Can't compress %zu bytes using window of %u bytes!",
+                         uncompressed_size, ctx->max_window_size);
                 return 0;
         }
  
-       LZX_DEBUG("Attempting to compress %u bytes...", uncompressed_len);
+       LZX_DEBUG("Attempting to compress %zu bytes...",
+                 uncompressed_size);
  
         /* The input data must be preprocessed.  To avoid changing the original
          * input, copy it to a temporary buffer.  */
-       memcpy(ctx->window, uncompressed_data, uncompressed_len);
-       ctx->window_size = uncompressed_len;
+       memcpy(ctx->window, uncompressed_data, uncompressed_size);
+       ctx->window_size = uncompressed_size;
  
         /* This line is unnecessary; it just avoids inconsequential accesses of
          * uninitialized memory that would show up in memory-checking tools such
@@ -2262,18 +2261,19 @@ wimlib_lzx_compress2(const void                 * const restrict uncompressed_data,
         LZX_DEBUG("Writing compressed blocks...");
  
         /* Generate the compressed data.  */
-       init_output_bitstream(&ostream, compressed_data, ctx->window_size - 1);
+       init_output_bitstream(&ostream, compressed_data, compressed_size_avail);
         lzx_write_all_blocks(ctx, &ostream);
  
         LZX_DEBUG("Flushing bitstream...");
-       compressed_len = flush_output_bitstream(&ostream);
-       if (compressed_len == ~(input_idx_t)0) {
-               LZX_DEBUG("Data did not compress to less than original length!");
+       compressed_size = flush_output_bitstream(&ostream);
+       if (compressed_size == ~(input_idx_t)0) {
+               LZX_DEBUG("Data did not compress to %zu bytes or less!",
+                         compressed_size_avail);
                 return 0;
         }
  
-       LZX_DEBUG("Done: compressed %u => %u bytes.",
-                 uncompressed_len, compressed_len);
+       LZX_DEBUG("Done: compressed %zu => %zu bytes.",
+                 uncompressed_size, compressed_size);
  
         /* Verify that we really get the same thing back when decompressing.
          * Although this could be disabled by default in all cases, it only
@@ -2285,44 +2285,46 @@ wimlib_lzx_compress2(const void                 * const restrict uncompressed_data,
         #endif
             )
         {
-               /* The decompression buffer can be any temporary space that's no
-                * longer needed.  */
-               u8 *buf = (u8*)(ctx->SA ? ctx->SA : ctx->prev_tab);
+               struct wimlib_decompressor *decompressor;
  
-               if (wimlib_lzx_decompress2(compressed_data, compressed_len,
-                                          buf, uncompressed_len, ctx->max_window_size))
+               if (0 == wimlib_create_decompressor(WIMLIB_COMPRESSION_TYPE_LZX,
+                                                   ctx->max_window_size,
+                                                   NULL,
+                                                   &decompressor))
                 {
-                       ERROR("Failed to decompress data we "
-                             "compressed using LZX algorithm");
-                       wimlib_assert(0);
-                       return 0;
-               }
-
-               if (memcmp(uncompressed_data, buf, uncompressed_len)) {
-                       ERROR("Data we compressed using LZX algorithm "
-                             "didn't decompress to original");
-                       wimlib_assert(0);
-                       return 0;
+                       int ret;
+                       ret = wimlib_decompress(compressed_data,
+                                               compressed_size,
+                                               ctx->window,
+                                               uncompressed_size,
+                                               decompressor);
+                       wimlib_free_decompressor(decompressor);
+
+                       if (ret) {
+                               ERROR("Failed to decompress data we "
+                                     "compressed using LZX algorithm");
+                               wimlib_assert(0);
+                               return 0;
+                       }
+                       if (memcmp(uncompressed_data, ctx->window, uncompressed_size)) {
+                               ERROR("Data we compressed using LZX algorithm "
+                                     "didn't decompress to original");
+                               wimlib_assert(0);
+                               return 0;
+                       }
+               } else {
+                       WARNING("Failed to create decompressor for "
+                               "data verification!");
                 }
         }
-       return compressed_len;
-}
-
-static bool
-lzx_params_compatible(const struct wimlib_lzx_params *oldparams,
-                     const struct wimlib_lzx_params *newparams)
-{
-       return 0 == memcmp(oldparams, newparams, sizeof(struct wimlib_lzx_params));
+       return compressed_size;
  }
  
-static struct wimlib_lzx_params lzx_user_default_params;
-static struct wimlib_lzx_params *lzx_user_default_params_ptr;
-
  static bool
-lzx_params_valid(const struct wimlib_lzx_params *params)
+lzx_params_valid(const struct wimlib_lzx_compressor_params *params)
  {
         /* Validate parameters.  */
-       if (params->size_of_this != sizeof(struct wimlib_lzx_params)) {
+       if (params->hdr.size != sizeof(struct wimlib_lzx_compressor_params)) {
                 LZX_DEBUG("Invalid parameter structure size!");
                 return false;
         }
@@ -2365,37 +2367,42 @@ lzx_params_valid(const struct wimlib_lzx_params *params)
         return true;
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI int
-wimlib_lzx_set_default_params(const struct wimlib_lzx_params * params)
+static void
+lzx_free_compressor(void *_ctx)
  {
-       if (params) {
-               if (!lzx_params_valid(params))
-                       return WIMLIB_ERR_INVALID_PARAM;
-               lzx_user_default_params = *params;
-               lzx_user_default_params_ptr = &lzx_user_default_params;
-       } else {
-               lzx_user_default_params_ptr = NULL;
+       struct lzx_compressor *ctx = _ctx;
+
+       if (ctx) {
+               FREE(ctx->chosen_matches);
+               FREE(ctx->cached_matches);
+               FREE(ctx->optimum);
+               FREE(ctx->salink);
+               FREE(ctx->SA);
+               FREE(ctx->block_specs);
+               FREE(ctx->prev_tab);
+               FREE(ctx->window);
+               FREE(ctx);
         }
-       return 0;
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI int
-wimlib_lzx_alloc_context(u32 window_size,
-                        const struct wimlib_lzx_params *params,
-                        struct wimlib_lzx_context **ctx_pp)
+static int
+lzx_create_compressor(size_t window_size,
+                     const struct wimlib_compressor_params_header *_params,
+                     void **ctx_ret)
  {
+       const struct wimlib_lzx_compressor_params *params =
+               (const struct wimlib_lzx_compressor_params*)_params;
+       struct lzx_compressor *ctx;
  
         LZX_DEBUG("Allocating LZX context...");
  
         if (!lzx_window_size_valid(window_size))
                 return WIMLIB_ERR_INVALID_PARAM;
  
-       struct lzx_compressor *ctx;
-
-       static const struct wimlib_lzx_params fast_default = {
-               .size_of_this = sizeof(struct wimlib_lzx_params),
+       static const struct wimlib_lzx_compressor_params fast_default = {
+               .hdr = {
+                       .size = sizeof(struct wimlib_lzx_compressor_params),
+               },
                 .algorithm = WIMLIB_LZX_ALGORITHM_FAST,
                 .use_defaults = 0,
                 .alg_params = {
@@ -2403,8 +2410,10 @@ wimlib_lzx_alloc_context(u32 window_size,
                         },
                 },
         };
-       static const struct wimlib_lzx_params slow_default = {
-               .size_of_this = sizeof(struct wimlib_lzx_params),
+       static const struct wimlib_lzx_compressor_params slow_default = {
+               .hdr = {
+                       .size = sizeof(struct wimlib_lzx_compressor_params),
+               },
                 .algorithm = WIMLIB_LZX_ALGORITHM_SLOW,
                 .use_defaults = 0,
                 .alg_params = {
@@ -2426,10 +2435,7 @@ wimlib_lzx_alloc_context(u32 window_size,
                         return WIMLIB_ERR_INVALID_PARAM;
         } else {
                 LZX_DEBUG("Using default algorithm and parameters.");
-               if (lzx_user_default_params_ptr)
-                       params = lzx_user_default_params_ptr;
-               else
-                       params = &slow_default;
+               params = &slow_default;
         }
  
         if (params->use_defaults) {
@@ -2439,58 +2445,46 @@ wimlib_lzx_alloc_context(u32 window_size,
                         params = &fast_default;
         }
  
-       if (ctx_pp) {
-               ctx = *(struct lzx_compressor**)ctx_pp;
-
-               if (ctx &&
-                   lzx_params_compatible(&ctx->params, params) &&
-                   ctx->max_window_size == window_size)
-                       return 0;
-       } else {
-               LZX_DEBUG("Check parameters only.");
-               return 0;
-       }
-
         LZX_DEBUG("Allocating memory.");
  
         ctx = CALLOC(1, sizeof(struct lzx_compressor));
         if (ctx == NULL)
-               goto err;
+               goto oom;
  
         ctx->num_main_syms = lzx_get_num_main_syms(window_size);
         ctx->max_window_size = window_size;
         ctx->window = MALLOC(window_size + 12);
         if (ctx->window == NULL)
-               goto err;
+               goto oom;
  
         if (params->algorithm == WIMLIB_LZX_ALGORITHM_FAST) {
                 ctx->prev_tab = MALLOC(window_size * sizeof(ctx->prev_tab[0]));
                 if (ctx->prev_tab == NULL)
-                       goto err;
+                       goto oom;
         }
  
         size_t block_specs_length = DIV_ROUND_UP(window_size, LZX_DIV_BLOCK_SIZE);
         ctx->block_specs = MALLOC(block_specs_length * sizeof(ctx->block_specs[0]));
         if (ctx->block_specs == NULL)
-               goto err;
+               goto oom;
  
         if (params->algorithm == WIMLIB_LZX_ALGORITHM_SLOW) {
                 ctx->SA = MALLOC(3U * window_size * sizeof(ctx->SA[0]));
                 if (ctx->SA == NULL)
-                       goto err;
+                       goto oom;
                 ctx->ISA = ctx->SA + window_size;
                 ctx->LCP = ctx->ISA + window_size;
  
                 ctx->salink = MALLOC(window_size * sizeof(ctx->salink[0]));
                 if (ctx->salink == NULL)
-                       goto err;
+                       goto oom;
         }
  
         if (params->algorithm == WIMLIB_LZX_ALGORITHM_SLOW) {
                 ctx->optimum = MALLOC((LZX_OPTIM_ARRAY_SIZE + LZX_MAX_MATCH_LEN) *
                                        sizeof(ctx->optimum[0]));
                 if (ctx->optimum == NULL)
-                       goto err;
+                       goto oom;
         }
  
         if (params->algorithm == WIMLIB_LZX_ALGORITHM_SLOW) {
@@ -2503,71 +2497,28 @@ wimlib_lzx_alloc_context(u32 window_size,
                 ctx->cached_matches = MALLOC(window_size * (cache_per_pos + 1) *
                                              sizeof(ctx->cached_matches[0]));
                 if (ctx->cached_matches == NULL)
-                       goto err;
+                       goto oom;
         }
  
         ctx->chosen_matches = MALLOC(window_size * sizeof(ctx->chosen_matches[0]));
         if (ctx->chosen_matches == NULL)
-               goto err;
+               goto oom;
  
-       memcpy(&ctx->params, params, sizeof(struct wimlib_lzx_params));
+       memcpy(&ctx->params, params, sizeof(struct wimlib_lzx_compressor_params));
         memset(&ctx->zero_codes, 0, sizeof(ctx->zero_codes));
  
         LZX_DEBUG("Successfully allocated new LZX context.");
  
-       wimlib_lzx_free_context(*ctx_pp);
-       *ctx_pp = (struct wimlib_lzx_context*)ctx;
+       *ctx_ret = ctx;
         return 0;
  
-err:
-       wimlib_lzx_free_context((struct wimlib_lzx_context*)ctx);
-       LZX_DEBUG("Ran out of memory.");
+oom:
+       lzx_free_compressor(ctx);
         return WIMLIB_ERR_NOMEM;
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI void
-wimlib_lzx_free_context(struct wimlib_lzx_context *_ctx)
-{
-       struct lzx_compressor *ctx = (struct lzx_compressor*)_ctx;
-
-       if (ctx) {
-               FREE(ctx->chosen_matches);
-               FREE(ctx->cached_matches);
-               FREE(ctx->optimum);
-               FREE(ctx->salink);
-               FREE(ctx->SA);
-               FREE(ctx->block_specs);
-               FREE(ctx->prev_tab);
-               FREE(ctx->window);
-               FREE(ctx);
-       }
-}
-
-/* API function documented in wimlib.h  */
-WIMLIBAPI unsigned
-wimlib_lzx_compress(const void * const restrict uncompressed_data,
-                   unsigned     const          uncompressed_len,
-                   void       * const restrict compressed_data)
-{
-       int ret;
-       struct wimlib_lzx_context *ctx = NULL;
-       unsigned compressed_len;
-
-       ret = wimlib_lzx_alloc_context(32768, NULL, &ctx);
-       if (ret) {
-               wimlib_assert(ret != WIMLIB_ERR_INVALID_PARAM);
-               WARNING("Couldn't allocate LZX compression context: %"TS"",
-                       wimlib_get_error_string(ret));
-               return 0;
-       }
-
-       compressed_len = wimlib_lzx_compress2(uncompressed_data,
-                                             uncompressed_len,
-                                             compressed_data,
-                                             ctx);
-
-       wimlib_lzx_free_context(ctx);
-
-       return compressed_len;
-}
+const struct compressor_ops lzx_compressor_ops = {
+       .create_compressor  = lzx_create_compressor,
+       .compress           = lzx_compress,
+       .free_compressor    = lzx_free_compressor,
+};
diff --git a/src/lzx-decompress.c b/src/lzx-decompress.c

index b7872520890135d8eee0db082746469e715122ba..2405b9493ad9710f0476af9e2745fe8c59490b2f 100644 (file)
--- a/src/lzx-decompress.c
+++ b/src/lzx-decompress.c
@@ -108,7 +108,8 @@
  #endif
  
  #include "wimlib.h"
-#include "wimlib/decompress.h"
+#include "wimlib/decompressor_ops.h"
+#include "wimlib/decompress_common.h"
  #include "wimlib/lzx.h"
  #include "wimlib/util.h"
  
@@ -135,6 +136,11 @@ struct lzx_tables {
         u8 alignedtree_lens[LZX_ALIGNEDCODE_NUM_SYMBOLS];
  } _aligned_attribute(DECODE_TABLE_ALIGNMENT);
  
+struct lzx_decompressor {
+       u32 max_window_size;
+       unsigned num_main_syms;
+       struct lzx_tables tables;
+};
  
  /*
   * Reads a Huffman-encoded symbol using the pre-tree.
@@ -705,7 +711,7 @@ lzx_decode_match(unsigned main_element, int block_type,
  }
  
  static void
-undo_call_insn_translation(u32 *call_insn_target, int input_pos,
+undo_call_insn_translation(u32 *call_insn_target, s32 input_pos,
                            s32 file_size)
  {
         s32 abs_offset;
@@ -747,9 +753,9 @@ undo_call_insn_translation(u32 *call_insn_target, int input_pos,
   * as it is used in calculating the translated jump targets.  But in WIM files,
   * this file size is always the same (LZX_WIM_MAGIC_FILESIZE == 12000000).*/
  static void
-undo_call_insn_preprocessing(u8 uncompressed_data[], int uncompressed_data_len)
+undo_call_insn_preprocessing(u8 *uncompressed_data, s32 uncompressed_size)
  {
-       for (int i = 0; i < uncompressed_data_len - 10; i++) {
+       for (s32 i = 0; i < uncompressed_size - 10; i++) {
                 if (uncompressed_data[i] == 0xe8) {
                         undo_call_insn_translation((u32*)&uncompressed_data[i + 1],
                                                    i,
@@ -818,47 +824,38 @@ lzx_decompress_block(int block_type, unsigned block_size,
         return 0;
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI int
-wimlib_lzx_decompress2(const void *compressed_data, unsigned compressed_len,
-                      void *uncompressed_data, unsigned uncompressed_len,
-                      u32 max_window_size)
+static int
+lzx_decompress(const void *compressed_data, size_t compressed_size,
+              void *uncompressed_data, size_t uncompressed_size,
+              void *_ctx)
  {
-       struct lzx_tables tables;
+       struct lzx_decompressor *ctx = _ctx;
         struct input_bitstream istream;
         struct lzx_lru_queue queue;
         unsigned window_pos;
         unsigned block_size;
         unsigned block_type;
-       unsigned num_main_syms;
         int ret;
         bool e8_preprocessing_done;
  
-       LZX_DEBUG("compressed_data = %p, compressed_len = %u, "
-                 "uncompressed_data = %p, uncompressed_len = %u, "
+       LZX_DEBUG("compressed_data = %p, compressed_size = %zu, "
+                 "uncompressed_data = %p, uncompressed_size = %zu, "
                   "max_window_size=%u).",
-                 compressed_data, compressed_len,
-                 uncompressed_data, uncompressed_len, max_window_size);
+                 compressed_data, compressed_size,
+                 uncompressed_data, uncompressed_size,
+                 ctx->max_window_size);
  
-       if (!lzx_window_size_valid(max_window_size)) {
-               LZX_DEBUG("Window size of %u is invalid!",
-                         max_window_size);
-               return -1;
-       }
-
-       num_main_syms = lzx_get_num_main_syms(max_window_size);
-
-       if (uncompressed_len > max_window_size) {
-               LZX_DEBUG("Uncompressed chunk size of %u exceeds "
+       if (uncompressed_size > ctx->max_window_size) {
+               LZX_DEBUG("Uncompressed size of %zu exceeds "
                           "window size of %u!",
-                         uncompressed_len, max_window_size);
+                         uncompressed_size, ctx->max_window_size);
                 return -1;
         }
  
-       memset(tables.maintree_lens, 0, sizeof(tables.maintree_lens));
-       memset(tables.lentree_lens, 0, sizeof(tables.lentree_lens));
+       memset(ctx->tables.maintree_lens, 0, sizeof(ctx->tables.maintree_lens));
+       memset(ctx->tables.lentree_lens, 0, sizeof(ctx->tables.lentree_lens));
         lzx_lru_queue_init(&queue);
-       init_input_bitstream(&istream, compressed_data, compressed_len);
+       init_input_bitstream(&istream, compressed_data, compressed_size);
  
         e8_preprocessing_done = false; /* Set to true if there may be 0xe8 bytes
                                           in the uncompressed data. */
@@ -869,23 +866,23 @@ wimlib_lzx_decompress2(const void *compressed_data, unsigned compressed_len,
          * blocks.  */
  
         for (window_pos = 0;
-            window_pos < uncompressed_len;
+            window_pos < uncompressed_size;
              window_pos += block_size)
         {
                 LZX_DEBUG("Reading block header.");
-               ret = lzx_read_block_header(&istream, num_main_syms,
-                                           max_window_size, &block_size,
-                                           &block_type, &tables, &queue);
+               ret = lzx_read_block_header(&istream, ctx->num_main_syms,
+                                           ctx->max_window_size, &block_size,
+                                           &block_type, &ctx->tables, &queue);
                 if (ret)
                         return ret;
  
                 LZX_DEBUG("block_size = %u, window_pos = %u",
                           block_size, window_pos);
  
-               if (block_size > uncompressed_len - window_pos) {
+               if (block_size > uncompressed_size - window_pos) {
                         LZX_DEBUG("Expected a block size of at "
-                                 "most %u bytes (found %u bytes)",
-                                 uncompressed_len - window_pos, block_size);
+                                 "most %zu bytes (found %u bytes)",
+                                 uncompressed_size - window_pos, block_size);
                         return -1;
                 }
  
@@ -898,16 +895,16 @@ wimlib_lzx_decompress2(const void *compressed_data, unsigned compressed_len,
                                 LZX_DEBUG("LZX_BLOCKTYPE_ALIGNED");
                         ret = lzx_decompress_block(block_type,
                                                    block_size,
-                                                  num_main_syms,
+                                                  ctx->num_main_syms,
                                                    uncompressed_data,
                                                    window_pos,
-                                                  &tables,
+                                                  &ctx->tables,
                                                    &queue,
                                                    &istream);
                         if (ret)
                                 return ret;
  
-                       if (tables.maintree_lens[0xe8] != 0)
+                       if (ctx->tables.maintree_lens[0xe8] != 0)
                                 e8_preprocessing_done = true;
                         break;
                 case LZX_BLOCKTYPE_UNCOMPRESSED:
@@ -934,16 +931,41 @@ wimlib_lzx_decompress2(const void *compressed_data, unsigned compressed_len,
                 }
         }
         if (e8_preprocessing_done)
-               undo_call_insn_preprocessing(uncompressed_data, uncompressed_len);
+               undo_call_insn_preprocessing(uncompressed_data, uncompressed_size);
         return 0;
  }
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI int
-wimlib_lzx_decompress(const void *compressed_data, unsigned compressed_len,
-                     void *uncompressed_data, unsigned uncompressed_len)
+static void
+lzx_free_decompressor(void *_ctx)
  {
-       return wimlib_lzx_decompress2(compressed_data, compressed_len,
-                                     uncompressed_data, uncompressed_len,
-                                     32768);
+       struct lzx_decompressor *ctx = _ctx;
+
+       FREE(ctx);
  }
+
+static int
+lzx_create_decompressor(size_t max_window_size,
+                       const struct wimlib_decompressor_params_header *params,
+                       void **ctx_ret)
+{
+       struct lzx_decompressor *ctx;
+
+       if (!lzx_window_size_valid(max_window_size))
+               return WIMLIB_ERR_INVALID_PARAM;
+
+       ctx = MALLOC(sizeof(struct lzx_decompressor));
+       if (ctx == NULL)
+               return WIMLIB_ERR_NOMEM;
+
+       ctx->max_window_size = max_window_size;
+       ctx->num_main_syms = lzx_get_num_main_syms(max_window_size);
+
+       *ctx_ret = ctx;
+       return 0;
+}
+
+const struct decompressor_ops lzx_decompressor_ops = {
+       .create_decompressor = lzx_create_decompressor,
+       .decompress          = lzx_decompress,
+       .free_decompressor   = lzx_free_decompressor,
+};
diff --git a/src/metadata_resource.c b/src/metadata_resource.c

index aebc5468cd0b30a24c6c8bc72a2bc70aab04916f..2d780e96d82f25f9fa59b885db7d308527f8fe51 100644 (file)
--- a/src/metadata_resource.c
+++ b/src/metadata_resource.c
@@ -297,8 +297,7 @@ write_metadata_resource(WIMStruct *wim, int image, int write_resource_flags)
                                              wim->out_chunk_size,
                                              &imd->metadata_lte->out_reshdr,
                                              imd->metadata_lte->hash,
-                                            write_resource_flags,
-                                            &wim->lzx_context);
+                                            write_resource_flags);
  
         /* Original checksum was overridden; set a flag so it isn't used.  */
         imd->metadata_lte->dont_check_metadata_hash = 1;
diff --git a/src/resource.c b/src/resource.c

index ff46114d7acc6b5f0bb457a2795dde65bf96ea22..1a46e751184377863f53f7b11582db44e6662d00 100644 (file)
--- a/src/resource.c
+++ b/src/resource.c
@@ -90,29 +90,6 @@
   */
  
  
-/* Decompress the specified chunk that uses the specified compression type
- * @ctype, part of a WIM with default chunk size @wim_chunk_size.  For LZX the
- * separate @wim_chunk_size is needed because it determines the window size used
- * for LZX compression.  */
-static int
-decompress(const void *cchunk, unsigned clen, void *uchunk, unsigned ulen,
-          int ctype, u32 wim_chunk_size)
-{
-       switch (ctype) {
-       case WIMLIB_COMPRESSION_TYPE_LZX:
-               return wimlib_lzx_decompress2(cchunk, clen,
-                                             uchunk, ulen, wim_chunk_size);
-       case WIMLIB_COMPRESSION_TYPE_XPRESS:
-               return wimlib_xpress_decompress(cchunk, clen,
-                                               uchunk, ulen);
-       case WIMLIB_COMPRESSION_TYPE_LZMS:
-               return wimlib_lzms_decompress(cchunk, clen, uchunk, ulen);
-       default:
-               ERROR("Invalid compression format (%d)", ctype);
-               return -1;
-       }
-}
-
  struct data_range {
         u64 offset;
         u64 size;
@@ -164,6 +141,7 @@ read_compressed_wim_resource(const struct wim_resource_spec * const rspec,
         bool chunk_offsets_malloced = false;
         bool ubuf_malloced = false;
         bool cbuf_malloced = false;
+       struct wimlib_decompressor *decompressor;
  
         /* Sanity checks  */
         wimlib_assert(rspec != NULL);
@@ -232,6 +210,21 @@ read_compressed_wim_resource(const struct wim_resource_spec * const rspec,
                 goto out_free_memory;
         }
  
+       /* Get valid decompressor.  */
+       if (ctype == rspec->wim->decompressor_ctype &&
+           chunk_size == rspec->wim->decompressor_max_block_size)
+       {
+               /* Cached decompressor.  */
+               decompressor = rspec->wim->decompressor;
+               rspec->wim->decompressor_ctype = WIMLIB_COMPRESSION_TYPE_NONE;
+               rspec->wim->decompressor = NULL;
+       } else {
+               ret = wimlib_create_decompressor(ctype, chunk_size, NULL,
+                                                &decompressor);
+               if (ret)
+                       goto out_free_memory;
+       }
+
         const u32 chunk_order = bsr32(chunk_size);
  
         /* Calculate the total number of chunks the resource is divided into.  */
@@ -450,7 +443,7 @@ read_compressed_wim_resource(const struct wim_resource_spec * const rspec,
                         ERROR("Invalid chunk size in compressed resource!");
                         errno = EINVAL;
                         ret = WIMLIB_ERR_DECOMPRESSION;
-                       goto out_free_memory;
+                       goto out_save_decompressor;
                 }
                 if (rspec->is_pipable)
                         cur_read_offset += sizeof(struct pwm_chunk_hdr);
@@ -494,17 +487,16 @@ read_compressed_wim_resource(const struct wim_resource_spec * const rspec,
                                 DEBUG("Decompressing chunk %"PRIu64" "
                                       "(csize=%"PRIu32" usize=%"PRIu32")",
                                       i, chunk_csize, chunk_usize);
-                               ret = decompress(cbuf,
-                                                chunk_csize,
-                                                ubuf,
-                                                chunk_usize,
-                                                ctype,
-                                                chunk_size);
+                               ret = wimlib_decompress(cbuf,
+                                                       chunk_csize,
+                                                       ubuf,
+                                                       chunk_usize,
+                                                       decompressor);
                                 if (ret) {
                                         ERROR("Failed to decompress data!");
                                         ret = WIMLIB_ERR_DECOMPRESSION;
                                         errno = EINVAL;
-                                       goto out_free_memory;
+                                       goto out_save_decompressor;
                                 }
                         }
                         cur_read_offset += chunk_csize;
@@ -525,7 +517,7 @@ read_compressed_wim_resource(const struct wim_resource_spec * const rspec,
                                 ret = (*cb)(&ubuf[start], size, cb_ctx);
  
                                 if (ret)
-                                       goto out_free_memory;
+                                       goto out_save_decompressor;
  
                                 cur_range_pos += size;
                                 if (cur_range_pos == cur_range_end) {
@@ -556,6 +548,11 @@ read_compressed_wim_resource(const struct wim_resource_spec * const rspec,
                         goto read_error;
         }
         ret = 0;
+out_save_decompressor:
+       wimlib_free_decompressor(rspec->wim->decompressor);
+       rspec->wim->decompressor = decompressor;
+       rspec->wim->decompressor_ctype = ctype;
+       rspec->wim->decompressor_max_block_size = chunk_size;
  out_free_memory:
         errno_save = errno;
         if (chunk_offsets_malloced)
diff --git a/src/wim.c b/src/wim.c

index 97e156ddd40d23616a9bfca2e59cd4dd8961bdb7..d833ec75b53cd66dc16055e21604497636fd4609 100644 (file)
--- a/src/wim.c
+++ b/src/wim.c
@@ -38,6 +38,8 @@
  #include "wimlib/security.h"
  #include "wimlib/wim.h"
  #include "wimlib/xml.h"
+#include "wimlib/compressor_ops.h"
+#include "wimlib/decompressor_ops.h"
  
  #ifdef __WIN32__
  #  include "wimlib/win32.h" /* for realpath() replacement */
@@ -937,10 +939,10 @@ wimlib_free(WIMStruct *wim)
         if (filedes_valid(&wim->out_fd))
                 filedes_close(&wim->out_fd);
  
-       wimlib_lzx_free_context(wim->lzx_context);
-
         free_lookup_table(wim->lookup_table);
  
+       wimlib_free_decompressor(wim->decompressor);
+
         FREE(wim->filename);
         free_wim_info(wim->wim_info);
         if (wim->image_metadata) {
@@ -1003,4 +1005,6 @@ wimlib_global_cleanup(void)
  #ifdef __WIN32__
         win32_global_cleanup();
  #endif
+       cleanup_decompressor_params();
+       cleanup_compressor_params();
  }
diff --git a/src/write.c b/src/write.c

index 7c39971fec0e9543c26023724b4ac3c54ba6abb3..e495cb5b29721c21aa7a1526b0d8d604453348f5 100644 (file)
--- a/src/write.c
+++ b/src/write.c
@@ -34,7 +34,7 @@
  #  include <sys/file.h>
  #endif
  
-#include "wimlib/compress_chunks.h"
+#include "wimlib/chunk_compressor.h"
  #include "wimlib/endianness.h"
  #include "wimlib/error.h"
  #include "wimlib/file_io.h"
@@ -1199,11 +1199,6 @@ remove_zero_length_streams(struct list_head *stream_list)
   *     no streams are hard-filtered or no streams are unhashed, this parameter
   *     can be NULL.
   *
- * @comp_ctx
- *     A location in which to allocate the pointer to the default LZX
- *     compression context.  This will only be used if @out_ctype is
- *     WIMLIB_COMPRESSION_TYPE_LZX.
- *
   * @progress_func
   *     If non-NULL, a progress function that will be called periodically with
   *     WIMLIB_PROGRESS_MSG_WRITE_STREAMS messages.  Note that on-the-fly
@@ -1268,7 +1263,6 @@ write_stream_list(struct list_head *stream_list,
                   unsigned num_threads,
                   struct wim_lookup_table *lookup_table,
                   struct filter_context *filter_ctx,
-                 struct wimlib_lzx_context **comp_ctx,
                   wimlib_progress_func_t progress_func)
  {
         int ret;
@@ -1367,15 +1361,8 @@ write_stream_list(struct list_head *stream_list,
                 }
  
                 if (ctx.compressor == NULL) {
-                       if (out_ctype == WIMLIB_COMPRESSION_TYPE_LZX) {
-                               ret = wimlib_lzx_alloc_context(out_chunk_size,
-                                                              NULL,
-                                                              comp_ctx);
-                               if (ret)
-                                       goto out_destroy_context;
-                       }
                         ret = new_serial_chunk_compressor(out_ctype, out_chunk_size,
-                                                         *comp_ctx, &ctx.compressor);
+                                                         &ctx.compressor);
                         if (ret)
                                 goto out_destroy_context;
                 }
@@ -1478,8 +1465,7 @@ write_wim_resource(struct wim_lookup_table_entry *lte,
                    struct filedes *out_fd,
                    int out_ctype,
                    u32 out_chunk_size,
-                  int write_resource_flags,
-                  struct wimlib_lzx_context **comp_ctx)
+                  int write_resource_flags)
  {
         LIST_HEAD(stream_list);
         list_add(&lte->write_streams_list, &stream_list);
@@ -1492,7 +1478,6 @@ write_wim_resource(struct wim_lookup_table_entry *lte,
                                  1,
                                  NULL,
                                  NULL,
-                                comp_ctx,
                                  NULL);
  }
  
@@ -1503,8 +1488,7 @@ write_wim_resource_from_buffer(const void *buf, size_t buf_size,
                                u32 out_chunk_size,
                                struct wim_reshdr *out_reshdr,
                                u8 *hash,
-                              int write_resource_flags,
-                              struct wimlib_lzx_context **comp_ctx)
+                              int write_resource_flags)
  {
         int ret;
         struct wim_lookup_table_entry *lte;
@@ -1529,7 +1513,7 @@ write_wim_resource_from_buffer(const void *buf, size_t buf_size,
         }
  
         ret = write_wim_resource(lte, out_fd, out_ctype, out_chunk_size,
-                                write_resource_flags, comp_ctx);
+                                write_resource_flags);
         if (ret)
                 goto out_free_lte;
  
@@ -1936,7 +1920,6 @@ write_wim_streams(WIMStruct *wim, int image, int write_flags,
                                  num_threads,
                                  wim->lookup_table,
                                  filter_ctx,
-                                &wim->lzx_context,
                                  progress_func);
  }
  
@@ -1996,8 +1979,7 @@ write_wim_metadata_resources(WIMStruct *wim, int image, int write_flags,
                                                  &wim->out_fd,
                                                  wim->out_compression_type,
                                                  wim->out_chunk_size,
-                                                write_resource_flags,
-                                                &wim->lzx_context);
+                                                write_resource_flags);
                 }
                 if (ret)
                         return ret;
@@ -2117,8 +2099,7 @@ write_wim_lookup_table(WIMStruct *wim, int image, int write_flags,
                                                        &wim->out_fd,
                                                        wim->hdr.part_number,
                                                        out_reshdr,
-                                                      write_flags_to_resource_flags(write_flags),
-                                                      &wim->lzx_context);
+                                                      write_flags_to_resource_flags(write_flags));
  }
  
  /*
@@ -2991,7 +2972,6 @@ overwrite_wim_inplace(WIMStruct *wim, int write_flags,
                                 num_threads,
                                 wim->lookup_table,
                                 &filter_ctx,
-                               &wim->lzx_context,
                                 progress_func);
         if (ret)
                 goto out_truncate;
diff --git a/src/xml.c b/src/xml.c

index 8179ebce7ec0f9998c2333c3136475b9cfe399a9..542fc3791b7d1ce8c4ddfe0bc3c482046a995d8e 100644 (file)
--- a/src/xml.c
+++ b/src/xml.c
@@ -1521,8 +1521,7 @@ write_wim_xml_data(WIMStruct *wim, int image, u64 total_bytes,
                                              0,
                                              out_reshdr,
                                              NULL,
-                                            write_resource_flags,
-                                            &wim->lzx_context);
+                                            write_resource_flags);
         FREE(xml_data);
         DEBUG("ret=%d", ret);
         return ret;
diff --git a/src/xpress-compress.c b/src/xpress-compress.c

index 005a0a22452692d47372907255838ed61d8aa81d..2637ce93cab8fa3de765b37fa6e0980431764043 100644 (file)
--- a/src/xpress-compress.c
+++ b/src/xpress-compress.c
@@ -31,7 +31,8 @@
  
  #include "wimlib.h"
  #include "wimlib/assert.h"
-#include "wimlib/compress.h"
+#include "wimlib/compressor_ops.h"
+#include "wimlib/compress_common.h"
  #include "wimlib/error.h"
  #include "wimlib/util.h"
  #include "wimlib/xpress.h"
@@ -42,6 +43,21 @@
  #include <stdlib.h>
  #include <string.h>
  
+struct xpress_record_ctx {
+       input_idx_t freqs[XPRESS_NUM_SYMBOLS];
+       struct xpress_match *matches;
+};
+
+struct xpress_compressor {
+       u8 *window;
+       u32 max_window_size;
+       struct xpress_match *matches;
+       input_idx_t *prev_tab;
+       u16 codewords[XPRESS_NUM_SYMBOLS];
+       u8 lens[XPRESS_NUM_SYMBOLS];
+       struct xpress_record_ctx record_ctx;
+};
+
  /* Intermediate XPRESS match/literal representation.  */
  struct xpress_match {
         u16 adjusted_len;  /* Match length minus XPRESS_MIN_MATCH_LEN */
@@ -98,11 +114,6 @@ xpress_write_matches_and_literals(struct output_bitstream *ostream,
         bitstream_put_bits(ostream, codewords[XPRESS_END_OF_DATA], lens[XPRESS_END_OF_DATA]);
  }
  
-struct xpress_record_ctx {
-       input_idx_t freqs[XPRESS_NUM_SYMBOLS];
-       struct xpress_match *matches;
-};
-
  static void
  xpress_record_literal(u8 lit, void *_ctx)
  {
@@ -144,26 +155,16 @@ static const struct lz_params xpress_lz_params = {
         .too_far        = 4096,
  };
  
-/* API function documented in wimlib.h  */
-WIMLIBAPI unsigned
-wimlib_xpress_compress(const void * restrict uncompressed_data,
-                      unsigned uncompressed_len,
-                      void * restrict compressed_data)
+static size_t
+xpress_compress(const void *uncompressed_data, size_t uncompressed_size,
+               void *compressed_data, size_t compressed_size_avail, void *_c)
  {
+       struct xpress_compressor *c = _c;
         u8 *cptr = compressed_data;
         struct output_bitstream ostream;
-
-       struct xpress_record_ctx record_ctx;
-
-       struct xpress_match *matches;
-       input_idx_t *prev_tab;
-       u8 *udata;
-
-       u16 codewords[XPRESS_NUM_SYMBOLS];
-       u8 lens[XPRESS_NUM_SYMBOLS];
         input_idx_t num_matches;
-       input_idx_t compressed_len;
         input_idx_t i;
+       size_t compressed_size;
  
         /* XPRESS requires 256 bytes of overhead for the Huffman code, so it's
          * impossible to compress 256 bytes or less of data to less than the
@@ -174,94 +175,146 @@ wimlib_xpress_compress(const void * restrict uncompressed_data,
          *
          * +4 to take into account that init_output_bitstream() requires at
          * least 4 bytes of data.  */
-       if (uncompressed_len < XPRESS_NUM_SYMBOLS / 2 + 1 + 4)
+       if (compressed_size_avail < XPRESS_NUM_SYMBOLS / 2 + 1 + 4)
                 return 0;
  
-       if (uncompressed_len <= STACK_MAX) {
-               matches = alloca(uncompressed_len * sizeof(matches[0]));
-               udata = alloca(uncompressed_len + 8);
-               prev_tab = alloca(uncompressed_len * sizeof(prev_tab[0]));
-       } else {
-               matches = MALLOC(uncompressed_len * sizeof(matches[0]));
-               udata = MALLOC(uncompressed_len + 8);
-               prev_tab = MALLOC(uncompressed_len * sizeof(prev_tab[0]));
-               if (matches == NULL || udata == NULL || prev_tab == NULL) {
-                       WARNING("Failed to allocate memory for compression...");
-                       compressed_len = 0;
-                       goto out_free;
-               }
-       }
-
         /* Copy the data to a temporary buffer, but only to avoid
          * inconsequential accesses of uninitialized memory in
          * lz_analyze_block().  */
-       memcpy(udata, uncompressed_data, uncompressed_len);
-       memset(udata + uncompressed_len, 0, 8);
+       memcpy(c->window, uncompressed_data, uncompressed_size);
+       memset(c->window + uncompressed_size, 0, 8);
  
         /* Determine match/literal sequence to divide the data into.  */
-       ZERO_ARRAY(record_ctx.freqs);
-       record_ctx.matches = matches;
-       lz_analyze_block(udata,
-                        uncompressed_len,
+       memset(c->record_ctx.freqs, 0, sizeof(c->record_ctx.freqs));
+       c->record_ctx.matches = c->matches;
+       lz_analyze_block(c->window,
+                        uncompressed_size,
                          xpress_record_match,
                          xpress_record_literal,
-                        &record_ctx,
+                        &c->record_ctx,
                          &xpress_lz_params,
-                        prev_tab);
+                        c->prev_tab);
  
-       num_matches = (record_ctx.matches - matches);
+       num_matches = (c->record_ctx.matches - c->matches);
  
         /* Account for end of data symbol.  */
-       record_ctx.freqs[XPRESS_END_OF_DATA]++;
+       c->record_ctx.freqs[XPRESS_END_OF_DATA]++;
  
         /* Build the Huffman code.  */
         make_canonical_huffman_code(XPRESS_NUM_SYMBOLS, XPRESS_MAX_CODEWORD_LEN,
-                                   record_ctx.freqs, lens, codewords);
+                                   c->record_ctx.freqs, c->lens, c->codewords);
  
         /* Output the Huffman code as a series of 512 4-bit lengths.  */
         for (i = 0; i < XPRESS_NUM_SYMBOLS; i += 2)
-               *cptr++ = (lens[i] & 0xf) | (lens[i + 1] << 4);
+               *cptr++ = (c->lens[i] & 0xf) | (c->lens[i + 1] << 4);
  
         /* Output the encoded matches/literals.  */
         init_output_bitstream(&ostream, cptr,
-                             uncompressed_len - XPRESS_NUM_SYMBOLS / 2 - 1);
-       xpress_write_matches_and_literals(&ostream, matches,
-                                         num_matches, codewords, lens);
+                             compressed_size_avail - XPRESS_NUM_SYMBOLS / 2 - 1);
+
+       xpress_write_matches_and_literals(&ostream, c->matches,
+                                         num_matches, c->codewords, c->lens);
  
         /* Flush any pending data and get the length of the compressed data.  */
-       compressed_len = flush_output_bitstream(&ostream);
-       if (compressed_len == ~(input_idx_t)0) {
-               compressed_len = 0;
-               goto out_free;
-       }
-       compressed_len += XPRESS_NUM_SYMBOLS / 2;
+       compressed_size = flush_output_bitstream(&ostream);
+       if (compressed_size == ~(input_idx_t)0)
+               return 0;
+
+       compressed_size += XPRESS_NUM_SYMBOLS / 2;
  
  #if defined(ENABLE_XPRESS_DEBUG) || defined(ENABLE_VERIFY_COMPRESSION)
         /* Verify that we really get the same thing back when decompressing.  */
-       if (wimlib_xpress_decompress(compressed_data, compressed_len,
-                                    udata, uncompressed_len))
         {
-               ERROR("Failed to decompress data we "
-                     "compressed using XPRESS algorithm");
-               wimlib_assert(0);
-               compressed_len = 0;
-               goto out_free;
-       }
-
-       if (memcmp(uncompressed_data, udata, uncompressed_len)) {
-               ERROR("Data we compressed using XPRESS algorithm "
-                     "didn't decompress to original");
-               wimlib_assert(0);
-               compressed_len = 0;
-               goto out_free;
+               struct wimlib_decompressor *decompressor;
+
+               if (0 == wimlib_create_decompressor(WIMLIB_COMPRESSION_TYPE_XPRESS,
+                                                   c->max_window_size,
+                                                   NULL,
+                                                   &decompressor))
+               {
+                       int ret;
+                       ret = wimlib_decompress(compressed_data,
+                                               compressed_size,
+                                               c->window,
+                                               uncompressed_size,
+                                               decompressor);
+                       wimlib_free_decompressor(decompressor);
+
+                       if (ret) {
+                               ERROR("Failed to decompress data we "
+                                     "compressed using XPRESS algorithm");
+                               wimlib_assert(0);
+                               return 0;
+                       }
+                       if (memcmp(uncompressed_data, c->window,
+                                  uncompressed_size))
+                       {
+                               ERROR("Data we compressed using XPRESS algorithm "
+                                     "didn't decompress to original");
+                               wimlib_assert(0);
+                               return 0;
+                       }
+               } else {
+                       WARNING("Failed to create decompressor for "
+                               "data verification!");
+               }
         }
  #endif
  
-out_free:
-       if (uncompressed_len > STACK_MAX) {
-               FREE(matches);
-               FREE(udata);
-               FREE(prev_tab);
+       return compressed_size;
+}
+
+static void
+xpress_free_compressor(void *_c)
+{
+       struct xpress_compressor *c = _c;
+
+       if (c) {
+               FREE(c->window);
+               FREE(c->matches);
+               FREE(c->prev_tab);
+               FREE(c);
         }
-       return compressed_len;
  }
+
+static int
+xpress_create_compressor(size_t max_window_size,
+                        const struct wimlib_compressor_params_header *params,
+                        void **c_ret)
+{
+       struct xpress_compressor *c;
+
+       if (max_window_size == 0 || max_window_size > (1U << 26))
+               return WIMLIB_ERR_INVALID_PARAM;
+
+       c = CALLOC(1, sizeof(struct xpress_compressor));
+       if (c == NULL)
+               goto oom;
+
+       c->window = MALLOC(max_window_size + 8);
+       if (c->window == NULL)
+               goto oom;
+
+       c->max_window_size = max_window_size;
+
+       c->matches = MALLOC(max_window_size * sizeof(c->matches[0]));
+       if (c->matches == NULL)
+               goto oom;
+
+       c->prev_tab = MALLOC(max_window_size * sizeof(c->prev_tab[0]));
+       if (c->prev_tab == NULL)
+               goto oom;
+
+       *c_ret = c;
+       return 0;
+
+oom:
+       xpress_free_compressor(c);
+       return WIMLIB_ERR_NOMEM;
+}
+
+const struct compressor_ops xpress_compressor_ops = {
+       .create_compressor  = xpress_create_compressor,
+       .compress           = xpress_compress,
+       .free_compressor    = xpress_free_compressor,
+};
diff --git a/src/xpress-decompress.c b/src/xpress-decompress.c

index f08cccbb4b405372b4a4bbb15018973ed7337875..e4f4c6ba43f4e7f0c8da423d698d87fe2b017925 100644 (file)
--- a/src/xpress-decompress.c
+++ b/src/xpress-decompress.c
@@ -70,7 +70,8 @@
  #endif
  
  #include "wimlib.h"
-#include "wimlib/decompress.h"
+#include "wimlib/decompressor_ops.h"
+#include "wimlib/decompress_common.h"
  #include "wimlib/xpress.h"
  
  /*
@@ -195,13 +196,11 @@ xpress_lz_decode(struct input_bitstream * restrict istream,
  
  
  /* API function documented in wimlib.h  */
-WIMLIBAPI int
-wimlib_xpress_decompress(const void * const restrict _compressed_data,
-                        const unsigned compressed_len,
-                        void * const restrict uncompressed_data,
-                        const unsigned uncompressed_len)
+static int
+xpress_decompress(const void *compressed_data, size_t compressed_size,
+                 void *uncompressed_data, size_t uncompressed_size, void *_ctx)
  {
-       const u8 *compressed_data = _compressed_data;
+       const u8 *cdata = compressed_data;
         u8 lens[XPRESS_NUM_SYMBOLS];
         u8 *lens_p;
         u16 decode_table[(1 << XPRESS_TABLEBITS) + 2 * XPRESS_NUM_SYMBOLS]
@@ -211,13 +210,13 @@ wimlib_xpress_decompress(const void * const restrict _compressed_data,
         /* XPRESS uses only one Huffman code.  It contains 512 symbols, and the
          * code lengths of these symbols are given literally as 4-bit integers
          * in the first 256 bytes of the compressed data.  */
-       if (compressed_len < XPRESS_NUM_SYMBOLS / 2)
+       if (compressed_size < XPRESS_NUM_SYMBOLS / 2)
                 return -1;
  
         lens_p = lens;
         for (unsigned i = 0; i < XPRESS_NUM_SYMBOLS / 2; i++) {
-               *lens_p++ = compressed_data[i] & 0xf;
-               *lens_p++ = compressed_data[i] >> 4;
+               *lens_p++ = cdata[i] & 0xf;
+               *lens_p++ = cdata[i] >> 4;
         }
  
         if (make_huffman_decode_table(decode_table, XPRESS_NUM_SYMBOLS,
@@ -225,9 +224,13 @@ wimlib_xpress_decompress(const void * const restrict _compressed_data,
                                       XPRESS_MAX_CODEWORD_LEN))
                 return -1;
  
-       init_input_bitstream(&istream, compressed_data + XPRESS_NUM_SYMBOLS / 2,
-                            compressed_len - XPRESS_NUM_SYMBOLS / 2);
+       init_input_bitstream(&istream, cdata + XPRESS_NUM_SYMBOLS / 2,
+                            compressed_size - XPRESS_NUM_SYMBOLS / 2);
  
         return xpress_lz_decode(&istream, uncompressed_data,
-                               uncompressed_len, lens, decode_table);
+                               uncompressed_size, lens, decode_table);
  }
+
+const struct decompressor_ops xpress_decompressor_ops = {
+       .decompress = xpress_decompress,
+};
author	Eric Biggers <ebiggers3@gmail.com>
	Wed, 25 Dec 2013 04:53:18 +0000 (22:53 -0600)
committer	Eric Biggers <ebiggers3@gmail.com>
	Wed, 25 Dec 2013 05:40:16 +0000 (23:40 -0600)
Makefile.am		patch \| blob \| history
include/wimlib.h		patch \| blob \| history
include/wimlib/chunk_compressor.h	[moved from include/wimlib/compress_chunks.h with 87% similarity]	patch \| blob \| history
include/wimlib/compress_common.h	[moved from include/wimlib/compress.h with 96% similarity]	patch \| blob \| history
include/wimlib/compressor_ops.h	[new file with mode: 0644]	patch \| blob
include/wimlib/decompress_common.h	[moved from include/wimlib/decompress.h with 98% similarity]	patch \| blob \| history
include/wimlib/decompressor_ops.h	[new file with mode: 0644]	patch \| blob
include/wimlib/lookup_table.h		patch \| blob \| history
include/wimlib/lzx.h		patch \| blob \| history
include/wimlib/wim.h		patch \| blob \| history
include/wimlib/write.h		patch \| blob \| history
programs/imagex.c		patch \| blob \| history
src/compress.c		patch \| blob \| history
src/compress_chunk.c	[deleted file]	patch \| blob \| history
src/compress_common.c	[new file with mode: 0644]	patch \| blob
src/compress_parallel.c		patch \| blob \| history
src/compress_serial.c		patch \| blob \| history
src/decompress.c		patch \| blob \| history
src/decompress_common.c	[new file with mode: 0644]	patch \| blob
src/integrity.c		patch \| blob \| history
src/lookup_table.c		patch \| blob \| history
src/lz77.c		patch \| blob \| history
src/lzms-compress.c	[new file with mode: 0644]	patch \| blob
src/lzms-decompress.c		patch \| blob \| history
src/lzx-common.c		patch \| blob \| history
src/lzx-compress.c		patch \| blob \| history
src/lzx-decompress.c		patch \| blob \| history
src/metadata_resource.c		patch \| blob \| history
src/resource.c		patch \| blob \| history
src/wim.c		patch \| blob \| history
src/write.c		patch \| blob \| history
src/xml.c		patch \| blob \| history
src/xpress-compress.c		patch \| blob \| history
src/xpress-decompress.c		patch \| blob \| history