*/
/*
- * Copyright (C) 2012, 2013, 2014 Eric Biggers
+ * Copyright (C) 2012-2016 Eric Biggers
*
- * This file is part of wimlib, a library for working with WIM files.
+ * This file is free software; you can redistribute it and/or modify it under
+ * the terms of the GNU Lesser General Public License as published by the Free
+ * Software Foundation; either version 3 of the License, or (at your option) any
+ * later version.
*
- * wimlib is free software; you can redistribute it and/or modify it under the
- * terms of the GNU General Public License as published by the Free
- * Software Foundation; either version 3 of the License, or (at your option)
- * any later version.
- *
- * wimlib is distributed in the hope that it will be useful, but WITHOUT ANY
- * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
- * A PARTICULAR PURPOSE. See the GNU General Public License for more
+ * This file is distributed in the hope that it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+ * FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more
* details.
*
- * You should have received a copy of the GNU General Public License
- * along with wimlib; if not, see http://www.gnu.org/licenses/.
+ * You should have received a copy of the GNU Lesser General Public License
+ * along with this file; if not, see http://www.gnu.org/licenses/.
*/
#ifdef HAVE_CONFIG_H
# include "config.h"
#endif
-#include "wimlib/apply.h"
-#include "wimlib/dentry.h"
-#include "wimlib/error.h"
-#include "wimlib/file_io.h"
-#include "wimlib/reparse.h"
-#include "wimlib/timestamp.h"
-#include "wimlib/unix_data.h"
-
#include <errno.h>
#include <fcntl.h>
-#include <limits.h>
#include <stdlib.h>
#include <sys/stat.h>
#include <sys/time.h>
#include <sys/types.h>
#include <unistd.h>
+#include "wimlib/apply.h"
+#include "wimlib/assert.h"
+#include "wimlib/blob_table.h"
+#include "wimlib/dentry.h"
+#include "wimlib/error.h"
+#include "wimlib/file_io.h"
+#include "wimlib/reparse.h"
+#include "wimlib/timestamp.h"
+#include "wimlib/unix_data.h"
+
/* We don't require O_NOFOLLOW, but the advantage of having it is that if we
* need to extract a file to a location at which there exists a symbolic link,
* open(..., O_NOFOLLOW | ...) recognizes the symbolic link rather than
unix_get_supported_features(const char *target,
struct wim_features *supported_features)
{
+ supported_features->sparse_files = 1;
supported_features->hard_links = 1;
supported_features->symlink_reparse_points = 1;
supported_features->unix_data = 1;
}
#define NUM_PATHBUFS 2 /* We need 2 when creating hard links */
-#define MAX_OPEN_FDS 1000 /* TODO: Add special case for when the number of
- identical streams exceeds this number. */
struct unix_apply_ctx {
/* Extract flags, the pointer to the WIMStruct, etc. */
unsigned which_pathbuf;
/* Currently open file descriptors for extraction */
- struct filedes open_fds[MAX_OPEN_FDS];
+ struct filedes open_fds[MAX_OPEN_FILES];
/* Number of currently open file descriptors in open_fds, starting from
* the beginning of the array. */
unsigned num_open_fds;
- /* Buffer for reading reparse data streams into memory */
+ /* For each currently open file, whether we're writing to it in "sparse"
+ * mode or not. */
+ bool is_sparse_file[MAX_OPEN_FILES];
+
+ /* Whether is_sparse_file[] is true for any currently open file */
+ bool any_sparse_files;
+
+ /* Buffer for reading reparse point data into memory */
u8 reparse_data[REPARSE_DATA_MAX_SIZE];
/* Pointer to the next byte in @reparse_data to fill */
d = dentry;
do {
p -= d->d_extraction_name_nchars;
- memcpy(p, d->d_extraction_name, d->d_extraction_name_nchars);
+ if (d->d_extraction_name_nchars)
+ memcpy(p, d->d_extraction_name,
+ d->d_extraction_name_nchars);
*--p = '/';
d = d->d_parent;
} while (!dentry_is_root(d) && will_extract_dentry(d));
return unix_build_extraction_path(inode_first_extraction_dentry(inode), ctx);
}
-/* Sets the timestamps on a file being extracted.
- *
- * Either @fd or @path must be specified (not -1 and not NULL, respectively).
- */
+/* Should the specified file be extracted as a directory on UNIX? We extract
+ * the file as a directory if FILE_ATTRIBUTE_DIRECTORY is set and the file does
+ * not have a symlink or junction reparse point. It *may* have a different type
+ * of reparse point. */
+static inline bool
+should_extract_as_directory(const struct wim_inode *inode)
+{
+ return (inode->i_attributes & FILE_ATTRIBUTE_DIRECTORY) &&
+ !inode_is_symlink(inode);
+}
+
+/* Sets the timestamps on a file being extracted. */
static int
-unix_set_timestamps(int fd, const char *path, u64 atime, u64 mtime)
+unix_set_timestamps(const char *path, u64 atime, u64 mtime)
{
+#ifdef HAVE_UTIMENSAT
{
struct timespec times[2];
times[0] = wim_timestamp_to_timespec(atime);
times[1] = wim_timestamp_to_timespec(mtime);
- errno = ENOSYS;
-#ifdef HAVE_FUTIMENS
- if (fd >= 0 && !futimens(fd, times))
- return 0;
-#endif
-#ifdef HAVE_UTIMENSAT
- if (fd < 0 && !utimensat(AT_FDCWD, path, times, AT_SYMLINK_NOFOLLOW))
+ if (utimensat(AT_FDCWD, path, times, AT_SYMLINK_NOFOLLOW) == 0)
return 0;
-#endif
if (errno != ENOSYS)
- return WIMLIB_ERR_SET_TIMESTAMPS;
+ return -1;
}
+#endif
{
struct timeval times[2];
times[0] = wim_timestamp_to_timeval(atime);
times[1] = wim_timestamp_to_timeval(mtime);
- if (fd >= 0 && !futimes(fd, times))
- return 0;
- if (fd < 0 && !lutimes(path, times))
- return 0;
- return WIMLIB_ERR_SET_TIMESTAMPS;
+ return lutimes(path, times);
}
}
+/* Set metadata on an extracted file. */
static int
-unix_set_owner_and_group(int fd, const char *path, uid_t uid, gid_t gid)
+unix_set_metadata(const struct wim_inode *inode, struct unix_apply_ctx *ctx)
{
- if (fd >= 0 && !fchown(fd, uid, gid))
- return 0;
- if (fd < 0 && !lchown(path, uid, gid))
- return 0;
- return WIMLIB_ERR_SET_SECURITY;
-}
-
-static int
-unix_set_mode(int fd, const char *path, mode_t mode)
-{
- if (fd >= 0 && !fchmod(fd, mode))
- return 0;
- if (fd < 0 && !chmod(path, mode))
- return 0;
- return WIMLIB_ERR_SET_SECURITY;
-}
-
-/*
- * Set metadata on an extracted file.
- *
- * @fd is an open file descriptor to the extracted file, or -1. @path is the
- * path to the extracted file, or NULL. If valid, this function uses @fd.
- * Otherwise, if valid, it uses @path. Otherwise, it calculates the path to one
- * alias of the extracted file and uses it.
- */
-static int
-unix_set_metadata(int fd, const struct wim_inode *inode,
- const char *path, struct unix_apply_ctx *ctx)
-{
- int ret;
+ const char *path = unix_build_inode_extraction_path(inode, ctx);
struct wimlib_unix_data unix_data;
- if (fd < 0 && !path)
- path = unix_build_inode_extraction_path(inode, ctx);
-
if ((ctx->common.extract_flags & WIMLIB_EXTRACT_FLAG_UNIX_DATA)
&& inode_get_unix_data(inode, &unix_data))
{
u32 gid = unix_data.gid;
u32 mode = unix_data.mode;
- ret = unix_set_owner_and_group(fd, path, uid, gid);
- if (ret) {
- if (!path)
- path = unix_build_inode_extraction_path(inode, ctx);
+ if (lchown(path, uid, gid) != 0) {
if (ctx->common.extract_flags &
WIMLIB_EXTRACT_FLAG_STRICT_ACLS)
{
ERROR_WITH_ERRNO("Can't set uid=%"PRIu32" and "
"gid=%"PRIu32" on \"%s\"",
uid, gid, path);
- return ret;
- } else {
- WARNING_WITH_ERRNO("Can't set uid=%"PRIu32" and "
- "gid=%"PRIu32" on \"%s\"",
- uid, gid, path);
+ return WIMLIB_ERR_SET_SECURITY;
}
+ WARNING_WITH_ERRNO("Can't set uid=%"PRIu32" and "
+ "gid=%"PRIu32" on \"%s\"",
+ uid, gid, path);
}
- ret = 0;
- if (!inode_is_symlink(inode))
- ret = unix_set_mode(fd, path, mode);
- if (ret) {
- if (!path)
- path = unix_build_inode_extraction_path(inode, ctx);
+ if (!inode_is_symlink(inode) && chmod(path, mode) != 0) {
if (ctx->common.extract_flags &
WIMLIB_EXTRACT_FLAG_STRICT_ACLS)
{
ERROR_WITH_ERRNO("Can't set mode=0%"PRIo32" "
"on \"%s\"", mode, path);
- return ret;
- } else {
- WARNING_WITH_ERRNO("Can't set mode=0%"PRIo32" "
- "on \"%s\"", mode, path);
+ return WIMLIB_ERR_SET_SECURITY;
}
+ WARNING_WITH_ERRNO("Can't set mode=0%"PRIo32" "
+ "on \"%s\"", mode, path);
}
}
- ret = unix_set_timestamps(fd, path,
- inode->i_last_access_time,
- inode->i_last_write_time);
- if (ret) {
- if (!path)
- path = unix_build_inode_extraction_path(inode, ctx);
+ if (unix_set_timestamps(path, inode->i_last_access_time,
+ inode->i_last_write_time) != 0)
+ {
if (ctx->common.extract_flags &
WIMLIB_EXTRACT_FLAG_STRICT_TIMESTAMPS)
{
ERROR_WITH_ERRNO("Can't set timestamps on \"%s\"", path);
- return ret;
- } else {
- WARNING_WITH_ERRNO("Can't set timestamps on \"%s\"", path);
+ return WIMLIB_ERR_SET_TIMESTAMPS;
}
+ WARNING_WITH_ERRNO("Can't set timestamps on \"%s\"", path);
}
return 0;
}
-/* Extract all needed aliases of the @inode, where one alias, corresponding to
- * @first_dentry, has already been extracted to @first_path. */
+/*
+ * Extract all needed aliases of the specified @inode, where the first alias has
+ * already been extracted to @first_path.
+ */
static int
unix_create_hardlinks(const struct wim_inode *inode,
- const struct wim_dentry *first_dentry,
const char *first_path, struct unix_apply_ctx *ctx)
{
const struct wim_dentry *dentry;
const char *newpath;
- list_for_each_entry(dentry, &inode->i_extraction_aliases,
- d_extraction_alias_node)
- {
- if (dentry == first_dentry)
+ inode_for_each_extraction_alias(dentry, inode) {
+ if (dentry == inode_first_extraction_dentry(inode))
continue;
-
newpath = unix_build_extraction_path(dentry, ctx);
retry_link:
if (link(first_path, newpath)) {
return 0;
}
-/* If @dentry represents a directory, create it. */
static int
-unix_create_if_directory(const struct wim_dentry *dentry,
- struct unix_apply_ctx *ctx)
+unix_create_directory(const struct wim_dentry *dentry,
+ struct unix_apply_ctx *ctx)
{
- const char *path;
+ const char *path = unix_build_extraction_path(dentry, ctx);
struct stat stbuf;
- if (!dentry_is_directory(dentry))
- return 0;
-
- path = unix_build_extraction_path(dentry, ctx);
if (mkdir(path, 0755) &&
/* It's okay if the path already exists, as long as it's a
* directory. */
ERROR_WITH_ERRNO("Can't create directory \"%s\"", path);
return WIMLIB_ERR_MKDIR;
}
+
return 0;
}
-/* If @dentry represents an empty regular file or a special file, create it, set
- * its metadata, and create any needed hard links. */
static int
-unix_extract_if_empty_file(const struct wim_dentry *dentry,
- struct unix_apply_ctx *ctx)
+unix_create_nondirectory(const struct wim_inode *inode,
+ struct unix_apply_ctx *ctx)
{
- const struct wim_inode *inode;
+ const char *path = unix_build_inode_extraction_path(inode, ctx);
struct wimlib_unix_data unix_data;
- const char *path;
- int ret;
-
- inode = dentry->d_inode;
-
- /* Extract all aliases only when the "first" comes up. */
- if (dentry != inode_first_extraction_dentry(inode))
- return 0;
-
- /* Is this a directory, a symbolic link, or any type of nonempty file?
- */
- if (inode_is_directory(inode) || inode_is_symlink(inode) ||
- inode_unnamed_lte_resolved(inode))
- return 0;
/* Recognize special files in UNIX_DATA mode */
if ((ctx->common.extract_flags & WIMLIB_EXTRACT_FLAG_UNIX_DATA) &&
inode_get_unix_data(inode, &unix_data) &&
!S_ISREG(unix_data.mode))
{
- path = unix_build_extraction_path(dentry, ctx);
retry_mknod:
if (mknod(path, unix_data.mode, unix_data.rdev)) {
if (errno == EPERM) {
path);
return WIMLIB_ERR_MKNOD;
}
- /* On special files, we can set timestamps immediately because
- * we don't need to write any data to them. */
- ret = unix_set_metadata(-1, inode, path, ctx);
} else {
int fd;
- path = unix_build_extraction_path(dentry, ctx);
retry_create:
- fd = open(path, O_TRUNC | O_CREAT | O_WRONLY | O_NOFOLLOW, 0644);
+ fd = open(path, O_EXCL | O_CREAT | O_WRONLY | O_NOFOLLOW, 0644);
if (fd < 0) {
if (errno == EEXIST && !unlink(path))
goto retry_create;
ERROR_WITH_ERRNO("Can't create regular file \"%s\"", path);
return WIMLIB_ERR_OPEN;
}
- /* On empty files, we can set timestamps immediately because we
- * don't need to write any data to them. */
- ret = unix_set_metadata(fd, inode, path, ctx);
- if (close(fd) && !ret) {
+ if (close(fd)) {
ERROR_WITH_ERRNO("Error closing \"%s\"", path);
- ret = WIMLIB_ERR_WRITE;
+ return WIMLIB_ERR_WRITE;
}
}
- if (ret)
- return ret;
- return unix_create_hardlinks(inode, dentry, path, ctx);
+ return unix_create_hardlinks(inode, path, ctx);
}
+/* Create all files (and directories) except for symlinks. */
static int
-unix_create_dirs_and_empty_files(const struct list_head *dentry_list,
- struct unix_apply_ctx *ctx)
+unix_create_file_structure(const struct list_head *dentry_list,
+ struct unix_apply_ctx *ctx)
{
const struct wim_dentry *dentry;
+ const struct wim_inode *inode;
int ret;
list_for_each_entry(dentry, dentry_list, d_extraction_list_node) {
- ret = unix_create_if_directory(dentry, ctx);
+ inode = dentry->d_inode;
+ if (!should_extract_as_directory(inode))
+ continue;
+ ret = unix_create_directory(dentry, ctx);
+ if (!ret)
+ ret = report_file_created(&ctx->common);
if (ret)
return ret;
}
list_for_each_entry(dentry, dentry_list, d_extraction_list_node) {
- ret = unix_extract_if_empty_file(dentry, ctx);
+ inode = dentry->d_inode;
+ if (should_extract_as_directory(inode) ||
+ inode_is_symlink(inode) ||
+ dentry != inode_first_extraction_dentry(inode))
+ continue;
+ ret = unix_create_nondirectory(inode, ctx);
+ if (!ret)
+ ret = report_file_created(&ctx->common);
if (ret)
return ret;
}
return 0;
}
+static void
+unix_count_inodes(const struct list_head *dentry_list,
+ u64 *full_count, u64 *symlink_count)
+{
+ const struct wim_dentry *dentry;
+
+ *full_count = 0;
+ *symlink_count = 0;
+
+ list_for_each_entry(dentry, dentry_list, d_extraction_list_node) {
+ if (dentry != inode_first_extraction_dentry(dentry->d_inode))
+ continue;
+ ++*full_count;
+ if (inode_is_symlink(dentry->d_inode))
+ ++*symlink_count;
+ }
+}
+
static int
unix_create_symlink(const struct wim_inode *inode, const char *path,
- const u8 *rpdata, u16 rpdatalen, bool rpfix,
- const char *apply_dir, size_t apply_dir_nchars)
+ size_t rpdatalen, struct unix_apply_ctx *ctx)
{
- char link_target[REPARSE_DATA_MAX_SIZE];
+ char target[REPARSE_POINT_MAX_SIZE];
+ struct blob_descriptor blob_override;
int ret;
- struct wim_lookup_table_entry lte_override;
- lte_override.resource_location = RESOURCE_IN_ATTACHED_BUFFER;
- lte_override.attached_buffer = (void *)rpdata;
- lte_override.size = rpdatalen;
+ blob_set_is_located_in_attached_buffer(&blob_override,
+ ctx->reparse_data, rpdatalen);
- ret = wim_inode_readlink(inode, link_target,
- sizeof(link_target) - 1, &lte_override);
- if (ret < 0) {
+ ret = wim_inode_readlink(inode, target, sizeof(target) - 1,
+ &blob_override,
+ ctx->target_abspath,
+ ctx->target_abspath_nchars);
+ if (unlikely(ret < 0)) {
errno = -ret;
return WIMLIB_ERR_READLINK;
}
+ target[ret] = '\0';
- link_target[ret] = 0;
-
- if (rpfix && link_target[0] == '/') {
-
- /* "Fix" the absolute symbolic link by prepending the absolute
- * path to the target directory. */
-
- if (sizeof(link_target) - (ret + 1) < apply_dir_nchars) {
- errno = ENAMETOOLONG;
- return WIMLIB_ERR_REPARSE_POINT_FIXUP_FAILED;
- }
- memmove(link_target + apply_dir_nchars, link_target,
- ret + 1);
- memcpy(link_target, apply_dir, apply_dir_nchars);
- }
retry_symlink:
- if (symlink(link_target, path)) {
+ if (symlink(target, path)) {
if (errno == EEXIST && !unlink(path))
goto retry_symlink;
return WIMLIB_ERR_LINK;
for (unsigned i = offset; i < ctx->num_open_fds; i++)
filedes_close(&ctx->open_fds[i]);
ctx->num_open_fds = 0;
+ ctx->any_sparse_files = false;
}
static int
-unix_begin_extract_stream_instance(const struct wim_lookup_table_entry *stream,
- const struct wim_inode *inode,
- struct unix_apply_ctx *ctx)
+unix_begin_extract_blob_instance(const struct blob_descriptor *blob,
+ const struct wim_inode *inode,
+ const struct wim_inode_stream *strm,
+ struct unix_apply_ctx *ctx)
{
- const struct wim_dentry *first_dentry;
- const char *first_path;
+ const char *path = unix_build_inode_extraction_path(inode, ctx);
int fd;
- if (inode_is_symlink(inode)) {
+ if (unlikely(strm->stream_type == STREAM_TYPE_REPARSE_POINT)) {
/* On UNIX, symbolic links must be created with symlink(), which
* requires that the full link target be available. */
- if (stream->size > REPARSE_DATA_MAX_SIZE) {
+ if (blob->size > REPARSE_DATA_MAX_SIZE) {
ERROR_WITH_ERRNO("Reparse data of \"%s\" has size "
"%"PRIu64" bytes (exceeds %u bytes)",
- inode_first_full_path(inode),
- stream->size, REPARSE_DATA_MAX_SIZE);
+ path,
+ blob->size, REPARSE_DATA_MAX_SIZE);
return WIMLIB_ERR_INVALID_REPARSE_DATA;
}
ctx->reparse_ptr = ctx->reparse_data;
return 0;
}
- if (ctx->num_open_fds == MAX_OPEN_FDS) {
- ERROR("Can't extract data: too many open files!");
- return WIMLIB_ERR_UNSUPPORTED;
- }
+ wimlib_assert(stream_is_unnamed_data_stream(strm));
- first_dentry = inode_first_extraction_dentry(inode);
- first_path = unix_build_extraction_path(first_dentry, ctx);
-retry_create:
- fd = open(first_path, O_TRUNC | O_CREAT | O_WRONLY | O_NOFOLLOW, 0644);
+ /* Unnamed data stream of "regular" file */
+
+ /* This should be ensured by extract_blob_list() */
+ wimlib_assert(ctx->num_open_fds < MAX_OPEN_FILES);
+
+ fd = open(path, O_WRONLY | O_NOFOLLOW);
if (fd < 0) {
- if (errno == EEXIST && !unlink(first_path))
- goto retry_create;
- ERROR_WITH_ERRNO("Can't create regular file \"%s\"", first_path);
+ ERROR_WITH_ERRNO("Can't open regular file \"%s\"", path);
return WIMLIB_ERR_OPEN;
}
+ if (inode->i_attributes & FILE_ATTRIBUTE_SPARSE_FILE) {
+ ctx->is_sparse_file[ctx->num_open_fds] = true;
+ ctx->any_sparse_files = true;
+ } else {
+ ctx->is_sparse_file[ctx->num_open_fds] = false;
+#ifdef HAVE_POSIX_FALLOCATE
+ posix_fallocate(fd, 0, blob->size);
+#endif
+ }
filedes_init(&ctx->open_fds[ctx->num_open_fds++], fd);
- return unix_create_hardlinks(inode, first_dentry, first_path, ctx);
+ return 0;
}
-/* Called when starting to read a single-instance stream for extraction */
+/* Called when starting to read a blob for extraction */
static int
-unix_begin_extract_stream(struct wim_lookup_table_entry *stream,
- u32 flags, void *_ctx)
+unix_begin_extract_blob(struct blob_descriptor *blob, void *_ctx)
{
struct unix_apply_ctx *ctx = _ctx;
- const struct stream_owner *owners = stream_owners(stream);
- int ret;
+ const struct blob_extraction_target *targets = blob_extraction_targets(blob);
- for (u32 i = 0; i < stream->out_refcnt; i++) {
- const struct wim_inode *inode = owners[i].inode;
-
- ret = unix_begin_extract_stream_instance(stream, inode, ctx);
+ for (u32 i = 0; i < blob->out_refcnt; i++) {
+ int ret = unix_begin_extract_blob_instance(blob,
+ targets[i].inode,
+ targets[i].stream,
+ ctx);
if (ret) {
ctx->reparse_ptr = NULL;
unix_cleanup_open_fds(ctx, 0);
return 0;
}
-/* Called when the next chunk of a single-instance stream has been read for
- * extraction */
+/* Called when the next chunk of a blob has been read for extraction */
static int
-unix_extract_chunk(const void *chunk, size_t size, void *_ctx)
+unix_extract_chunk(const struct blob_descriptor *blob, u64 offset,
+ const void *chunk, size_t size, void *_ctx)
{
struct unix_apply_ctx *ctx = _ctx;
+ const void * const end = chunk + size;
+ const void *p;
+ bool zeroes;
+ size_t len;
+ unsigned i;
int ret;
- for (unsigned i = 0; i < ctx->num_open_fds; i++) {
- ret = full_write(&ctx->open_fds[i], chunk, size);
- if (ret) {
- ERROR_WITH_ERRNO("Error writing data to filesystem");
- return ret;
+ /*
+ * For sparse files, only write nonzero regions. This lets the
+ * filesystem use holes to represent zero regions.
+ */
+ for (p = chunk; p != end; p += len, offset += len) {
+ zeroes = maybe_detect_sparse_region(p, end - p, &len,
+ ctx->any_sparse_files);
+ for (i = 0; i < ctx->num_open_fds; i++) {
+ if (!zeroes || !ctx->is_sparse_file[i]) {
+ ret = full_pwrite(&ctx->open_fds[i],
+ p, len, offset);
+ if (ret)
+ goto err;
+ }
}
}
+
if (ctx->reparse_ptr)
ctx->reparse_ptr = mempcpy(ctx->reparse_ptr, chunk, size);
return 0;
+
+err:
+ ERROR_WITH_ERRNO("Error writing data to filesystem");
+ return ret;
}
-/* Called when a single-instance stream has been fully read for extraction */
+/* Called when a blob has been fully read for extraction */
static int
-unix_end_extract_stream(struct wim_lookup_table_entry *stream, int status,
- void *_ctx)
+unix_end_extract_blob(struct blob_descriptor *blob, int status, void *_ctx)
{
struct unix_apply_ctx *ctx = _ctx;
int ret;
unsigned j;
- const struct stream_owner *owners = stream_owners(stream);
+ const struct blob_extraction_target *targets = blob_extraction_targets(blob);
ctx->reparse_ptr = NULL;
j = 0;
ret = 0;
- for (u32 i = 0; i < stream->out_refcnt; i++) {
- struct wim_inode *inode = owners[i].inode;
+ for (u32 i = 0; i < blob->out_refcnt; i++) {
+ struct wim_inode *inode = targets[i].inode;
if (inode_is_symlink(inode)) {
/* We finally have the symlink data, so we can create
* the symlink. */
const char *path;
- bool rpfix;
-
- rpfix = (ctx->common.extract_flags &
- WIMLIB_EXTRACT_FLAG_RPFIX) &&
- !inode->i_not_rpfixed;
path = unix_build_inode_extraction_path(inode, ctx);
- ret = unix_create_symlink(inode, path,
- ctx->reparse_data,
- stream->size,
- rpfix,
- ctx->target_abspath,
- ctx->target_abspath_nchars);
+ ret = unix_create_symlink(inode, path, blob->size, ctx);
if (ret) {
ERROR_WITH_ERRNO("Can't create symbolic link "
"\"%s\"", path);
break;
}
- ret = unix_set_metadata(-1, inode, path, ctx);
- if (ret)
- break;
} else {
- /* Set metadata on regular file just before closing it.
- */
struct filedes *fd = &ctx->open_fds[j];
- ret = unix_set_metadata(fd->fd, inode, NULL, ctx);
- if (ret)
+ /* If the file is sparse, extend it to its final size. */
+ if (ctx->is_sparse_file[j] && ftruncate(fd->fd, blob->size)) {
+ ERROR_WITH_ERRNO("Error extending \"%s\" to final size",
+ unix_build_inode_extraction_path(inode, ctx));
+ ret = WIMLIB_ERR_WRITE;
break;
+ }
if (filedes_close(fd)) {
ERROR_WITH_ERRNO("Error closing \"%s\"",
return ret;
}
+/* Apply metadata to all extracted files (and directories). */
static int
-unix_set_dir_metadata(struct list_head *dentry_list, struct unix_apply_ctx *ctx)
+unix_apply_metadata(struct list_head *dentry_list, struct unix_apply_ctx *ctx)
{
const struct wim_dentry *dentry;
+ const struct wim_inode *inode;
int ret;
- list_for_each_entry_reverse(dentry, dentry_list, d_extraction_list_node) {
- if (dentry_is_directory(dentry)) {
- ret = unix_set_metadata(-1, dentry->d_inode, NULL, ctx);
- if (ret)
- return ret;
- }
+ list_for_each_entry_reverse(dentry, dentry_list, d_extraction_list_node)
+ {
+ inode = dentry->d_inode;
+ if (dentry != inode_first_extraction_dentry(inode))
+ continue;
+ ret = unix_set_metadata(inode, ctx);
+ if (!ret)
+ ret = report_file_metadata_applied(&ctx->common);
+ if (ret)
+ return ret;
}
return 0;
}
int ret;
struct unix_apply_ctx *ctx = (struct unix_apply_ctx *)_ctx;
size_t path_max;
+ u64 full_count;
+ u64 symlink_count;
/* Compute the maximum path length that will be needed, then allocate
* some path buffers. */
ctx->common.target, ctx->common.target_nchars);
}
- /* Extract directories and empty regular files. Directories are needed
- * because we can't extract any other files until their directories
- * exist. Empty files are needed because they don't have
- * representatives in the stream list. */
- ret = unix_create_dirs_and_empty_files(dentry_list, ctx);
+ /*
+ * We do the extraction in three phases:
+ *
+ * 1. Create all directories and files except for symlinks
+ * 2. Extract streams
+ * 3. Apply metadata
+ *
+ * In phase (2), the streams which may be extracted include unnamed data
+ * streams (regular file contents), reparse streams (translated to
+ * symlink targets), and extended attribute (xattr) streams. These may
+ * come up for extraction in any order. Therefore, at least when xattr
+ * streams are present, all files must be created earlier, in phase (1).
+ *
+ * Symlinks are an exception: they cannot be created until the reparse
+ * stream comes up for extraction. Currently we hack around this by
+ * caching the xattrs of symlinks in memory until they can be applied
+ * between phases (2) and (3).
+ *
+ * Note that phase (3) must happen after all data and xattr extraction
+ * because it might set the file's mode to read-only (which precludes
+ * setxattr), and it also will set timestamps including the last
+ * modification time (which precludes write).
+ */
+
+ unix_count_inodes(dentry_list, &full_count, &symlink_count);
+
+ ret = start_file_structure_phase(&ctx->common,
+ full_count - symlink_count);
+ if (ret)
+ goto out;
+
+ ret = unix_create_file_structure(dentry_list, ctx);
+ if (ret)
+ goto out;
+
+ ret = end_file_structure_phase(&ctx->common);
if (ret)
goto out;
ctx->target_abspath_nchars = strlen(ctx->target_abspath);
}
- /* Extract nonempty regular files and symbolic links. */
-
- struct read_stream_list_callbacks cbs = {
- .begin_stream = unix_begin_extract_stream,
- .begin_stream_ctx = ctx,
- .consume_chunk = unix_extract_chunk,
- .consume_chunk_ctx = ctx,
- .end_stream = unix_end_extract_stream,
- .end_stream_ctx = ctx,
+ struct read_blob_callbacks cbs = {
+ .begin_blob = unix_begin_extract_blob,
+ .continue_blob = unix_extract_chunk,
+ .end_blob = unix_end_extract_blob,
+ .ctx = ctx,
};
- ret = extract_stream_list(&ctx->common, &cbs);
+ ret = extract_blob_list(&ctx->common, &cbs);
+ if (ret)
+ goto out;
+
+ ret = start_file_metadata_phase(&ctx->common, full_count);
if (ret)
goto out;
- /* Set directory metadata. We do this last so that we get the right
- * directory timestamps. */
- ret = unix_set_dir_metadata(dentry_list, ctx);
+ ret = unix_apply_metadata(dentry_list, ctx);
if (ret)
goto out;
+
+ ret = end_file_metadata_phase(&ctx->common);
+ if (ret)
+ goto out;
+
if (ctx->num_special_files_ignored) {
WARNING("%lu special files were not extracted due to EPERM!",
ctx->num_special_files_ignored);