- hFile = win32_open_file_readonly(path);
- if (hFile == INVALID_HANDLE_VALUE)
- return WIMLIB_ERR_OPEN;
-
- sha1_init(&ctx);
- for (;;) {
- if (!ReadFile(hFile, buf, sizeof(buf), &bytesRead, NULL)) {
- ret = WIMLIB_ERR_READ;
- goto out_close_handle;
- }
- if (bytesRead == 0)
- break;
- sha1_update(&ctx, buf, bytesRead);
- }
- ret = 0;
- sha1_final(hash, &ctx);
-out_close_handle:
- CloseHandle(hFile);
- return ret;
-}
-
-/* Scans an unnamed or named stream of a Win32 file (not a reparse point
- * stream); calculates its SHA1 message digest and either creates a `struct
- * wim_lookup_table_entry' in memory for it, or uses an existing `struct
- * wim_lookup_table_entry' for an identical stream.
- *
- * Streams whose type is not $DATA are skipped and reported as success.
- *
- * @path_utf16:  Path to the file (UTF-16LE).
- *
- * @path_utf16_nchars:  Number of 2-byte characters in @path_utf16.
- *
- * @inode:  WIM inode to save the stream into.
- *
- * @lookup_table:  Stream lookup table for the WIM.
- *
- * @dat:  A `WIN32_FIND_STREAM_DATA' structure that specifies the
- *	  stream name.  For $DATA streams, its cStreamName is modified in
- *	  place: the colon separating the stream name from the stream type
- *	  is overwritten with a null terminator.
- *
- * Returns 0 on success; nonzero on failure (WIMLIB_ERR_READ for a malformed
- * stream name, WIMLIB_ERR_NOMEM on allocation failure, or the error code
- * returned by utf16_to_utf8() or win32_sha1sum()).
- */
-static int win32_capture_stream(const wchar_t *path_utf16,
-				size_t path_utf16_nchars,
-				struct wim_inode *inode,
-				struct wim_lookup_table *lookup_table,
-				WIN32_FIND_STREAM_DATA *dat)
-{
-	struct wim_ads_entry *ads_entry = NULL;
-	u8 hash[SHA1_HASH_SIZE];
-	struct wim_lookup_table_entry *lte;
-	int ret;
-	wchar_t *p, *colon;
-	bool is_named_stream;
-	wchar_t *spath;
-	size_t spath_nchars;
-	DWORD err;
-
-	/* The stream name should be returned as :NAME:TYPE */
-	p = dat->cStreamName;
-	if (*p != L':')
-		goto out_invalid_stream_name;
-	p += 1;
-	colon = wcschr(p, L':');
-	if (colon == NULL)
-		goto out_invalid_stream_name;
-
-	if (wcscmp(colon + 1, L"$DATA")) {
-		/* Not a DATA stream */
-		ret = 0;
-		goto out;
-	}
-
-	/* An empty NAME component (p == colon) means the unnamed stream. */
-	is_named_stream = (p != colon);
-	if (is_named_stream) {
-		/* Allocate an ADS entry for the named stream. */
-		char *utf8_stream_name;
-		size_t utf8_stream_name_len;
-		ret = utf16_to_utf8((const char *)p,
-				    (colon - p) * sizeof(wchar_t),
-				    &utf8_stream_name,
-				    &utf8_stream_name_len);
-		if (ret)
-			goto out;
-		ads_entry = inode_add_ads(inode, utf8_stream_name);
-		FREE(utf8_stream_name);
-		if (!ads_entry) {
-			ret = WIMLIB_ERR_NOMEM;
-			goto out;
-		}
-	}
-
-	/* Create a UTF-16 string @spath that gives the filename, then a colon,
-	 * then the stream name.  Or, if it's an unnamed stream, just the
-	 * filename.  It is MALLOC()'ed so that it can be saved in the
-	 * wim_lookup_table_entry if needed. */
-	*colon = L'\0';
-	spath_nchars = path_utf16_nchars;
-	if (is_named_stream)
-		spath_nchars += colon - p + 1;
-
-	spath = MALLOC((spath_nchars + 1) * sizeof(wchar_t));
-	if (!spath) {
-		/* Do not dereference a failed allocation in memcpy() below. */
-		ret = WIMLIB_ERR_NOMEM;
-		goto out;
-	}
-	memcpy(spath, path_utf16, path_utf16_nchars * sizeof(wchar_t));
-	if (is_named_stream) {
-		spath[path_utf16_nchars] = L':';
-		memcpy(&spath[path_utf16_nchars + 1], p,
-		       (colon - p) * sizeof(wchar_t));
-	}
-	spath[spath_nchars] = L'\0';
-
-	ret = win32_sha1sum(spath, hash);
-	if (ret) {
-		err = GetLastError();
-		/* Report the full stream path, which is what failed to read. */
-		ERROR("Win32 API: Failed to read \"%ls\" to calculate SHA1sum",
-		      spath);
-		win32_error(err);
-		goto out_free_spath;
-	}
-
-	lte = __lookup_resource(lookup_table, hash);
-	if (lte) {
-		/* Use existing wim_lookup_table_entry that has the same SHA1
-		 * message digest */
-		lte->refcnt++;
-	} else {
-		/* Make a new wim_lookup_table_entry */
-		lte = new_lookup_table_entry();
-		if (!lte) {
-			ret = WIMLIB_ERR_NOMEM;
-			goto out_free_spath;
-		}
-		/* Ownership of @spath passes to the lookup table entry; clear
-		 * the local pointer so it is not freed below. */
-		lte->file_on_disk = (char*)spath;
-		spath = NULL;
-		lte->resource_location = RESOURCE_WIN32;
-		lte->resource_entry.original_size = (uint64_t)dat->StreamSize.QuadPart;
-		lte->resource_entry.size = (uint64_t)dat->StreamSize.QuadPart;
-		copy_hash(lte->hash, hash);
-		lookup_table_insert(lookup_table, lte);
-	}
-	if (is_named_stream)
-		ads_entry->lte = lte;
-	else
-		inode->i_lte = lte;
-out_free_spath:
-	FREE(spath);
-out:
-	return ret;
-out_invalid_stream_name:
-	ERROR("Invalid stream name: \"%ls:%ls\"", path_utf16, dat->cStreamName);
-	ret = WIMLIB_ERR_READ;
-	goto out;
-}
-
-/* Enumerates the data streams (unnamed and named; not reparse point streams)
- * of a Win32 file and captures each one with win32_capture_stream().
- *
- * @path_utf16:  Path to the file (UTF-16LE).
- *
- * @path_utf16_nchars:  Number of 2-byte characters in @path_utf16.
- *
- * @inode:  WIM inode to save the streams into.
- *
- * @lookup_table:  Stream lookup table for the WIM.
- *
- * Returns 0 on success; nonzero on failure.  Stops at the first stream that
- * fails to be captured and returns that error code.
- */
-static int win32_capture_streams(const wchar_t *path_utf16,
-				 size_t path_utf16_nchars,
-				 struct wim_inode *inode,
-				 struct wim_lookup_table *lookup_table)
-{
-	WIN32_FIND_STREAM_DATA stream_data;
-	HANDLE find_handle;
-	DWORD last_error;
-	int ret;
-
-	find_handle = FindFirstStreamW(path_utf16, FindStreamInfoStandard,
-				       &stream_data, 0);
-	if (find_handle == INVALID_HANDLE_VALUE) {
-		last_error = GetLastError();
-
-		/* Seems legal for this to return ERROR_HANDLE_EOF on reparse
-		 * points and directories */
-		if (last_error == ERROR_HANDLE_EOF &&
-		    (inode->i_attributes & (FILE_ATTRIBUTE_REPARSE_POINT |
-					    FILE_ATTRIBUTE_DIRECTORY)))
-			return 0;
-
-		ERROR("Win32 API: Failed to look up data streams of \"%ls\"",
-		      path_utf16);
-		win32_error(last_error);
-		return WIMLIB_ERR_READ;
-	}
-
-	for (;;) {
-		ret = win32_capture_stream(path_utf16, path_utf16_nchars,
-					   inode, lookup_table, &stream_data);
-		if (ret)
-			break;
-
-		if (FindNextStreamW(find_handle, &stream_data))
-			continue;
-
-		/* Enumeration stopped; anything other than end-of-streams is
-		 * a read error. */
-		last_error = GetLastError();
-		if (last_error != ERROR_HANDLE_EOF) {
-			ERROR("Win32 API: Error reading data streams from \"%ls\"", path_utf16);
-			win32_error(last_error);
-			ret = WIMLIB_ERR_READ;
-		}
-		break;
-	}
-
-	FindClose(find_handle);
-	return ret;
-}
-
-#endif
-
-/*
- * build_dentry_tree():
- * Recursively builds a tree of WIM dentries from an on-disk directory
- * tree.
- *
- * @root_ret: Place to return a pointer to the root of the dentry tree. Only
- * modified if successful. Set to NULL if the file or directory was
- * excluded from capture.
- *
- * @root_disk_path: The path to the root of the directory tree on disk (UTF-8).
- *
- * @lookup_table: The lookup table for the WIM file. For each file added to the
- * dentry tree being built, an entry is added to the lookup table,
- * unless an identical stream is already in the lookup table.
- * These lookup table entries that are added point to the path of
- * the file on disk.
- *
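- * @sd:	Ignored in UNIX builds.  (Security data only captured in NTFS mode.)
- *		In Windows builds, stored in the sd_set that is created when
- *		@extra_arg is NULL.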
- *
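- * @config:
- *		Configuration for files to be excluded from capture.
- *
- * @add_image_flags:  Bitwise OR of WIMLIB_ADD_IMAGE_FLAG_* flags.
- *
- * @progress_func:
- *		If non-NULL and WIMLIB_ADD_IMAGE_FLAG_VERBOSE is set, called
- *		with WIMLIB_PROGRESS_MSG_SCAN_DENTRY for each path scanned,
- *		whether it was excluded or not.
- *
- * @extra_arg:	Ignored in UNIX builds; used to pass sd_set pointer in Windows
- *		builds.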
- *
- * @return: 0 on success, nonzero on failure. It is a failure if any of
- * the files cannot be `stat'ed, or if any of the needed
- * directories cannot be opened or read. Failure to add the files
- * to the WIM may still occur later when trying to actually read
- * the on-disk files during a call to wimlib_write() or
- * wimlib_overwrite().
- */
-static int build_dentry_tree(struct wim_dentry **root_ret,
- const char *root_disk_path,
- struct wim_lookup_table *lookup_table,
- struct wim_security_data *sd,
- const struct capture_config *config,
- int add_image_flags,
- wimlib_progress_func_t progress_func,
- void *extra_arg)
-{
- struct wim_dentry *root = NULL;
- int ret = 0;
- struct wim_inode *inode;
-
- if (exclude_path(root_disk_path, config, true)) {
- if (add_image_flags & WIMLIB_ADD_IMAGE_FLAG_ROOT) {
- ERROR("Cannot exclude the root directory from capture");
- ret = WIMLIB_ERR_INVALID_CAPTURE_CONFIG;
- goto out;
- }
- if ((add_image_flags & WIMLIB_ADD_IMAGE_FLAG_VERBOSE)
- && progress_func)
- {
- union wimlib_progress_info info;
- info.scan.cur_path = root_disk_path;
- info.scan.excluded = true;
- progress_func(WIMLIB_PROGRESS_MSG_SCAN_DENTRY, &info);
- }
- goto out;
- }
-
- if ((add_image_flags & WIMLIB_ADD_IMAGE_FLAG_VERBOSE)
- && progress_func)
- {
- union wimlib_progress_info info;
- info.scan.cur_path = root_disk_path;
- info.scan.excluded = false;
- progress_func(WIMLIB_PROGRESS_MSG_SCAN_DENTRY, &info);
- }
-
-#if !defined(__CYGWIN__) && !defined(__WIN32__)
- /* UNIX version of capturing a directory tree */
- struct stat root_stbuf;
- int (*stat_fn)(const char *restrict, struct stat *restrict);
- if (add_image_flags & WIMLIB_ADD_IMAGE_FLAG_DEREFERENCE)
- stat_fn = stat;
- else
- stat_fn = lstat;
-
- ret = (*stat_fn)(root_disk_path, &root_stbuf);
- if (ret != 0) {
- ERROR_WITH_ERRNO("Failed to stat `%s'", root_disk_path);
- goto out;
- }
-
- if ((add_image_flags & WIMLIB_ADD_IMAGE_FLAG_ROOT) &&
- !S_ISDIR(root_stbuf.st_mode))
- {
- /* Do a dereference-stat in case the root is a symbolic link.
- * This case is allowed, provided that the symbolic link points
- * to a directory. */
- ret = stat(root_disk_path, &root_stbuf);
- if (ret != 0) {
- ERROR_WITH_ERRNO("Failed to stat `%s'", root_disk_path);
- ret = WIMLIB_ERR_STAT;
- goto out;
- }
- if (!S_ISDIR(root_stbuf.st_mode)) {
- ERROR("`%s' is not a directory", root_disk_path);
- ret = WIMLIB_ERR_NOTDIR;
- goto out;
- }
- }
- if (!S_ISREG(root_stbuf.st_mode) && !S_ISDIR(root_stbuf.st_mode)
- && !S_ISLNK(root_stbuf.st_mode)) {
- ERROR("`%s' is not a regular file, directory, or symbolic link.",
- root_disk_path);
- ret = WIMLIB_ERR_SPECIAL_FILE;
- goto out;
- }
-
- root = new_dentry_with_timeless_inode(path_basename(root_disk_path));
- if (!root) {
- if (errno == EILSEQ)
- ret = WIMLIB_ERR_INVALID_UTF8_STRING;
- else if (errno == ENOMEM)
- ret = WIMLIB_ERR_NOMEM;
- else
- ret = WIMLIB_ERR_ICONV_NOT_AVAILABLE;
- goto out;
- }
-
- inode = root->d_inode;
-
-#ifdef HAVE_STAT_NANOSECOND_PRECISION
- inode->i_creation_time = timespec_to_wim_timestamp(&root_stbuf.st_mtim);
- inode->i_last_write_time = timespec_to_wim_timestamp(&root_stbuf.st_mtim);
- inode->i_last_access_time = timespec_to_wim_timestamp(&root_stbuf.st_atim);
-#else
- inode->i_creation_time = unix_timestamp_to_wim(root_stbuf.st_mtime);
- inode->i_last_write_time = unix_timestamp_to_wim(root_stbuf.st_mtime);
- inode->i_last_access_time = unix_timestamp_to_wim(root_stbuf.st_atime);
-#endif
- if (sizeof(ino_t) >= 8)
- inode->i_ino = (u64)root_stbuf.st_ino;
- else
- inode->i_ino = (u64)root_stbuf.st_ino |
- ((u64)root_stbuf.st_dev << ((sizeof(ino_t) * 8) & 63));
- inode->i_resolved = 1;
- if (add_image_flags & WIMLIB_ADD_IMAGE_FLAG_UNIX_DATA) {
- ret = inode_set_unix_data(inode, root_stbuf.st_uid,
- root_stbuf.st_gid,
- root_stbuf.st_mode,
- lookup_table,
- UNIX_DATA_ALL | UNIX_DATA_CREATE);
- if (ret)
- goto out;
- }
- add_image_flags &= ~(WIMLIB_ADD_IMAGE_FLAG_ROOT | WIMLIB_ADD_IMAGE_FLAG_SOURCE);
- if (S_ISREG(root_stbuf.st_mode)) { /* Archiving a regular file */
-
- struct wim_lookup_table_entry *lte;
- u8 hash[SHA1_HASH_SIZE];
-
- inode->i_attributes = FILE_ATTRIBUTE_NORMAL;
-
- /* Empty files do not have to have a lookup table entry. */
- if (root_stbuf.st_size == 0)
- goto out;
-
- /* For each regular file, we must check to see if the file is in
- * the lookup table already; if it is, we increment its refcnt;
- * otherwise, we create a new lookup table entry and insert it.
- * */
-
- ret = sha1sum(root_disk_path, hash);
- if (ret != 0)
- goto out;
-
- lte = __lookup_resource(lookup_table, hash);
- if (lte) {
- lte->refcnt++;
- DEBUG("Add lte reference %u for `%s'", lte->refcnt,
- root_disk_path);
- } else {
- char *file_on_disk = STRDUP(root_disk_path);
- if (!file_on_disk) {
- ERROR("Failed to allocate memory for file path");
- ret = WIMLIB_ERR_NOMEM;
- goto out;
- }
- lte = new_lookup_table_entry();
- if (!lte) {
- FREE(file_on_disk);
- ret = WIMLIB_ERR_NOMEM;
- goto out;
- }
- lte->file_on_disk = file_on_disk;
- lte->resource_location = RESOURCE_IN_FILE_ON_DISK;
- lte->resource_entry.original_size = root_stbuf.st_size;
- lte->resource_entry.size = root_stbuf.st_size;
- copy_hash(lte->hash, hash);
- lookup_table_insert(lookup_table, lte);
- }
- root->d_inode->i_lte = lte;
- } else if (S_ISDIR(root_stbuf.st_mode)) { /* Archiving a directory */
-
- inode->i_attributes = FILE_ATTRIBUTE_DIRECTORY;
-
- DIR *dir;
- struct dirent entry, *result;
- struct wim_dentry *child;
-
- dir = opendir(root_disk_path);
- if (!dir) {
- ERROR_WITH_ERRNO("Failed to open the directory `%s'",
- root_disk_path);
- ret = WIMLIB_ERR_OPEN;
- goto out;
- }
-
- /* Buffer for names of files in directory. */
- size_t len = strlen(root_disk_path);
- char name[len + 1 + FILENAME_MAX + 1];
- memcpy(name, root_disk_path, len);
- name[len] = '/';
-
- /* Create a dentry for each entry in the directory on disk, and recurse
- * to any subdirectories. */
- while (1) {
- errno = 0;
- ret = readdir_r(dir, &entry, &result);
- if (ret != 0) {
- ret = WIMLIB_ERR_READ;
- ERROR_WITH_ERRNO("Error reading the "
- "directory `%s'",
- root_disk_path);
- break;
- }
- if (result == NULL)
- break;
- if (result->d_name[0] == '.' && (result->d_name[1] == '\0'
- || (result->d_name[1] == '.' && result->d_name[2] == '\0')))
- continue;
- strcpy(name + len + 1, result->d_name);
- ret = build_dentry_tree(&child, name, lookup_table,
- NULL, config, add_image_flags,
- progress_func, NULL);
- if (ret != 0)
- break;
- if (child)
- dentry_add_child(root, child);
- }
- closedir(dir);
- } else { /* Archiving a symbolic link */
- inode->i_attributes = FILE_ATTRIBUTE_REPARSE_POINT;
- inode->i_reparse_tag = WIM_IO_REPARSE_TAG_SYMLINK;
-
- /* The idea here is to call readlink() to get the UNIX target of
- * the symbolic link, then turn the target into a reparse point
- * data buffer that contains a relative or absolute symbolic
- * link (NOT a junction point or *full* path symbolic link with
- * drive letter).
- */
-
- char deref_name_buf[4096];
- ssize_t deref_name_len;
-
- deref_name_len = readlink(root_disk_path, deref_name_buf,
- sizeof(deref_name_buf) - 1);
- if (deref_name_len >= 0) {
- deref_name_buf[deref_name_len] = '\0';
- DEBUG("Read symlink `%s'", deref_name_buf);
- ret = inode_set_symlink(root->d_inode, deref_name_buf,
- lookup_table, NULL);
- if (ret == 0) {
- /*
- * Unfortunately, Windows seems to have the
- * concept of "file" symbolic links as being
- * different from "directory" symbolic links...
- * so FILE_ATTRIBUTE_DIRECTORY needs to be set
- * on the symbolic link if the *target* of the
- * symbolic link is a directory.
- */
- struct stat stbuf;
- if (stat(root_disk_path, &stbuf) == 0 &&
- S_ISDIR(stbuf.st_mode))
- {
- inode->i_attributes |= FILE_ATTRIBUTE_DIRECTORY;
- }
- }
- } else {
- ERROR_WITH_ERRNO("Failed to read target of "
- "symbolic link `%s'", root_disk_path);
- ret = WIMLIB_ERR_READLINK;
- }
- }
-#else
- /* Win32 version of capturing a directory tree */
-
- wchar_t *path_utf16;
- size_t path_utf16_nchars;
- struct sd_set *sd_set;
- DWORD err;
-
- if (extra_arg == NULL) {
- sd_set = alloca(sizeof(struct sd_set));
- sd_set->rb_root.rb_node = NULL,
- sd_set->sd = sd;
- } else {
- sd_set = extra_arg;
- }
-
- ret = utf8_to_utf16(root_disk_path, strlen(root_disk_path),
- (char**)&path_utf16, &path_utf16_nchars);
- if (ret)