wimlib.net Git - wimlib/blob - src/inode.c

   1 /*
   2  * inode.c
   3  *
   4  * Functions that operate on WIM inodes.
   5  *
   6  * See dentry.c for a description of the relationship between WIM dentries and
   7  * WIM inodes.
   8  */
   9
  10 /*
  11  * Copyright (C) 2012, 2013, 2014 Eric Biggers
  12  *
  13  * This file is part of wimlib, a library for working with WIM files.
  14  *
  15  * wimlib is free software; you can redistribute it and/or modify it under the
  16  * terms of the GNU General Public License as published by the Free
  17  * Software Foundation; either version 3 of the License, or (at your option)
  18  * any later version.
  19  *
  20  * wimlib is distributed in the hope that it will be useful, but WITHOUT ANY
  21  * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
  22  * A PARTICULAR PURPOSE. See the GNU General Public License for more
  23  * details.
  24  *
  25  * You should have received a copy of the GNU General Public License
  26  * along with wimlib; if not, see http://www.gnu.org/licenses/.
  27  */
  28
  29 #ifdef HAVE_CONFIG_H
  30 #  include "config.h"
  31 #endif
  32
  33 #include "wimlib/assert.h"
  34 #include "wimlib/dentry.h" /* Only for dentry_full_path().  Otherwise the code
  35                               in this file doesn't care about file names/paths.
  36                             */
  37 #include "wimlib/encoding.h"
  38 #include "wimlib/endianness.h"
  39 #include "wimlib/error.h"
  40 #include "wimlib/inode.h"
  41 #include "wimlib/inode_table.h"
  42 #include "wimlib/lookup_table.h"
  43 #include "wimlib/security.h"
  44 #include "wimlib/timestamp.h"
  45
  46 #include <errno.h>
  47
  48 /* Allocate a new inode.  Set the timestamps to the current time.  */
  49 struct wim_inode *
  50 new_inode(void)
  51 {
  52         struct wim_inode *inode = new_timeless_inode();
  53         if (inode) {
  54                 u64 now = get_wim_timestamp();
  55                 inode->i_creation_time = now;
  56                 inode->i_last_access_time = now;
  57                 inode->i_last_write_time = now;
  58         }
  59         return inode;
  60 }
  61
  62 /* Allocate a new inode.  Leave the timestamps zeroed out.  */
  63 struct wim_inode *
  64 new_timeless_inode(void)
  65 {
  66         struct wim_inode *inode = CALLOC(1, sizeof(struct wim_inode));
  67         if (inode) {
  68                 inode->i_security_id = -1;
  69                 inode->i_nlink = 1;
  70                 inode->i_next_stream_id = 1;
  71                 inode->i_not_rpfixed = 1;
  72                 inode->i_canonical_streams = 1;
  73                 INIT_LIST_HEAD(&inode->i_list);
  74                 INIT_LIST_HEAD(&inode->i_dentry);
  75         }
  76         return inode;
  77 }
  78
  79 /* Decrement link count on an inode.  */
  80 void
  81 put_inode(struct wim_inode *inode)
  82 {
  83         wimlib_assert(inode->i_nlink != 0);
  84         if (--inode->i_nlink == 0) {
  85                 /* If FUSE mounts are enabled, we must keep a unlinked inode
  86                  * around until all file descriptors to it have been closed.  */
  87         #ifdef WITH_FUSE
  88                 if (inode->i_num_opened_fds == 0)
  89         #endif
  90                         free_inode(inode);
  91         }
  92 }
  93
  94 /* Free memory allocated within an alternate data stream entry.  */
  95 static void
  96 destroy_ads_entry(struct wim_ads_entry *ads_entry)
  97 {
  98         FREE(ads_entry->stream_name);
  99 }
 100
 101 /* Free an inode.  Only use this if there can't be other links to the inode or
 102  * if it doesn't matter if there are.  */
 103 void
 104 free_inode(struct wim_inode *inode)
 105 {
 106         if (unlikely(!inode))
 107                 return;
 108
 109         if (unlikely(inode->i_ads_entries)) {
 110                 for (u16 i = 0; i < inode->i_num_ads; i++)
 111                         destroy_ads_entry(&inode->i_ads_entries[i]);
 112                 FREE(inode->i_ads_entries);
 113         }
 114         if (unlikely(inode->i_extra))
 115                 FREE(inode->i_extra);
 116         /* HACK: This may instead delete the inode from i_list, but hlist_del()
 117          * behaves the same as list_del(). */
 118         if (!hlist_unhashed(&inode->i_hlist))
 119                 hlist_del(&inode->i_hlist);
 120         FREE(inode);
 121 }
 122
 123 /* Return %true iff the alternate data stream entry @entry has the UTF-16LE
 124  * stream name @name that has length @name_nbytes bytes.  */
 125 static inline bool
 126 ads_entry_has_name(const struct wim_ads_entry *entry,
 127                    const utf16lechar *name, size_t name_nbytes,
 128                    bool ignore_case)
 129 {
 130         return 0 == cmp_utf16le_strings(name,
 131                                         name_nbytes / 2,
 132                                         entry->stream_name,
 133                                         entry->stream_name_nbytes / 2,
 134                                         ignore_case);
 135 }
 136
 137 /*
 138  * Returns the alternate data stream entry belonging to @inode that has the
 139  * stream name @stream_name, or NULL if the inode has no alternate data stream
 140  * with that name.
 141  *
 142  * If @p stream_name is the empty string, NULL is returned --- that is, this
 143  * function will not return "unnamed" alternate data stream entries.
 144  *
 145  * If NULL is returned, errno is set.
 146  */
 147 struct wim_ads_entry *
 148 inode_get_ads_entry(struct wim_inode *inode, const tchar *stream_name)
 149 {
 150         int ret;
 151         const utf16lechar *stream_name_utf16le;
 152         size_t stream_name_utf16le_nbytes;
 153         u16 i;
 154         struct wim_ads_entry *result;
 155
 156         if (inode->i_num_ads == 0) {
 157                 errno = ENOENT;
 158                 return NULL;
 159         }
 160
 161         if (stream_name[0] == T('\0')) {
 162                 errno = ENOENT;
 163                 return NULL;
 164         }
 165
 166         ret = tstr_get_utf16le_and_len(stream_name, &stream_name_utf16le,
 167                                        &stream_name_utf16le_nbytes);
 168         if (ret)
 169                 return NULL;
 170
 171         i = 0;
 172         result = NULL;
 173         do {
 174                 if (ads_entry_has_name(&inode->i_ads_entries[i],
 175                                        stream_name_utf16le,
 176                                        stream_name_utf16le_nbytes,
 177                                        default_ignore_case))
 178                 {
 179                         result = &inode->i_ads_entries[i];
 180                         break;
 181                 }
 182         } while (++i != inode->i_num_ads);
 183
 184         tstr_put_utf16le(stream_name_utf16le);
 185
 186         if (!result)
 187                 errno = ENOENT;
 188         return result;
 189 }
 190
 191 static struct wim_ads_entry *
 192 do_inode_add_ads(struct wim_inode *inode,
 193                  utf16lechar *stream_name, size_t stream_name_nbytes)
 194 {
 195         u16 num_ads;
 196         struct wim_ads_entry *ads_entries;
 197         struct wim_ads_entry *new_entry;
 198
 199         if (inode->i_num_ads >= 0xfffe) {
 200                 ERROR("File \"%"TS"\" has too many alternate data streams!",
 201                       inode_first_full_path(inode));
 202                 errno = EFBIG;
 203                 return NULL;
 204         }
 205         num_ads = inode->i_num_ads + 1;
 206         ads_entries = REALLOC(inode->i_ads_entries,
 207                               num_ads * sizeof(inode->i_ads_entries[0]));
 208         if (!ads_entries)
 209                 return NULL;
 210
 211         inode->i_ads_entries = ads_entries;
 212
 213         new_entry = &inode->i_ads_entries[num_ads - 1];
 214
 215         memset(new_entry, 0, sizeof(struct wim_ads_entry));
 216         new_entry->stream_name = stream_name;
 217         new_entry->stream_name_nbytes = stream_name_nbytes;
 218         new_entry->stream_id = inode->i_next_stream_id++;
 219         inode->i_num_ads = num_ads;
 220         return new_entry;
 221 }
 222
 223 /*
 224  * Add an alternate data stream entry to a WIM inode (UTF-16LE version).  On
 225  * success, returns a pointer to the new entry.  Note that this pointer might
 226  * become invalid if another ADS entry is added to the inode.  On failure,
 227  * returns NULL and sets errno.
 228  */
 229 struct wim_ads_entry *
 230 inode_add_ads_utf16le(struct wim_inode *inode,
 231                       const utf16lechar *stream_name, size_t stream_name_nbytes)
 232 {
 233         utf16lechar *dup = NULL;
 234         struct wim_ads_entry *result;
 235
 236         if (stream_name_nbytes) {
 237                 dup = utf16le_dupz(stream_name, stream_name_nbytes);
 238                 if (!dup)
 239                         return NULL;
 240         }
 241
 242         result = do_inode_add_ads(inode, dup, stream_name_nbytes);
 243         if (!result)
 244                 FREE(dup);
 245         return result;
 246 }
 247
 248 /*
 249  * Add an alternate data stream entry to a WIM inode (tchar version).  On
 250  * success, returns a pointer to the new entry.  Note that this pointer might
 251  * become invalid if another ADS entry is added to the inode.  On failure,
 252  * returns NULL and sets errno.
 253  */
 254 struct wim_ads_entry *
 255 inode_add_ads(struct wim_inode *inode, const tchar *stream_name)
 256 {
 257         utf16lechar *stream_name_utf16le = NULL;
 258         size_t stream_name_utf16le_nbytes = 0;
 259         struct wim_ads_entry *result;
 260
 261         if (stream_name && *stream_name)
 262                 if (tstr_to_utf16le(stream_name,
 263                                     tstrlen(stream_name) * sizeof(tchar),
 264                                     &stream_name_utf16le,
 265                                     &stream_name_utf16le_nbytes))
 266                         return NULL;
 267
 268         result = do_inode_add_ads(inode, stream_name_utf16le,
 269                                   stream_name_utf16le_nbytes);
 270         if (!result)
 271                 FREE(stream_name_utf16le);
 272         return result;
 273 }
 274
 275 /*
 276  * Add an data alternate stream entry to a WIM inode, where the contents of the
 277  * new stream are specified in a data buffer.  The inode must be resolved.
 278  *
 279  * On success, returns a pointer to the new alternate data stream entry.  Note
 280  * that this pointer might become invalid if another ADS entry is added to the
 281  * inode.  On failure, returns NULL and sets errno.
 282  */
 283 struct wim_ads_entry *
 284 inode_add_ads_with_data(struct wim_inode *inode, const tchar *name,
 285                         const void *value, size_t size,
 286                         struct wim_lookup_table *lookup_table)
 287 {
 288         struct wim_ads_entry *new_entry;
 289
 290         wimlib_assert(inode->i_resolved);
 291
 292         new_entry = inode_add_ads(inode, name);
 293         if (!new_entry)
 294                 return NULL;
 295
 296         new_entry->lte = new_stream_from_data_buffer(value, size, lookup_table);
 297         if (!new_entry->lte) {
 298                 inode_remove_ads(inode, new_entry, NULL);
 299                 return NULL;
 300         }
 301         return new_entry;
 302 }
 303
 304 /*
 305  * Does the inode have any named data streams?
 306  */
 307 bool
 308 inode_has_named_stream(const struct wim_inode *inode)
 309 {
 310         for (u16 i = 0; i < inode->i_num_ads; i++)
 311                 if (ads_entry_is_named_stream(&inode->i_ads_entries[i]))
 312                         return true;
 313         return false;
 314 }
 315
 316 /* Set the unnamed stream of a WIM inode, given a data buffer containing the
 317  * stream contents.  The inode must be resolved and cannot have an unnamed
 318  * stream specified already.  */
 319 int
 320 inode_set_unnamed_stream(struct wim_inode *inode, const void *data, size_t len,
 321                          struct wim_lookup_table *lookup_table)
 322 {
 323         wimlib_assert(inode->i_resolved);
 324         wimlib_assert(!inode->i_lte);
 325         inode->i_lte = new_stream_from_data_buffer(data, len, lookup_table);
 326         if (!inode->i_lte)
 327                 return WIMLIB_ERR_NOMEM;
 328         return 0;
 329 }
 330
 331 /* Remove an alternate data stream from a WIM inode.  */
 332 void
 333 inode_remove_ads(struct wim_inode *inode, struct wim_ads_entry *entry,
 334                  struct wim_lookup_table *lookup_table)
 335 {
 336         struct wim_lookup_table_entry *lte;
 337         unsigned idx = entry - inode->i_ads_entries;
 338
 339         wimlib_assert(idx < inode->i_num_ads);
 340         wimlib_assert(inode->i_resolved);
 341
 342         lte = entry->lte;
 343         if (lte)
 344                 lte_decrement_refcnt(lte, lookup_table);
 345
 346         destroy_ads_entry(entry);
 347
 348         memmove(&inode->i_ads_entries[idx],
 349                 &inode->i_ads_entries[idx + 1],
 350                 (inode->i_num_ads - idx - 1) * sizeof(inode->i_ads_entries[0]));
 351         inode->i_num_ads--;
 352 }
 353
 354 /*
 355  * Resolve an inode's single-instance streams.
 356  *
 357  * This takes each SHA-1 message digest stored in the inode or one of its ADS
 358  * entries and replaces it with a pointer directly to the appropriate 'struct
 359  * wim_lookup_table_entry' currently inserted into @table to represent the
 360  * single-instance stream having that SHA-1 message digest.
 361  *
 362  * If @force is %false:
 363  *      If any of the needed single-instance streams do not exist in @table,
 364  *      return WIMLIB_ERR_RESOURCE_NOT_FOUND and leave the inode unmodified.
 365  * If @force is %true:
 366  *      If any of the needed single-instance streams do not exist in @table,
 367  *      allocate new entries for them and insert them into @table.  This does
 368  *      not, of course, cause these streams to magically exist, but this is
 369  *      needed by the code for extraction from a pipe.
 370  *
 371  * If the inode is already resolved, this function does nothing.
 372  *
 373  * Returns 0 on success; WIMLIB_ERR_NOMEM if out of memory; or
 374  * WIMLIB_ERR_RESOURCE_NOT_FOUND if @force is %false and at least one
 375  * single-instance stream referenced by the inode was missing.
 376  */
 377 int
 378 inode_resolve_streams(struct wim_inode *inode, struct wim_lookup_table *table,
 379                       bool force)
 380 {
 381         const u8 *hash;
 382         struct wim_lookup_table_entry *lte, *ads_lte;
 383
 384         if (inode->i_resolved)
 385                 return 0;
 386
 387         struct wim_lookup_table_entry *ads_ltes[inode->i_num_ads];
 388
 389         /* Resolve the default data stream */
 390         lte = NULL;
 391         hash = inode->i_hash;
 392         if (!is_zero_hash(hash)) {
 393                 lte = lookup_stream(table, hash);
 394                 if (!lte) {
 395                         if (force) {
 396                                 lte = new_lookup_table_entry();
 397                                 if (!lte)
 398                                         return WIMLIB_ERR_NOMEM;
 399                                 copy_hash(lte->hash, hash);
 400                                 lookup_table_insert(table, lte);
 401                         } else {
 402                                 goto stream_not_found;
 403                         }
 404                 }
 405         }
 406
 407         /* Resolve the alternate data streams */
 408         for (u16 i = 0; i < inode->i_num_ads; i++) {
 409                 struct wim_ads_entry *cur_entry;
 410
 411                 ads_lte = NULL;
 412                 cur_entry = &inode->i_ads_entries[i];
 413                 hash = cur_entry->hash;
 414                 if (!is_zero_hash(hash)) {
 415                         ads_lte = lookup_stream(table, hash);
 416                         if (!ads_lte) {
 417                                 if (force) {
 418                                         ads_lte = new_lookup_table_entry();
 419                                         if (!ads_lte)
 420                                                 return WIMLIB_ERR_NOMEM;
 421                                         copy_hash(ads_lte->hash, hash);
 422                                         lookup_table_insert(table, ads_lte);
 423                                 } else {
 424                                         goto stream_not_found;
 425                                 }
 426                         }
 427                 }
 428                 ads_ltes[i] = ads_lte;
 429         }
 430         inode->i_lte = lte;
 431         for (u16 i = 0; i < inode->i_num_ads; i++)
 432                 inode->i_ads_entries[i].lte = ads_ltes[i];
 433         inode->i_resolved = 1;
 434         return 0;
 435
 436 stream_not_found:
 437         return stream_not_found_error(inode, hash);
 438 }
 439
 440 /*
 441  * Undo the effects of inode_resolve_streams().
 442  *
 443  * If the inode is not resolved, this function does nothing.
 444  */
 445 void
 446 inode_unresolve_streams(struct wim_inode *inode)
 447 {
 448         if (!inode->i_resolved)
 449                 return;
 450
 451         if (inode->i_lte)
 452                 copy_hash(inode->i_hash, inode->i_lte->hash);
 453         else
 454                 zero_out_hash(inode->i_hash);
 455
 456         for (u16 i = 0; i < inode->i_num_ads; i++) {
 457                 if (inode->i_ads_entries[i].lte)
 458                         copy_hash(inode->i_ads_entries[i].hash,
 459                                   inode->i_ads_entries[i].lte->hash);
 460                 else
 461                         zero_out_hash(inode->i_ads_entries[i].hash);
 462         }
 463         inode->i_resolved = 0;
 464 }
 465
 466 int
 467 stream_not_found_error(const struct wim_inode *inode, const u8 *hash)
 468 {
 469         if (wimlib_print_errors) {
 470                 tchar hashstr[SHA1_HASH_SIZE * 2 + 1];
 471
 472                 sprint_hash(hash, hashstr);
 473
 474                 ERROR("\"%"TS"\": stream not found\n"
 475                       "        SHA-1 message digest of missing stream:\n"
 476                       "        %"TS"",
 477                       inode_first_full_path(inode), hashstr);
 478         }
 479         return WIMLIB_ERR_RESOURCE_NOT_FOUND;
 480 }
 481
 482 /*
 483  * Return the lookup table entry for stream @stream_idx of the inode, where
 484  * stream_idx = 0 means the default un-named file stream, and stream_idx >= 1
 485  * corresponds to an alternate data stream.
 486  *
 487  * This works for both resolved and un-resolved inodes.
 488  */
 489 struct wim_lookup_table_entry *
 490 inode_stream_lte(const struct wim_inode *inode, unsigned stream_idx,
 491                  const struct wim_lookup_table *table)
 492 {
 493         if (inode->i_resolved)
 494                 return inode_stream_lte_resolved(inode, stream_idx);
 495         else
 496                 return inode_stream_lte_unresolved(inode, stream_idx, table);
 497 }
 498
 499 /*
 500  * Return the lookup table entry for the unnamed data stream of a *resolved*
 501  * inode, or NULL if there is none.  Also return the 0-based index of the
 502  * corresponding stream in *stream_idx_ret.
 503  */
 504 struct wim_lookup_table_entry *
 505 inode_unnamed_stream_resolved(const struct wim_inode *inode, u16 *stream_idx_ret)
 506 {
 507         wimlib_assert(inode->i_resolved);
 508         for (unsigned i = 0; i <= inode->i_num_ads; i++) {
 509                 if (inode_stream_name_nbytes(inode, i) == 0 &&
 510                     !is_zero_hash(inode_stream_hash_resolved(inode, i)))
 511                 {
 512                         *stream_idx_ret = i;
 513                         return inode_stream_lte_resolved(inode, i);
 514                 }
 515         }
 516         *stream_idx_ret = 0;
 517         return NULL;
 518 }
 519
 520 /*
 521  * Return the lookup table entry for the unnamed data stream of a *resolved*
 522  * inode, or NULL if there is none.
 523  */
 524 struct wim_lookup_table_entry *
 525 inode_unnamed_lte_resolved(const struct wim_inode *inode)
 526 {
 527         u16 stream_idx;
 528         return inode_unnamed_stream_resolved(inode, &stream_idx);
 529 }
 530
 531 /*
 532  * Return the lookup table entry for the unnamed data stream of an *unresolved*
 533  * inode, or NULL if there is none.
 534  */
 535 struct wim_lookup_table_entry *
 536 inode_unnamed_lte_unresolved(const struct wim_inode *inode,
 537                              const struct wim_lookup_table *table)
 538 {
 539         wimlib_assert(!inode->i_resolved);
 540         for (unsigned i = 0; i <= inode->i_num_ads; i++) {
 541                 if (inode_stream_name_nbytes(inode, i) == 0 &&
 542                     !is_zero_hash(inode_stream_hash_unresolved(inode, i)))
 543                 {
 544                         return inode_stream_lte_unresolved(inode, i, table);
 545                 }
 546         }
 547         return NULL;
 548 }
 549
 550 /*
 551  * Return the lookup table entry for the unnamed data stream of an inode, or
 552  * NULL if there is none.
 553  *
 554  * You'd think this would be easier than it actually is, since the unnamed data
 555  * stream should be the one referenced from the inode itself.  Alas, if there
 556  * are named data streams, Microsoft's "imagex.exe" program will put the unnamed
 557  * data stream in one of the alternate data streams instead of inside the WIM
 558  * dentry itself.  So we need to check the alternate data streams too.
 559  *
 560  * Also, note that a dentry may appear to have more than one unnamed stream, but
 561  * if the SHA-1 message digest is all 0's then the corresponding stream does not
 562  * really "count" (this is the case for the inode's own file stream when the
 563  * file stream that should be there is actually in one of the alternate stream
 564  * entries.).  This is despite the fact that we may need to extract such a
 565  * missing entry as an empty file or empty named data stream.
 566  */
 567 struct wim_lookup_table_entry *
 568 inode_unnamed_lte(const struct wim_inode *inode,
 569                   const struct wim_lookup_table *table)
 570 {
 571         if (inode->i_resolved)
 572                 return inode_unnamed_lte_resolved(inode);
 573         else
 574                 return inode_unnamed_lte_unresolved(inode, table);
 575 }
 576
 577 /*
 578  * Return the SHA-1 message digest of the unnamed data stream of a WIM inode.
 579  *
 580  * If inode does not have an unnamed data stream, this returns a void SHA-1
 581  * message digest containing all zero bytes.
 582  */
 583 const u8 *
 584 inode_unnamed_stream_hash(const struct wim_inode *inode)
 585 {
 586         const u8 *hash;
 587
 588         for (unsigned i = 0; i <= inode->i_num_ads; i++) {
 589                 if (inode_stream_name_nbytes(inode, i) == 0) {
 590                         hash = inode_stream_hash(inode, i);
 591                         if (!is_zero_hash(hash))
 592                                 return hash;
 593                 }
 594         }
 595         return zero_hash;
 596 }
 597
 598 /*
 599  * Translate a single-instance stream entry into the pointer contained in the
 600  * inode (or ads entry of an inode) that references it.
 601  *
 602  * This is only possible for "unhashed" streams, which are guaranteed to have
 603  * only one reference, and that reference is guaranteed to be in a resolved
 604  * inode.  (It can't be in an unresolved inode, since that would imply the hash
 605  * is known!)
 606  */
 607 struct wim_lookup_table_entry **
 608 retrieve_lte_pointer(struct wim_lookup_table_entry *lte)
 609 {
 610         wimlib_assert(lte->unhashed);
 611         struct wim_inode *inode = lte->back_inode;
 612         u32 stream_id = lte->back_stream_id;
 613         if (stream_id == 0)
 614                 return &inode->i_lte;
 615         else
 616                 for (u16 i = 0; i < inode->i_num_ads; i++)
 617                         if (inode->i_ads_entries[i].stream_id == stream_id)
 618                                 return &inode->i_ads_entries[i].lte;
 619         wimlib_assert(0);
 620         return NULL;
 621 }
 622
 623 /*
 624  * Read the alternate data stream entries of a WIM dentry.
 625  *
 626  * @p:
 627  *      Pointer to buffer that starts with the first alternate stream entry.
 628  *
 629  * @inode:
 630  *      Inode to load the alternate data streams into.  @inode->i_num_ads must
 631  *      have been set to the number of alternate data streams that are expected.
 632  *
 633  * @nbytes_remaining_p:
 634  *      Number of bytes of data remaining in the buffer pointed to by @p.
 635  *      On success this will be updated to point just past the ADS entries.
 636  *
 637  * On success, inode->i_ads_entries is set to an array of `struct
 638  * wim_ads_entry's of length inode->i_num_ads.  On failure, @inode is not
 639  * modified.
 640  *
 641  * Return values:
 642  *      WIMLIB_ERR_SUCCESS (0)
 643  *      WIMLIB_ERR_INVALID_METADATA_RESOURCE
 644  *      WIMLIB_ERR_NOMEM
 645  */
 646 int
 647 read_ads_entries(const u8 * restrict p, struct wim_inode * restrict inode,
 648                  size_t *nbytes_remaining_p)
 649 {
 650         size_t nbytes_remaining = *nbytes_remaining_p;
 651         u16 num_ads;
 652         struct wim_ads_entry *ads_entries;
 653         int ret;
 654
 655         BUILD_BUG_ON(sizeof(struct wim_ads_entry_on_disk) != WIM_ADS_ENTRY_DISK_SIZE);
 656
 657         /* Allocate an array for our in-memory representation of the alternate
 658          * data stream entries. */
 659         num_ads = inode->i_num_ads;
 660         ads_entries = CALLOC(num_ads, sizeof(inode->i_ads_entries[0]));
 661         if (!ads_entries)
 662                 goto out_of_memory;
 663
 664         /* Read the entries into our newly allocated buffer. */
 665         for (u16 i = 0; i < num_ads; i++) {
 666                 u64 length;
 667                 struct wim_ads_entry *cur_entry;
 668                 const struct wim_ads_entry_on_disk *disk_entry =
 669                         (const struct wim_ads_entry_on_disk*)p;
 670
 671                 cur_entry = &ads_entries[i];
 672                 ads_entries[i].stream_id = i + 1;
 673
 674                 /* Do we have at least the size of the fixed-length data we know
 675                  * need? */
 676                 if (nbytes_remaining < sizeof(struct wim_ads_entry_on_disk))
 677                         goto out_invalid;
 678
 679                 /* Read the length field */
 680                 length = le64_to_cpu(disk_entry->length);
 681
 682                 /* Make sure the length field is neither so small it doesn't
 683                  * include all the fixed-length data nor so large it overflows
 684                  * the metadata resource buffer. */
 685                 if (length < sizeof(struct wim_ads_entry_on_disk) ||
 686                     length > nbytes_remaining)
 687                         goto out_invalid;
 688
 689                 /* Read the rest of the fixed-length data. */
 690
 691                 cur_entry->reserved = le64_to_cpu(disk_entry->reserved);
 692                 copy_hash(cur_entry->hash, disk_entry->hash);
 693                 cur_entry->stream_name_nbytes = le16_to_cpu(disk_entry->stream_name_nbytes);
 694
 695                 /* If stream_name_nbytes != 0, this is a named stream.
 696                  * Otherwise this is an unnamed stream, or in some cases (bugs
 697                  * in Microsoft's software I guess) a meaningless entry
 698                  * distinguished from the real unnamed stream entry, if any, by
 699                  * the fact that the real unnamed stream entry has a nonzero
 700                  * hash field. */
 701                 if (cur_entry->stream_name_nbytes) {
 702                         /* The name is encoded in UTF16-LE, which uses 2-byte
 703                          * coding units, so the length of the name had better be
 704                          * an even number of bytes... */
 705                         if (cur_entry->stream_name_nbytes & 1)
 706                                 goto out_invalid;
 707
 708                         /* Add the length of the stream name to get the length
 709                          * we actually need to read.  Make sure this isn't more
 710                          * than the specified length of the entry. */
 711                         if (sizeof(struct wim_ads_entry_on_disk) +
 712                             cur_entry->stream_name_nbytes > length)
 713                                 goto out_invalid;
 714
 715                         cur_entry->stream_name = utf16le_dupz(disk_entry->stream_name,
 716                                                               cur_entry->stream_name_nbytes);
 717                         if (!cur_entry->stream_name)
 718                                 goto out_of_memory;
 719                 } else {
 720                         /* Mark inode as having weird stream entries.  */
 721                         inode->i_canonical_streams = 0;
 722                 }
 723
 724                 /* It's expected that the size of every ADS entry is a multiple
 725                  * of 8.  However, to be safe, I'm allowing the possibility of
 726                  * an ADS entry at the very end of the metadata resource ending
 727                  * un-aligned.  So although we still need to increment the input
 728                  * pointer by @length to reach the next ADS entry, it's possible
 729                  * that less than @length is actually remaining in the metadata
 730                  * resource. We should set the remaining bytes to 0 if this
 731                  * happens. */
 732                 length = (length + 7) & ~7;
 733                 p += length;
 734                 if (nbytes_remaining < length)
 735                         nbytes_remaining = 0;
 736                 else
 737                         nbytes_remaining -= length;
 738         }
 739         inode->i_ads_entries = ads_entries;
 740         inode->i_next_stream_id = inode->i_num_ads + 1;
 741         *nbytes_remaining_p = nbytes_remaining;
 742         ret = 0;
 743         goto out;
 744 out_of_memory:
 745         ret = WIMLIB_ERR_NOMEM;
 746         goto out_free_ads_entries;
 747 out_invalid:
 748         ERROR("An alternate data stream entry is invalid");
 749         ret = WIMLIB_ERR_INVALID_METADATA_RESOURCE;
 750 out_free_ads_entries:
 751         if (ads_entries) {
 752                 for (u16 i = 0; i < num_ads; i++)
 753                         destroy_ads_entry(&ads_entries[i]);
 754                 FREE(ads_entries);
 755         }
 756 out:
 757         return ret;
 758 }
 759
 760 /* Check a WIM inode for unusual field values.  */
 761 void
 762 check_inode(struct wim_inode *inode, const struct wim_security_data *sd)
 763 {
 764         /* Check the security ID.  -1 is valid and means "no security
 765          * descriptor".  Anything else has to be a valid index into the WIM
 766          * image's security descriptors table. */
 767         if (inode->i_security_id < -1 ||
 768             (inode->i_security_id >= 0 &&
 769              inode->i_security_id >= sd->num_entries))
 770         {
 771                 WARNING("\"%"TS"\" has an invalid security ID (%d)",
 772                         inode_first_full_path(inode), inode->i_security_id);
 773                 inode->i_security_id = -1;
 774         }
 775
 776         /* Make sure there is only one unnamed data stream. */
 777         unsigned num_unnamed_streams = 0;
 778         for (unsigned i = 0; i <= inode->i_num_ads; i++) {
 779                 const u8 *hash;
 780                 hash = inode_stream_hash(inode, i);
 781                 if (inode_stream_name_nbytes(inode, i) == 0 && !is_zero_hash(hash))
 782                         num_unnamed_streams++;
 783         }
 784         if (num_unnamed_streams > 1) {
 785                 WARNING("\"%"TS"\" has multiple (%u) un-named streams",
 786                         inode_first_full_path(inode), num_unnamed_streams);
 787                 /* We currently don't treat this as an error and will just end
 788                  * up using the first unnamed data stream in the inode.  */
 789         }
 790 }
 791
 792 /* Acquire another reference to each single-instance stream referenced by this
 793  * inode.  This is necessary when creating a hard link to this inode.
 794  *
 795  * The inode must be resolved.  */
 796 void
 797 inode_ref_streams(struct wim_inode *inode)
 798 {
 799         for (unsigned i = 0; i <= inode->i_num_ads; i++) {
 800                 struct wim_lookup_table_entry *lte;
 801
 802                 lte = inode_stream_lte_resolved(inode, i);
 803                 if (lte)
 804                         lte->refcnt++;
 805         }
 806 }
 807
 808 /* Drop a reference to each single-instance stream referenced by this inode.
 809  * This is necessary when deleting a hard link to this inode.  */
 810 void
 811 inode_unref_streams(struct wim_inode *inode,
 812                     struct wim_lookup_table *lookup_table)
 813 {
 814         for (unsigned i = 0; i <= inode->i_num_ads; i++) {
 815                 struct wim_lookup_table_entry *lte;
 816
 817                 lte = inode_stream_lte(inode, i, lookup_table);
 818                 if (lte)
 819                         lte_decrement_refcnt(lte, lookup_table);
 820         }
 821 }
 822
 823 /* Initialize a hash table for hard link detection.  */
 824 int
 825 init_inode_table(struct wim_inode_table *table, size_t capacity)
 826 {
 827         table->array = CALLOC(capacity, sizeof(table->array[0]));
 828         if (!table->array)
 829                 return WIMLIB_ERR_NOMEM;
 830         table->num_entries  = 0;
 831         table->capacity  = capacity;
 832         INIT_LIST_HEAD(&table->extra_inodes);
 833         return 0;
 834 }
 835
 836 /* Free the memory allocated by init_inode_table().  */
 837 void
 838 destroy_inode_table(struct wim_inode_table *table)
 839 {
 840         FREE(table->array);
 841 }
 842
 843 static struct wim_inode *
 844 inode_table_get_inode(struct wim_inode_table *table, u64 ino, u64 devno)
 845 {
 846         u64 hash = hash_u64(hash_u64(ino) + hash_u64(devno));
 847         size_t pos = hash % table->capacity;
 848         struct wim_inode *inode;
 849         struct hlist_node *cur;
 850
 851         /* Search for an existing inode having the same inode number and device
 852          * number.  */
 853         hlist_for_each_entry(inode, cur, &table->array[pos], i_hlist) {
 854                 if (inode->i_ino == ino && inode->i_devno == devno) {
 855                         /* Found; use the existing inode.  */
 856                         inode->i_nlink++;
 857                         return inode;
 858                 }
 859         }
 860
 861         /* Create a new inode and insert it into the table.  */
 862         inode = new_timeless_inode();
 863         if (inode) {
 864                 inode->i_ino = ino;
 865                 inode->i_devno = devno;
 866                 hlist_add_head(&inode->i_hlist, &table->array[pos]);
 867                 table->num_entries++;
 868         }
 869         return inode;
 870 }
 871
 872 /*
 873  * Allocate a new dentry, with hard link detection.
 874  *
 875  * @table
 876  *      The inode table being used for the current directory scan operation.  It
 877  *      will contain the mapping from (ino, devno) pairs to inodes.
 878  *
 879  * @name
 880  *      The name to give the new dentry.
 881  *
 882  * @ino
 883  *      The inode number of the file, read from the filesystem.
 884  *
 885  * @devno
 886  *      The device number of the file, read from the filesystem.  Proper setting
 887  *      of this parameter prevents cross-device hardlinks from being created.
 888  *      If this is not a problem (perhaps because the current directory scan
 889  *      operation is guaranteed to never traverse a filesystem boundary), then
 890  *      this parameter can just be a fixed value such as 0.
 891  *
 892  * @noshare
 893  *      If %true, the new dentry will not be hard linked to any existing inode,
 894  *      regardless of the values of @ino and @devno.  If %false, normal hard
 895  *      link detection will be done.
 896  *
 897  * @dentry_ret
 898  *      On success, a pointer to the new dentry will be returned in this
 899  *      location.  If i_nlink of the dentry's inode is greater than 1, then this
 900  *      function created a hard link to an existing inode rather than creating a
 901  *      new inode.
 902  *
 903  * On success, returns 0.  On failure, returns WIMLIB_ERR_NOMEM or an error code
 904  * resulting from a failed string conversion.
 905  */
 906 int
 907 inode_table_new_dentry(struct wim_inode_table *table, const tchar *name,
 908                        u64 ino, u64 devno, bool noshare,
 909                        struct wim_dentry **dentry_ret)
 910 {
 911         struct wim_dentry *dentry;
 912         struct wim_inode *inode;
 913         int ret;
 914
 915         if (noshare) {
 916                 /* File that cannot be hardlinked--- Return a new inode with its
 917                  * inode and device numbers left at 0. */
 918                 ret = new_dentry_with_timeless_inode(name, &dentry);
 919                 if (ret)
 920                         return ret;
 921                 list_add_tail(&dentry->d_inode->i_list, &table->extra_inodes);
 922         } else {
 923                 /* File that can be hardlinked--- search the table for an
 924                  * existing inode matching the inode number and device;
 925                  * otherwise create a new inode. */
 926                 ret = new_dentry(name, &dentry);
 927                 if (ret)
 928                         return ret;
 929                 inode = inode_table_get_inode(table, ino, devno);
 930                 if (!inode) {
 931                         free_dentry(dentry);
 932                         return WIMLIB_ERR_NOMEM;
 933                 }
 934                 /* If using an existing inode, we need to gain a reference to
 935                  * each of its streams. */
 936                 if (inode->i_nlink > 1)
 937                         inode_ref_streams(inode);
 938                 dentry->d_inode = inode;
 939                 inode_add_dentry(dentry, inode);
 940         }
 941         *dentry_ret = dentry;
 942         return 0;
 943 }
 944
 945
 946
 947 /*
 948  * Following the allocation of dentries with hard link detection using
 949  * inode_table_new_dentry(), this function will assign consecutive inode numbers
 950  * to the new set of inodes.  It will also append the list of new inodes to the
 951  * list @head, which must contain any inodes already existing in the WIM image.
 952  */
 953 void
 954 inode_table_prepare_inode_list(struct wim_inode_table *table,
 955                                struct list_head *head)
 956 {
 957         struct wim_inode *inode, *tmp_inode;
 958         struct hlist_node *cur, *tmp;
 959         u64 cur_ino = 1;
 960
 961         /* Re-assign inode numbers in the existing list to avoid duplicates. */
 962         list_for_each_entry(inode, head, i_list)
 963                 inode->i_ino = cur_ino++;
 964
 965         /* Assign inode numbers to the new inodes and move them to the image's
 966          * inode list. */
 967         for (size_t i = 0; i < table->capacity; i++) {
 968                 hlist_for_each_entry_safe(inode, cur, tmp, &table->array[i], i_hlist)
 969                 {
 970                         inode->i_ino = cur_ino++;
 971                         inode->i_devno = 0;
 972                         list_add_tail(&inode->i_list, head);
 973                 }
 974                 INIT_HLIST_HEAD(&table->array[i]);
 975         }
 976         list_for_each_entry_safe(inode, tmp_inode, &table->extra_inodes, i_list)
 977         {
 978                 inode->i_ino = cur_ino++;
 979                 inode->i_devno = 0;
 980                 list_add_tail(&inode->i_list, head);
 981         }
 982         INIT_LIST_HEAD(&table->extra_inodes);
 983         table->num_entries = 0;
 984 }