]> wimlib.net Git - wimlib/blob - src/symlink.c
3472ed1148fc0ee6bddd04bc936ac6623c429ae7
[wimlib] / src / symlink.c
1 #include "dentry.h"
2 #include "io.h"
3 #include "lookup_table.h"
4 #include "sha1.h"
5 #include <errno.h>
6
7 /*
8  * Find the symlink target of a symbolic link or junction point in the WIM.
9  *
10  * See http://msdn.microsoft.com/en-us/library/cc232006(v=prot.10).aspx
11  * Except the first 8 bytes aren't included in the resource (presumably because
12  * we already know the reparse tag from the dentry, and we already know the
13  * reparse tag len from the lookup table entry resource length).
14  */
15 static ssize_t get_symlink_name(const u8 *resource, size_t resource_len,
16                                 char *buf, size_t buf_len,
17                                 u32 reparse_tag)
18 {
19         const u8 *p = resource;
20         u16 substitute_name_offset;
21         u16 substitute_name_len;
22         u16 print_name_offset;
23         u16 print_name_len;
24         char *link_target;
25         size_t link_target_len;
26         ssize_t ret;
27         unsigned header_size;
28         char *translated_target;
29         bool is_absolute;
30         u32 flags;
31
32         if (resource_len < 12)
33                 return -EIO;
34         p = get_u16(p, &substitute_name_offset);
35         p = get_u16(p, &substitute_name_len);
36         p = get_u16(p, &print_name_offset);
37         p = get_u16(p, &print_name_len);
38         get_u32(p, &flags);
39
40         wimlib_assert(reparse_tag == WIM_IO_REPARSE_TAG_SYMLINK ||
41                       reparse_tag == WIM_IO_REPARSE_TAG_MOUNT_POINT);
42
43         /* I think that some junction points incorrectly get marked as symbolic
44          * links.  So, parse the link buffer as a symlink if the flags seem
45          * plausible. */
46         if (flags <= 1)
47                 reparse_tag = WIM_IO_REPARSE_TAG_SYMLINK;
48
49         if (reparse_tag == WIM_IO_REPARSE_TAG_MOUNT_POINT) {
50                 header_size = 8;
51         } else {
52                 is_absolute = (flags & 1) ? false : true;
53                 header_size = 12;
54                 p += 4;
55         }
56         if (header_size + substitute_name_offset + substitute_name_len > resource_len)
57                 return -EIO;
58         link_target = utf16_to_utf8(p + substitute_name_offset,
59                                     substitute_name_len,
60                                     &link_target_len);
61
62         if (!link_target)
63                 return -EIO;
64
65         if (link_target_len + 1 > buf_len) {
66                 ret = -ENAMETOOLONG;
67                 goto out;
68         }
69
70         translated_target = link_target;
71         if (reparse_tag == WIM_IO_REPARSE_TAG_MOUNT_POINT || is_absolute) {
72                 if (link_target_len < 7
73                       || memcmp(translated_target, "\\??\\", 4) != 0
74                       || translated_target[4] == '\0'
75                       || translated_target[5] != ':'
76                       || translated_target[6] != '\\') {
77                         ret = -EIO;
78                         goto out;
79                 }
80                 translated_target += 4;
81                 link_target_len -= 4;
82                 /* There's a drive letter, so just leave the backslashes since
83                  * it won't go anyhwere on UNIX anyway... */
84         } else {
85                 for (size_t i = 0; i < link_target_len; i++)
86                         if (translated_target[i] == '\\')
87                                 translated_target[i] = '/';
88         }
89
90         memcpy(buf, translated_target, link_target_len + 1);
91         ret = link_target_len;
92 out:
93         FREE(link_target);
94         return ret;
95 }
96
97 void *make_symlink_reparse_data_buf(const char *symlink_target, size_t *len_ret)
98 {
99         size_t utf8_len = strlen(symlink_target);
100         size_t utf16_len;
101         char *name_utf16 = utf8_to_utf16(symlink_target, utf8_len, &utf16_len);
102         if (!name_utf16)
103                 return NULL;
104         /*DEBUG("utf16_len = %zu", utf16_len);*/
105         for (size_t i = 0; i < utf16_len / 2; i++)
106                 if (((u16*)name_utf16)[i] == to_le16('/'))
107                         ((u16*)name_utf16)[i] = to_le16('\\');
108         size_t len = 12 + utf16_len * 2;
109         void *buf = MALLOC(len);
110         if (!buf)
111                 goto out;
112         /* XXX Fix absolute paths */
113
114         u8 *p = buf;
115         p = put_u16(p, 0); /* Substitute name offset */
116         p = put_u16(p, utf16_len); /* Substitute name length */
117         p = put_u16(p, utf16_len); /* Print name offset */
118         p = put_u16(p, utf16_len); /* Print name length */
119         p = put_u32(p, 1);
120         p = put_bytes(p, utf16_len, name_utf16);
121         p = put_bytes(p, utf16_len, name_utf16);
122         /*DEBUG("utf16_len = %zu, len = %zu", utf16_len, len);*/
123         *len_ret = len;
124 out:
125         FREE(name_utf16);
126         return buf;
127 }
128
129 static const struct lookup_table_entry *
130 dentry_first_lte(const struct dentry *dentry, const struct lookup_table *table)
131 {
132         const struct lookup_table_entry *lte;
133         if (dentry->resolved) {
134                 if (dentry->lte)
135                         return dentry->lte;
136                 for (u16 i = 0; i < dentry->num_ads; i++)
137                         if (dentry->ads_entries[i].lte)
138                                 return dentry->ads_entries[i].lte;
139         } else {
140                 const u8 *hash = dentry->hash;
141                 u16 i = 0;
142                 while (1) {
143                         if ((lte = __lookup_resource(table, hash)))
144                                 break;
145                         if (i == dentry->num_ads)
146                                 return NULL;
147                         hash = dentry->ads_entries[i].hash;
148                         i++;
149                 }
150         }
151         return NULL;
152 }
153
154 /* Get the symlink target from a dentry that's already checked to be either a
155  * "real" symlink or a junction point. */
156 ssize_t dentry_readlink(const struct dentry *dentry, char *buf, size_t buf_len,
157                         const WIMStruct *w)
158 {
159         const struct resource_entry *res_entry;
160         const struct lookup_table_entry *lte;
161
162         wimlib_assert(dentry_is_symlink(dentry));
163
164         lte = dentry_first_lte(dentry, w->lookup_table);
165         if (!lte)
166                 return -EIO;
167
168         res_entry = &lte->resource_entry;
169         if (res_entry->original_size > 10000)
170                 return -EIO;
171
172         char __res_buf[res_entry->original_size];
173         const char *res_buf;
174         if (lte->is_symlink && lte->symlink_buf) {
175                 res_buf = lte->symlink_buf;
176         } else {
177                 res_buf = __res_buf;
178                 if (read_full_resource(w->fp, res_entry->size, 
179                                        res_entry->original_size,
180                                        res_entry->offset,
181                                        wim_resource_compression_type(w, res_entry),
182                                        __res_buf) != 0)
183                         return -EIO;
184                 res_buf = __res_buf;
185         }
186         return get_symlink_name(res_buf, res_entry->original_size, buf,
187                                 buf_len, dentry->reparse_tag);
188 }
189
190 static int dentry_set_symlink_buf(struct dentry *dentry,
191                                   const u8 symlink_buf_hash[])
192 {
193         struct ads_entry *ads_entries;
194
195         ads_entries = CALLOC(2, sizeof(struct ads_entry));
196         if (!ads_entries)
197                 return WIMLIB_ERR_NOMEM;
198         memcpy(ads_entries[1].hash, symlink_buf_hash, WIM_HASH_SIZE);
199         wimlib_assert(dentry->num_ads == 0);
200         wimlib_assert(!dentry->ads_entries);
201         /*dentry_free_ads_entries(dentry);*/
202         dentry->num_ads = 2;
203         dentry->ads_entries = ads_entries;
204         return 0;
205 }
206
207 int dentry_set_symlink(struct dentry *dentry, const char *target,
208                        struct lookup_table *lookup_table,
209                        struct lookup_table_entry **lte_ret)
210
211 {
212         int ret;
213         size_t symlink_buf_len;
214         struct lookup_table_entry *lte = NULL, *existing_lte;
215         u8 symlink_buf_hash[WIM_HASH_SIZE];
216         void *symlink_buf;
217         
218         symlink_buf = make_symlink_reparse_data_buf(target, &symlink_buf_len);
219         if (!symlink_buf)
220                 return WIMLIB_ERR_NOMEM;
221
222         DEBUG("Made symlink reparse data buf (len = %zu, name len = %zu)",
223                         symlink_buf_len, ret);
224         
225         sha1_buffer(symlink_buf, symlink_buf_len, symlink_buf_hash);
226
227         existing_lte = __lookup_resource(lookup_table, symlink_buf_hash);
228
229         if (existing_lte) {
230                 existing_lte->refcnt++;
231                 lte = existing_lte;
232         } else {
233                 DEBUG("Creating new lookup table entry for symlink buf");
234                 lte = new_lookup_table_entry();
235                 if (!lte) {
236                         ret = WIMLIB_ERR_NOMEM;
237                         goto out_free_symlink_buf;
238                 }
239                 lte->is_symlink = true;
240                 lte->symlink_buf = symlink_buf;
241                 lte->resource_entry.original_size = symlink_buf_len;
242                 lte->resource_entry.size = symlink_buf_len;
243                 memcpy(lte->hash, symlink_buf_hash, WIM_HASH_SIZE);
244         }
245
246         ret = dentry_set_symlink_buf(dentry, symlink_buf_hash);
247
248         if (ret != 0)
249                 goto out_free_lte;
250
251         DEBUG("Loaded symlink buf");
252
253         if (!existing_lte)
254                 lookup_table_insert(lookup_table, lte);
255         if (lte_ret)
256                 *lte_ret = lte;
257         return 0;
258 out_free_lte:
259         if (lte != existing_lte)
260                 FREE(lte);
261 out_free_symlink_buf:
262         FREE(symlink_buf);
263         return ret;
264 }