]>
Commit | Line | Data |
---|---|---|
b0d623f7 | 1 | /* |
d9a64523 | 2 | * Copyright (c) 2008-2018 Apple Inc. All rights reserved. |
b0d623f7 A |
3 | * |
4 | * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ | |
0a7de745 | 5 | * |
b0d623f7 A |
6 | * This file contains Original Code and/or Modifications of Original Code |
7 | * as defined in and that are subject to the Apple Public Source License | |
8 | * Version 2.0 (the 'License'). You may not use this file except in | |
9 | * compliance with the License. The rights granted to you under the License | |
10 | * may not be used to create, or enable the creation or redistribution of, | |
11 | * unlawful or unlicensed copies of an Apple operating system, or to | |
12 | * circumvent, violate, or enable the circumvention or violation of, any | |
13 | * terms of an Apple operating system software license agreement. | |
0a7de745 | 14 | * |
b0d623f7 A |
15 | * Please obtain a copy of the License at |
16 | * http://www.opensource.apple.com/apsl/ and read it before using this file. | |
0a7de745 | 17 | * |
b0d623f7 A |
18 | * The Original Code and all software distributed under the License are |
19 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER | |
20 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, | |
21 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, | |
22 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. | |
23 | * Please see the License for the specific language governing rights and | |
24 | * limitations under the License. | |
0a7de745 | 25 | * |
b0d623f7 A |
26 | * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ |
27 | */ | |
39037602 A |
28 | #if !FS_COMPRESSION |
29 | ||
30 | /* We need these symbols even though compression is turned off */ | |
31 | ||
0a7de745 | 32 | #define UNUSED_SYMBOL(x) asm(".global _" #x "\n.set _" #x ", 0\n"); |
39037602 A |
33 | |
34 | UNUSED_SYMBOL(register_decmpfs_decompressor) | |
35 | UNUSED_SYMBOL(unregister_decmpfs_decompressor) | |
36 | UNUSED_SYMBOL(decmpfs_init) | |
37 | UNUSED_SYMBOL(decmpfs_read_compressed) | |
38 | UNUSED_SYMBOL(decmpfs_cnode_cmp_type) | |
39 | UNUSED_SYMBOL(decmpfs_cnode_get_vnode_state) | |
40 | UNUSED_SYMBOL(decmpfs_cnode_get_vnode_cached_size) | |
cb323159 A |
41 | UNUSED_SYMBOL(decmpfs_cnode_get_vnode_cached_nchildren) |
42 | UNUSED_SYMBOL(decmpfs_cnode_get_vnode_cached_total_size) | |
39037602 A |
43 | UNUSED_SYMBOL(decmpfs_lock_compressed_data) |
44 | UNUSED_SYMBOL(decmpfs_cnode_free) | |
45 | UNUSED_SYMBOL(decmpfs_cnode_alloc) | |
46 | UNUSED_SYMBOL(decmpfs_cnode_destroy) | |
47 | UNUSED_SYMBOL(decmpfs_decompress_file) | |
48 | UNUSED_SYMBOL(decmpfs_unlock_compressed_data) | |
49 | UNUSED_SYMBOL(decmpfs_cnode_init) | |
50 | UNUSED_SYMBOL(decmpfs_cnode_set_vnode_state) | |
51 | UNUSED_SYMBOL(decmpfs_hides_xattr) | |
52 | UNUSED_SYMBOL(decmpfs_ctx) | |
53 | UNUSED_SYMBOL(decmpfs_file_is_compressed) | |
54 | UNUSED_SYMBOL(decmpfs_update_attributes) | |
55 | UNUSED_SYMBOL(decmpfs_hides_rsrc) | |
56 | UNUSED_SYMBOL(decmpfs_pagein_compressed) | |
57 | UNUSED_SYMBOL(decmpfs_validate_compressed_file) | |
58 | ||
59 | #else /* FS_COMPRESSION */ | |
b0d623f7 A |
60 | #include <sys/kernel.h> |
61 | #include <sys/vnode_internal.h> | |
62 | #include <sys/file_internal.h> | |
63 | #include <sys/stat.h> | |
64 | #include <sys/fcntl.h> | |
65 | #include <sys/xattr.h> | |
66 | #include <sys/namei.h> | |
67 | #include <sys/user.h> | |
68 | #include <sys/mount_internal.h> | |
69 | #include <sys/ubc.h> | |
70 | #include <sys/decmpfs.h> | |
71 | #include <sys/uio_internal.h> | |
72 | #include <libkern/OSByteOrder.h> | |
5ba3f43e | 73 | #include <libkern/section_keywords.h> |
b0d623f7 | 74 | |
f427ee49 A |
75 | #include <ptrauth.h> |
76 | ||
b0d623f7 A |
77 | #pragma mark --- debugging --- |
78 | ||
79 | #define COMPRESSION_DEBUG 0 | |
80 | #define COMPRESSION_DEBUG_VERBOSE 0 | |
81 | #define MALLOC_DEBUG 0 | |
82 | ||
/*
 * Return the last component of `path`: the text that follows the final '/'.
 *
 * Returns `path` itself when it contains no '/', an empty string when it
 * ends in '/', and NULL when `path` is NULL. The result points into
 * `path`; nothing is allocated or copied.
 */
static const char *
baseName(const char *path)
{
	const char *leaf = path;
	const char *cursor;

	if (path == NULL) {
		return NULL;
	}

	/* remember the character after every separator; the last one wins */
	for (cursor = path; *cursor != '\0'; cursor++) {
		if (*cursor == '/') {
			leaf = cursor + 1;
		}
	}
	return leaf;
}
98 | ||
f427ee49 | 99 | #if COMPRESSION_DEBUG |
3e170ce0 A |
100 | static char* |
101 | vnpath(vnode_t vp, char *path, int len) | |
102 | { | |
0a7de745 A |
103 | int origlen = len; |
104 | path[0] = 0; | |
105 | vn_getpath(vp, path, &len); | |
106 | path[origlen - 1] = 0; | |
107 | return path; | |
3e170ce0 | 108 | } |
f427ee49 | 109 | #endif |
3e170ce0 | 110 | |
/*
 * Logging helpers.
 *
 * ErrorLog(fmt, ...) always prints. The message is prefixed with the base
 * name of the source file, the line number and the function name. `fmt`
 * must be a string literal because it is pasted onto the prefix.
 *
 * ErrorLogWithPath(fmt, ...) adds a path column and requires a variable
 * named `vp` to be in scope at the call site. With COMPRESSION_DEBUG set
 * the path comes from vnpath() through a temporary PATH_MAX buffer;
 * otherwise the literal "<private>" is printed and `vp` is only referenced
 * so that it counts as used.
 *
 * DebugLog* and VerboseLog* alias the Error variants when the matching
 * debug switch is on, and expand to an empty statement when it is off.
 */
#define ErrorLog(fmt, ...) \
	printf("%s:%d:%s: " fmt, baseName(__FILE__), __LINE__, __FUNCTION__, ## __VA_ARGS__)

#if COMPRESSION_DEBUG
#define ErrorLogWithPath(fmt, ...) \
	do { \
	        char *path; \
	        MALLOC(path, char *, PATH_MAX, M_TEMP, M_WAITOK); \
	        printf("%s:%d:%s: %s: " fmt, baseName(__FILE__), __LINE__, __FUNCTION__, vnpath(vp, path, PATH_MAX), ## __VA_ARGS__); \
	        FREE(path, M_TEMP); \
	} while (0)
#else
#define ErrorLogWithPath(fmt, ...) \
	do { \
	        (void)vp; \
	        printf("%s:%d:%s: %s: " fmt, baseName(__FILE__), __LINE__, __FUNCTION__, "<private>", ## __VA_ARGS__); \
	} while (0)
#endif

#if COMPRESSION_DEBUG
#define DebugLog ErrorLog
#define DebugLogWithPath ErrorLogWithPath
#else
#define DebugLog(...) do { } while (0)
#define DebugLogWithPath(...) do { } while (0)
#endif

#if COMPRESSION_DEBUG_VERBOSE
#define VerboseLog ErrorLog
#define VerboseLogWithPath ErrorLogWithPath
#else
#define VerboseLog(...) do { } while (0)
#define VerboseLogWithPath(...) do { } while (0)
#endif
133 | ||
134 | #if MALLOC_DEBUG | |
135 | ||
136 | static SInt32 totalAlloc; | |
137 | ||
138 | typedef struct { | |
0a7de745 A |
139 | uint32_t allocSz; |
140 | uint32_t magic; | |
141 | const char *file; | |
142 | int line; | |
b0d623f7 A |
143 | } allocated; |
144 | ||
145 | static void * | |
146 | _malloc(uint32_t sz, __unused int type, __unused int flags, const char *file, int line) | |
147 | { | |
0a7de745 A |
148 | uint32_t allocSz = sz + 2 * sizeof(allocated); |
149 | ||
150 | allocated *alloc = NULL; | |
151 | MALLOC(alloc, allocated *, allocSz, type, flags); | |
152 | if (!alloc) { | |
153 | ErrorLog("malloc failed\n"); | |
154 | return NULL; | |
155 | } | |
156 | ||
157 | char *ret = (char*)&alloc[1]; | |
158 | allocated *alloc2 = (allocated*)(ret + sz); | |
159 | ||
160 | alloc->allocSz = allocSz; | |
161 | alloc->magic = 0xdadadada; | |
162 | alloc->file = file; | |
163 | alloc->line = line; | |
164 | ||
165 | *alloc2 = *alloc; | |
166 | ||
167 | int s = OSAddAtomic(sz, &totalAlloc); | |
168 | ErrorLog("malloc(%d) -> %p, total allocations %d\n", sz, ret, s + sz); | |
169 | ||
170 | return ret; | |
b0d623f7 A |
171 | } |
172 | ||
173 | static void | |
174 | _free(char *ret, __unused int type, const char *file, int line) | |
175 | { | |
0a7de745 A |
176 | if (!ret) { |
177 | ErrorLog("freeing null\n"); | |
178 | return; | |
179 | } | |
180 | allocated *alloc = (allocated*)ret; | |
181 | alloc--; | |
182 | uint32_t sz = alloc->allocSz - 2 * sizeof(allocated); | |
183 | allocated *alloc2 = (allocated*)(ret + sz); | |
184 | ||
185 | if (alloc->magic != 0xdadadada) { | |
186 | panic("freeing bad pointer"); | |
187 | } | |
188 | ||
189 | if (memcmp(alloc, alloc2, sizeof(*alloc)) != 0) { | |
190 | panic("clobbered data"); | |
191 | } | |
192 | ||
193 | memset(ret, 0xce, sz); | |
194 | alloc2->file = file; | |
195 | alloc2->line = line; | |
196 | FREE(alloc, type); | |
197 | int s = OSAddAtomic(-sz, &totalAlloc); | |
198 | ErrorLog("free(%p,%d) -> total allocations %d\n", ret, sz, s - sz); | |
b0d623f7 A |
199 | } |
200 | ||
201 | #undef MALLOC | |
202 | #undef FREE | |
0a7de745 | 203 | #define MALLOC(space, cast, size, type, flags) (space) = (cast)_malloc(size, type, flags, __FILE__, __LINE__) |
b0d623f7 A |
204 | #define FREE(addr, type) _free((void *)addr, type, __FILE__, __LINE__) |
205 | ||
206 | #endif /* MALLOC_DEBUG */ | |
207 | ||
208 | #pragma mark --- globals --- | |
209 | ||
/* lock group passed to lck_rw_init()/lck_rw_destroy() for the per-cnode lock */
static lck_grp_t *decmpfs_lockgrp;

/* table of registered decompressors, indexed by compression type */
static const decmpfs_registration *decompressors[CMP_MAX]; /* the registered compressors */
/* reader/writer lock; lookups in this file hold it shared */
static lck_rw_t * decompressorsLock;
static int decompress_channel; /* channel used by decompress_file to wake up waiters */
static lck_mtx_t *decompress_channel_mtx;

/* VFS context handed to the vnode_getattr()/vn_getxattr() calls made by this file */
vfs_context_t decmpfs_ctx;
218 | ||
219 | #pragma mark --- decmp_get_func --- | |
220 | ||
f427ee49 | 221 | #define offsetof_func(func) ((uintptr_t)offsetof(decmpfs_registration, func)) |
b0d623f7 A |
222 | |
223 | static void * | |
f427ee49 | 224 | _func_from_offset(uint32_t type, uintptr_t offset, uint32_t discriminator) |
b0d623f7 | 225 | { |
0a7de745 A |
226 | /* get the function at the given offset in the registration for the given type */ |
227 | const decmpfs_registration *reg = decompressors[type]; | |
0a7de745 A |
228 | |
229 | switch (reg->decmpfs_registration) { | |
230 | case DECMPFS_REGISTRATION_VERSION_V1: | |
231 | if (offset > offsetof_func(free_data)) { | |
232 | return NULL; | |
233 | } | |
234 | break; | |
235 | case DECMPFS_REGISTRATION_VERSION_V3: | |
236 | if (offset > offsetof_func(get_flags)) { | |
237 | return NULL; | |
238 | } | |
239 | break; | |
240 | default: | |
241 | return NULL; | |
242 | } | |
243 | ||
f427ee49 A |
244 | void *ptr = *(void * const *)((const void *)reg + offset); |
245 | if (ptr != NULL) { | |
246 | /* Resign as a function-in-void* */ | |
247 | ptr = ptrauth_auth_and_resign(ptr, ptrauth_key_asia, discriminator, ptrauth_key_asia, 0); | |
248 | } | |
249 | return ptr; | |
b0d623f7 A |
250 | } |
251 | ||
d1ecb069 A |
252 | extern void IOServicePublishResource( const char * property, boolean_t value ); |
253 | extern boolean_t IOServiceWaitForMatchingResource( const char * property, uint64_t timeout ); | |
254 | extern boolean_t IOCatalogueMatchingDriversPresent( const char * property ); | |
255 | ||
b0d623f7 | 256 | static void * |
f427ee49 | 257 | _decmp_get_func(vnode_t vp, uint32_t type, uintptr_t offset, uint32_t discriminator) |
b0d623f7 A |
258 | { |
259 | /* | |
0a7de745 A |
260 | * this function should be called while holding a shared lock to decompressorsLock, |
261 | * and will return with the lock held | |
b0d623f7 | 262 | */ |
0a7de745 A |
263 | |
264 | if (type >= CMP_MAX) { | |
b0d623f7 | 265 | return NULL; |
0a7de745 A |
266 | } |
267 | ||
b0d623f7 A |
268 | if (decompressors[type] != NULL) { |
269 | // the compressor has already registered but the function might be null | |
f427ee49 | 270 | return _func_from_offset(type, offset, discriminator); |
b0d623f7 | 271 | } |
0a7de745 A |
272 | |
273 | // does IOKit know about a kext that is supposed to provide this type? | |
274 | char providesName[80]; | |
275 | snprintf(providesName, sizeof(providesName), "com.apple.AppleFSCompression.providesType%u", type); | |
276 | if (IOCatalogueMatchingDriversPresent(providesName)) { | |
277 | // there is a kext that says it will register for this type, so let's wait for it | |
278 | char resourceName[80]; | |
279 | uint64_t delay = 10000000ULL; // 10 milliseconds. | |
280 | snprintf(resourceName, sizeof(resourceName), "com.apple.AppleFSCompression.Type%u", type); | |
281 | ErrorLogWithPath("waiting for %s\n", resourceName); | |
282 | while (decompressors[type] == NULL) { | |
283 | lck_rw_unlock_shared(decompressorsLock); // we have to unlock to allow the kext to register | |
284 | if (IOServiceWaitForMatchingResource(resourceName, delay)) { | |
285 | lck_rw_lock_shared(decompressorsLock); | |
286 | break; | |
287 | } | |
288 | if (!IOCatalogueMatchingDriversPresent(providesName)) { | |
289 | // | |
290 | ErrorLogWithPath("the kext with %s is no longer present\n", providesName); | |
291 | lck_rw_lock_shared(decompressorsLock); | |
292 | break; | |
293 | } | |
294 | ErrorLogWithPath("still waiting for %s\n", resourceName); | |
295 | delay *= 2; | |
296 | lck_rw_lock_shared(decompressorsLock); | |
297 | } | |
298 | // IOKit says the kext is loaded, so it should be registered too! | |
299 | if (decompressors[type] == NULL) { | |
300 | ErrorLogWithPath("we found %s, but the type still isn't registered\n", providesName); | |
301 | return NULL; | |
302 | } | |
303 | // it's now registered, so let's return the function | |
f427ee49 | 304 | return _func_from_offset(type, offset, discriminator); |
0a7de745 A |
305 | } |
306 | ||
b0d623f7 | 307 | // the compressor hasn't registered, so it never will unless someone manually kextloads it |
3e170ce0 | 308 | ErrorLogWithPath("tried to access a compressed file of unregistered type %d\n", type); |
b0d623f7 A |
309 | return NULL; |
310 | } | |
311 | ||
f427ee49 | 312 | #define decmp_get_func(vp, type, func) (typeof(decompressors[0]->func))_decmp_get_func(vp, type, offsetof_func(func), ptrauth_function_pointer_type_discriminator(typeof(decompressors[0]->func))) |
b0d623f7 A |
313 | |
314 | #pragma mark --- utilities --- | |
315 | ||
316 | #if COMPRESSION_DEBUG | |
b0d623f7 A |
317 | static int |
318 | vnsize(vnode_t vp, uint64_t *size) | |
319 | { | |
0a7de745 A |
320 | struct vnode_attr va; |
321 | VATTR_INIT(&va); | |
322 | VATTR_WANTED(&va, va_data_size); | |
b0d623f7 | 323 | int error = vnode_getattr(vp, &va, decmpfs_ctx); |
0a7de745 A |
324 | if (error != 0) { |
325 | ErrorLogWithPath("vnode_getattr err %d\n", error); | |
326 | return error; | |
327 | } | |
328 | *size = va.va_data_size; | |
329 | return 0; | |
b0d623f7 A |
330 | } |
331 | #endif /* COMPRESSION_DEBUG */ | |
332 | ||
333 | #pragma mark --- cnode routines --- | |
334 | ||
f427ee49 A |
335 | ZONE_DECLARE(decmpfs_cnode_zone, "decmpfs_cnode", |
336 | sizeof(struct decmpfs_cnode), ZC_NONE); | |
337 | ||
0a7de745 A |
338 | decmpfs_cnode * |
339 | decmpfs_cnode_alloc(void) | |
39037602 | 340 | { |
f427ee49 | 341 | return zalloc(decmpfs_cnode_zone); |
39037602 A |
342 | } |
343 | ||
0a7de745 A |
/*
 * Return `dp` to decmpfs_cnode_zone. This only releases the memory; the
 * lock inside the cnode is torn down separately by decmpfs_cnode_destroy().
 */
void
decmpfs_cnode_free(decmpfs_cnode *dp)
{
	zfree(decmpfs_cnode_zone, dp);
}
349 | ||
b0d623f7 A |
350 | void |
351 | decmpfs_cnode_init(decmpfs_cnode *cp) | |
352 | { | |
0a7de745 | 353 | memset(cp, 0, sizeof(*cp)); |
b0d623f7 | 354 | lck_rw_init(&cp->compressed_data_lock, decmpfs_lockgrp, NULL); |
b0d623f7 A |
355 | } |
356 | ||
357 | void | |
358 | decmpfs_cnode_destroy(decmpfs_cnode *cp) | |
359 | { | |
360 | lck_rw_destroy(&cp->compressed_data_lock, decmpfs_lockgrp); | |
b0d623f7 A |
361 | } |
362 | ||
39037602 | 363 | bool |
b0d623f7 A |
364 | decmpfs_trylock_compressed_data(decmpfs_cnode *cp, int exclusive) |
365 | { | |
366 | void *thread = current_thread(); | |
39037602 | 367 | bool retval = false; |
b0d623f7 A |
368 | |
369 | if (cp->lockowner == thread) { | |
370 | /* this thread is already holding an exclusive lock, so bump the count */ | |
371 | cp->lockcount++; | |
39037602 | 372 | retval = true; |
b0d623f7 A |
373 | } else if (exclusive) { |
374 | if ((retval = lck_rw_try_lock_exclusive(&cp->compressed_data_lock))) { | |
375 | cp->lockowner = thread; | |
376 | cp->lockcount = 1; | |
377 | } | |
378 | } else { | |
379 | if ((retval = lck_rw_try_lock_shared(&cp->compressed_data_lock))) { | |
380 | cp->lockowner = (void *)-1; | |
381 | } | |
382 | } | |
383 | return retval; | |
384 | } | |
385 | ||
386 | void | |
387 | decmpfs_lock_compressed_data(decmpfs_cnode *cp, int exclusive) | |
388 | { | |
389 | void *thread = current_thread(); | |
0a7de745 | 390 | |
b0d623f7 A |
391 | if (cp->lockowner == thread) { |
392 | /* this thread is already holding an exclusive lock, so bump the count */ | |
393 | cp->lockcount++; | |
394 | } else if (exclusive) { | |
395 | lck_rw_lock_exclusive(&cp->compressed_data_lock); | |
396 | cp->lockowner = thread; | |
397 | cp->lockcount = 1; | |
398 | } else { | |
399 | lck_rw_lock_shared(&cp->compressed_data_lock); | |
400 | cp->lockowner = (void *)-1; | |
401 | } | |
402 | } | |
403 | ||
404 | void | |
405 | decmpfs_unlock_compressed_data(decmpfs_cnode *cp, __unused int exclusive) | |
406 | { | |
407 | void *thread = current_thread(); | |
0a7de745 | 408 | |
b0d623f7 A |
409 | if (cp->lockowner == thread) { |
410 | /* this thread is holding an exclusive lock, so decrement the count */ | |
411 | if ((--cp->lockcount) > 0) { | |
412 | /* the caller still has outstanding locks, so we're done */ | |
413 | return; | |
414 | } | |
415 | cp->lockowner = NULL; | |
416 | } | |
0a7de745 | 417 | |
b0d623f7 A |
418 | lck_rw_done(&cp->compressed_data_lock); |
419 | } | |
420 | ||
421 | uint32_t | |
422 | decmpfs_cnode_get_vnode_state(decmpfs_cnode *cp) | |
423 | { | |
0a7de745 | 424 | return cp->cmp_state; |
b0d623f7 A |
425 | } |
426 | ||
427 | void | |
428 | decmpfs_cnode_set_vnode_state(decmpfs_cnode *cp, uint32_t state, int skiplock) | |
429 | { | |
0a7de745 A |
430 | if (!skiplock) { |
431 | decmpfs_lock_compressed_data(cp, 1); | |
432 | } | |
f427ee49 | 433 | cp->cmp_state = (uint8_t)state; |
0a7de745 A |
434 | if (state == FILE_TYPE_UNKNOWN) { |
435 | /* clear out the compression type too */ | |
436 | cp->cmp_type = 0; | |
437 | } | |
438 | if (!skiplock) { | |
439 | decmpfs_unlock_compressed_data(cp, 1); | |
440 | } | |
b0d623f7 A |
441 | } |
442 | ||
443 | static void | |
444 | decmpfs_cnode_set_vnode_cmp_type(decmpfs_cnode *cp, uint32_t cmp_type, int skiplock) | |
445 | { | |
0a7de745 A |
446 | if (!skiplock) { |
447 | decmpfs_lock_compressed_data(cp, 1); | |
448 | } | |
449 | cp->cmp_type = cmp_type; | |
450 | if (!skiplock) { | |
451 | decmpfs_unlock_compressed_data(cp, 1); | |
452 | } | |
b0d623f7 A |
453 | } |
454 | ||
455 | static void | |
456 | decmpfs_cnode_set_vnode_minimal_xattr(decmpfs_cnode *cp, int minimal_xattr, int skiplock) | |
457 | { | |
0a7de745 A |
458 | if (!skiplock) { |
459 | decmpfs_lock_compressed_data(cp, 1); | |
460 | } | |
f427ee49 | 461 | cp->cmp_minimal_xattr = !!minimal_xattr; |
0a7de745 A |
462 | if (!skiplock) { |
463 | decmpfs_unlock_compressed_data(cp, 1); | |
464 | } | |
b0d623f7 A |
465 | } |
466 | ||
467 | uint64_t | |
468 | decmpfs_cnode_get_vnode_cached_size(decmpfs_cnode *cp) | |
469 | { | |
0a7de745 | 470 | return cp->uncompressed_size; |
b0d623f7 A |
471 | } |
472 | ||
cb323159 A |
473 | uint64_t |
474 | decmpfs_cnode_get_vnode_cached_nchildren(decmpfs_cnode *cp) | |
475 | { | |
476 | return cp->nchildren; | |
477 | } | |
478 | ||
479 | uint64_t | |
480 | decmpfs_cnode_get_vnode_cached_total_size(decmpfs_cnode *cp) | |
481 | { | |
482 | return cp->total_size; | |
483 | } | |
484 | ||
485 | void | |
b0d623f7 A |
486 | decmpfs_cnode_set_vnode_cached_size(decmpfs_cnode *cp, uint64_t size) |
487 | { | |
0a7de745 A |
488 | while (1) { |
489 | uint64_t old = cp->uncompressed_size; | |
490 | if (OSCompareAndSwap64(old, size, (UInt64*)&cp->uncompressed_size)) { | |
491 | return; | |
492 | } else { | |
493 | /* failed to write our value, so loop */ | |
494 | } | |
495 | } | |
316670eb A |
496 | } |
497 | ||
cb323159 A |
498 | void |
499 | decmpfs_cnode_set_vnode_cached_nchildren(decmpfs_cnode *cp, uint64_t nchildren) | |
500 | { | |
501 | while (1) { | |
502 | uint64_t old = cp->nchildren; | |
503 | if (OSCompareAndSwap64(old, nchildren, (UInt64*)&cp->nchildren)) { | |
504 | return; | |
505 | } else { | |
506 | /* failed to write our value, so loop */ | |
507 | } | |
508 | } | |
509 | } | |
510 | ||
511 | void | |
512 | decmpfs_cnode_set_vnode_cached_total_size(decmpfs_cnode *cp, uint64_t total_sz) | |
513 | { | |
514 | while (1) { | |
515 | uint64_t old = cp->total_size; | |
516 | if (OSCompareAndSwap64(old, total_sz, (UInt64*)&cp->total_size)) { | |
517 | return; | |
518 | } else { | |
519 | /* failed to write our value, so loop */ | |
520 | } | |
521 | } | |
522 | } | |
523 | ||
316670eb A |
524 | static uint64_t |
525 | decmpfs_cnode_get_decompression_flags(decmpfs_cnode *cp) | |
526 | { | |
0a7de745 | 527 | return cp->decompression_flags; |
316670eb A |
528 | } |
529 | ||
530 | static void | |
531 | decmpfs_cnode_set_decompression_flags(decmpfs_cnode *cp, uint64_t flags) | |
532 | { | |
0a7de745 A |
533 | while (1) { |
534 | uint64_t old = cp->decompression_flags; | |
535 | if (OSCompareAndSwap64(old, flags, (UInt64*)&cp->decompression_flags)) { | |
536 | return; | |
537 | } else { | |
538 | /* failed to write our value, so loop */ | |
539 | } | |
540 | } | |
b0d623f7 A |
541 | } |
542 | ||
0a7de745 A |
543 | uint32_t |
544 | decmpfs_cnode_cmp_type(decmpfs_cnode *cp) | |
39037602 A |
545 | { |
546 | return cp->cmp_type; | |
547 | } | |
548 | ||
b0d623f7 A |
549 | #pragma mark --- decmpfs state routines --- |
550 | ||
551 | static int | |
552 | decmpfs_fetch_compressed_header(vnode_t vp, decmpfs_cnode *cp, decmpfs_header **hdrOut, int returnInvalid) | |
553 | { | |
0a7de745 A |
554 | /* |
555 | * fetches vp's compression xattr, converting it into a decmpfs_header; returns 0 or errno | |
556 | * if returnInvalid == 1, returns the header even if the type was invalid (out of range), | |
557 | * and return ERANGE in that case | |
558 | */ | |
559 | ||
560 | size_t read_size = 0; | |
561 | size_t attr_size = 0; | |
562 | uio_t attr_uio = NULL; | |
563 | int err = 0; | |
564 | char *data = NULL; | |
565 | const bool no_additional_data = ((cp != NULL) | |
566 | && (cp->cmp_type != 0) | |
567 | && (cp->cmp_minimal_xattr != 0)); | |
568 | char uio_buf[UIO_SIZEOF(1)]; | |
569 | decmpfs_header *hdr = NULL; | |
570 | ||
571 | /* | |
572 | * Trace the following parameters on entry with event-id 0x03120004 | |
573 | * | |
574 | * @vp->v_id: vnode-id for which to fetch compressed header. | |
575 | * @no_additional_data: If set true then xattr didn't have any extra data. | |
576 | * @returnInvalid: return the header even though the type is out of range. | |
577 | */ | |
578 | DECMPFS_EMIT_TRACE_ENTRY(DECMPDBG_FETCH_COMPRESSED_HEADER, vp->v_id, | |
579 | no_additional_data, returnInvalid); | |
580 | ||
581 | if (no_additional_data) { | |
582 | /* this file's xattr didn't have any extra data when we fetched it, so we can synthesize a header from the data in the cnode */ | |
583 | ||
584 | MALLOC(data, char *, sizeof(decmpfs_header), M_TEMP, M_WAITOK); | |
585 | if (!data) { | |
586 | err = ENOMEM; | |
587 | goto out; | |
588 | } | |
589 | hdr = (decmpfs_header*)data; | |
590 | hdr->attr_size = sizeof(decmpfs_disk_header); | |
591 | hdr->compression_magic = DECMPFS_MAGIC; | |
592 | hdr->compression_type = cp->cmp_type; | |
cb323159 A |
593 | if (hdr->compression_type == DATALESS_PKG_CMPFS_TYPE) { |
594 | if (!vnode_isdir(vp)) { | |
595 | err = EINVAL; | |
596 | goto out; | |
597 | } | |
598 | hdr->_size.value = DECMPFS_PKG_VALUE_FROM_SIZE_COUNT( | |
599 | decmpfs_cnode_get_vnode_cached_size(cp), | |
600 | decmpfs_cnode_get_vnode_cached_nchildren(cp)); | |
601 | } else if (vnode_isdir(vp)) { | |
602 | hdr->_size.value = decmpfs_cnode_get_vnode_cached_nchildren(cp); | |
603 | } else { | |
604 | hdr->_size.value = decmpfs_cnode_get_vnode_cached_size(cp); | |
605 | } | |
0a7de745 A |
606 | } else { |
607 | /* figure out how big the xattr is on disk */ | |
608 | err = vn_getxattr(vp, DECMPFS_XATTR_NAME, NULL, &attr_size, XATTR_NOSECURITY, decmpfs_ctx); | |
609 | if (err != 0) { | |
610 | goto out; | |
611 | } | |
612 | ||
613 | if (attr_size < sizeof(decmpfs_disk_header) || attr_size > MAX_DECMPFS_XATTR_SIZE) { | |
614 | err = EINVAL; | |
615 | goto out; | |
616 | } | |
617 | ||
618 | /* allocation includes space for the extra attr_size field of a compressed_header */ | |
619 | MALLOC(data, char *, attr_size + sizeof(hdr->attr_size), M_TEMP, M_WAITOK); | |
620 | if (!data) { | |
621 | err = ENOMEM; | |
622 | goto out; | |
623 | } | |
624 | ||
625 | /* read the xattr into our buffer, skipping over the attr_size field at the beginning */ | |
626 | attr_uio = uio_createwithbuffer(1, 0, UIO_SYSSPACE, UIO_READ, &uio_buf[0], sizeof(uio_buf)); | |
627 | uio_addiov(attr_uio, CAST_USER_ADDR_T(data + sizeof(hdr->attr_size)), attr_size); | |
628 | ||
629 | err = vn_getxattr(vp, DECMPFS_XATTR_NAME, attr_uio, &read_size, XATTR_NOSECURITY, decmpfs_ctx); | |
630 | if (err != 0) { | |
631 | goto out; | |
632 | } | |
633 | if (read_size != attr_size) { | |
634 | err = EINVAL; | |
635 | goto out; | |
636 | } | |
637 | hdr = (decmpfs_header*)data; | |
f427ee49 | 638 | hdr->attr_size = (uint32_t)attr_size; |
0a7de745 A |
639 | /* swap the fields to native endian */ |
640 | hdr->compression_magic = OSSwapLittleToHostInt32(hdr->compression_magic); | |
641 | hdr->compression_type = OSSwapLittleToHostInt32(hdr->compression_type); | |
642 | hdr->uncompressed_size = OSSwapLittleToHostInt64(hdr->uncompressed_size); | |
643 | } | |
644 | ||
645 | if (hdr->compression_magic != DECMPFS_MAGIC) { | |
646 | ErrorLogWithPath("invalid compression_magic 0x%08x, should be 0x%08x\n", hdr->compression_magic, DECMPFS_MAGIC); | |
647 | err = EINVAL; | |
b0d623f7 | 648 | goto out; |
0a7de745 A |
649 | } |
650 | ||
cb323159 A |
651 | /* |
652 | * Special-case the DATALESS compressor here; that is a valid type, | |
653 | * even through there will never be an entry in the decompressor | |
654 | * handler table for it. If we don't do this, then the cmp_state | |
655 | * for this cnode will end up being marked NOT_COMPRESSED, and | |
656 | * we'll be stuck in limbo. | |
657 | */ | |
658 | if (hdr->compression_type >= CMP_MAX && !decmpfs_type_is_dataless(hdr->compression_type)) { | |
0a7de745 A |
659 | if (returnInvalid) { |
660 | /* return the header even though the type is out of range */ | |
661 | err = ERANGE; | |
662 | } else { | |
663 | ErrorLogWithPath("compression_type %d out of range\n", hdr->compression_type); | |
664 | err = EINVAL; | |
665 | } | |
b0d623f7 | 666 | goto out; |
0a7de745 A |
667 | } |
668 | ||
b0d623f7 | 669 | out: |
0a7de745 A |
670 | if (err && (err != ERANGE)) { |
671 | DebugLogWithPath("err %d\n", err); | |
672 | if (data) { | |
673 | FREE(data, M_TEMP); | |
674 | } | |
675 | *hdrOut = NULL; | |
676 | } else { | |
677 | *hdrOut = hdr; | |
678 | } | |
679 | /* | |
680 | * Trace the following parameters on return with event-id 0x03120004. | |
681 | * | |
682 | * @vp->v_id: vnode-id for which to fetch compressed header. | |
683 | * @err: value returned from this function. | |
684 | */ | |
685 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_FETCH_COMPRESSED_HEADER, vp->v_id, err); | |
686 | return err; | |
b0d623f7 A |
687 | } |
688 | ||
689 | static int | |
690 | decmpfs_fast_get_state(decmpfs_cnode *cp) | |
691 | { | |
0a7de745 A |
692 | /* |
693 | * return the cached state | |
694 | * this should *only* be called when we know that decmpfs_file_is_compressed has already been called, | |
695 | * because this implies that the cached state is valid | |
696 | */ | |
697 | int cmp_state = decmpfs_cnode_get_vnode_state(cp); | |
698 | ||
699 | switch (cmp_state) { | |
700 | case FILE_IS_NOT_COMPRESSED: | |
701 | case FILE_IS_COMPRESSED: | |
702 | case FILE_IS_CONVERTING: | |
703 | return cmp_state; | |
704 | case FILE_TYPE_UNKNOWN: | |
705 | /* | |
706 | * we should only get here if decmpfs_file_is_compressed was not called earlier on this vnode, | |
707 | * which should not be possible | |
708 | */ | |
709 | ErrorLog("decmpfs_fast_get_state called on unknown file\n"); | |
710 | return FILE_IS_NOT_COMPRESSED; | |
711 | default: | |
712 | /* */ | |
713 | ErrorLog("unknown cmp_state %d\n", cmp_state); | |
714 | return FILE_IS_NOT_COMPRESSED; | |
715 | } | |
b0d623f7 A |
716 | } |
717 | ||
718 | static int | |
719 | decmpfs_fast_file_is_compressed(decmpfs_cnode *cp) | |
720 | { | |
0a7de745 A |
721 | int cmp_state = decmpfs_cnode_get_vnode_state(cp); |
722 | ||
723 | switch (cmp_state) { | |
724 | case FILE_IS_NOT_COMPRESSED: | |
725 | return 0; | |
726 | case FILE_IS_COMPRESSED: | |
727 | case FILE_IS_CONVERTING: | |
728 | return 1; | |
729 | case FILE_TYPE_UNKNOWN: | |
730 | /* | |
731 | * we should only get here if decmpfs_file_is_compressed was not called earlier on this vnode, | |
732 | * which should not be possible | |
733 | */ | |
734 | ErrorLog("decmpfs_fast_get_state called on unknown file\n"); | |
735 | return 0; | |
736 | default: | |
737 | /* */ | |
738 | ErrorLog("unknown cmp_state %d\n", cmp_state); | |
739 | return 0; | |
740 | } | |
b0d623f7 A |
741 | } |
742 | ||
743 | errno_t | |
744 | decmpfs_validate_compressed_file(vnode_t vp, decmpfs_cnode *cp) | |
745 | { | |
0a7de745 A |
746 | /* give a compressor a chance to indicate that a compressed file is invalid */ |
747 | ||
748 | decmpfs_header *hdr = NULL; | |
749 | errno_t err = decmpfs_fetch_compressed_header(vp, cp, &hdr, 0); | |
750 | if (err) { | |
751 | /* we couldn't get the header */ | |
752 | if (decmpfs_fast_get_state(cp) == FILE_IS_NOT_COMPRESSED) { | |
753 | /* the file is no longer compressed, so return success */ | |
754 | err = 0; | |
755 | } | |
756 | goto out; | |
757 | } | |
758 | ||
cb323159 A |
759 | if (!decmpfs_type_is_dataless(hdr->compression_type)) { |
760 | lck_rw_lock_shared(decompressorsLock); | |
761 | decmpfs_validate_compressed_file_func validate = decmp_get_func(vp, hdr->compression_type, validate); | |
762 | if (validate) { /* make sure this validation function is valid */ | |
763 | /* is the data okay? */ | |
764 | err = validate(vp, decmpfs_ctx, hdr); | |
765 | } else if (decmp_get_func(vp, hdr->compression_type, fetch) == NULL) { | |
766 | /* the type isn't registered */ | |
767 | err = EIO; | |
768 | } else { | |
769 | /* no validate registered, so nothing to do */ | |
770 | err = 0; | |
771 | } | |
772 | lck_rw_unlock_shared(decompressorsLock); | |
0a7de745 | 773 | } |
b0d623f7 | 774 | out: |
0a7de745 A |
775 | if (hdr) { |
776 | FREE(hdr, M_TEMP); | |
777 | } | |
b0d623f7 | 778 | #if COMPRESSION_DEBUG |
0a7de745 A |
779 | if (err) { |
780 | DebugLogWithPath("decmpfs_validate_compressed_file ret %d, vp->v_flag %d\n", err, vp->v_flag); | |
781 | } | |
b0d623f7 | 782 | #endif |
0a7de745 | 783 | return err; |
b0d623f7 A |
784 | } |
785 | ||
786 | int | |
787 | decmpfs_file_is_compressed(vnode_t vp, decmpfs_cnode *cp) | |
788 | { | |
0a7de745 A |
789 | /* |
790 | * determines whether vp points to a compressed file | |
791 | * | |
792 | * to speed up this operation, we cache the result in the cnode, and do as little as possible | |
793 | * in the case where the cnode already has a valid cached state | |
794 | * | |
795 | */ | |
796 | ||
797 | int ret = 0; | |
798 | int error = 0; | |
799 | uint32_t cmp_state; | |
800 | struct vnode_attr va_fetch; | |
801 | decmpfs_header *hdr = NULL; | |
802 | mount_t mp = NULL; | |
803 | int cnode_locked = 0; | |
804 | int saveInvalid = 0; // save the header data even though the type was out of range | |
805 | uint64_t decompression_flags = 0; | |
806 | bool is_mounted, is_local_fs; | |
807 | ||
808 | if (vnode_isnamedstream(vp)) { | |
809 | /* | |
810 | * named streams can't be compressed | |
811 | * since named streams of the same file share the same cnode, | |
812 | * we don't want to get/set the state in the cnode, just return 0 | |
813 | */ | |
814 | return 0; | |
815 | } | |
816 | ||
817 | /* examine the cached a state in this cnode */ | |
818 | cmp_state = decmpfs_cnode_get_vnode_state(cp); | |
819 | switch (cmp_state) { | |
820 | case FILE_IS_NOT_COMPRESSED: | |
821 | return 0; | |
822 | case FILE_IS_COMPRESSED: | |
823 | return 1; | |
824 | case FILE_IS_CONVERTING: | |
825 | /* treat the file as compressed, because this gives us a way to block future reads until decompression is done */ | |
826 | return 1; | |
827 | case FILE_TYPE_UNKNOWN: | |
828 | /* the first time we encountered this vnode, so we need to check it out */ | |
829 | break; | |
830 | default: | |
831 | /* unknown state, assume file is not compressed */ | |
832 | ErrorLogWithPath("unknown cmp_state %d\n", cmp_state); | |
833 | return 0; | |
834 | } | |
835 | ||
0a7de745 A |
836 | is_mounted = false; |
837 | is_local_fs = false; | |
838 | mp = vnode_mount(vp); | |
839 | if (mp) { | |
840 | is_mounted = true; | |
841 | } | |
842 | if (is_mounted) { | |
843 | is_local_fs = ((mp->mnt_flag & MNT_LOCAL)); | |
844 | } | |
845 | /* | |
846 | * Trace the following parameters on entry with event-id 0x03120014. | |
847 | * | |
848 | * @vp->v_id: vnode-id of the file being queried. | |
849 | * @is_mounted: set to true if @vp belongs to a mounted fs. | |
850 | * @is_local_fs: set to true if @vp belongs to local fs. | |
851 | */ | |
852 | DECMPFS_EMIT_TRACE_ENTRY(DECMPDBG_FILE_IS_COMPRESSED, vp->v_id, | |
853 | is_mounted, is_local_fs); | |
854 | ||
855 | if (!is_mounted) { | |
856 | /* | |
857 | * this should only be true before we mount the root filesystem | |
858 | * we short-cut this return to avoid the call to getattr below, which | |
859 | * will fail before root is mounted | |
860 | */ | |
861 | ret = FILE_IS_NOT_COMPRESSED; | |
862 | goto done; | |
863 | } | |
864 | ||
865 | if (!is_local_fs) { | |
866 | /* compression only supported on local filesystems */ | |
867 | ret = FILE_IS_NOT_COMPRESSED; | |
868 | goto done; | |
869 | } | |
870 | ||
b0d623f7 A |
871 | /* lock our cnode data so that another caller doesn't change the state under us */ |
872 | decmpfs_lock_compressed_data(cp, 1); | |
873 | cnode_locked = 1; | |
0a7de745 | 874 | |
b0d623f7 A |
875 | VATTR_INIT(&va_fetch); |
876 | VATTR_WANTED(&va_fetch, va_flags); | |
877 | error = vnode_getattr(vp, &va_fetch, decmpfs_ctx); | |
878 | if (error) { | |
0a7de745 A |
879 | /* failed to get the bsd flags so the file is not compressed */ |
880 | ret = FILE_IS_NOT_COMPRESSED; | |
881 | goto done; | |
882 | } | |
b0d623f7 A |
883 | if (va_fetch.va_flags & UF_COMPRESSED) { |
884 | /* UF_COMPRESSED is on, make sure the file has the DECMPFS_XATTR_NAME xattr */ | |
0a7de745 A |
885 | error = decmpfs_fetch_compressed_header(vp, cp, &hdr, 1); |
886 | if ((hdr != NULL) && (error == ERANGE)) { | |
887 | saveInvalid = 1; | |
888 | } | |
889 | if (error) { | |
890 | /* failed to get the xattr so the file is not compressed */ | |
891 | ret = FILE_IS_NOT_COMPRESSED; | |
892 | goto done; | |
893 | } | |
cb323159 A |
894 | /* |
895 | * We got the xattr, so the file is at least tagged compressed. | |
896 | * For DATALESS, regular files and directories can be "compressed". | |
897 | * For all other types, only files are allowed. | |
898 | */ | |
899 | if (!vnode_isreg(vp) && | |
900 | !(decmpfs_type_is_dataless(hdr->compression_type) && vnode_isdir(vp))) { | |
901 | ret = FILE_IS_NOT_COMPRESSED; | |
902 | goto done; | |
903 | } | |
0a7de745 A |
904 | ret = FILE_IS_COMPRESSED; |
905 | goto done; | |
906 | } | |
907 | /* UF_COMPRESSED isn't on, so the file isn't compressed */ | |
908 | ret = FILE_IS_NOT_COMPRESSED; | |
909 | ||
b0d623f7 | 910 | done: |
0a7de745 | 911 | if (((ret == FILE_IS_COMPRESSED) || saveInvalid) && hdr) { |
b0d623f7 | 912 | /* |
0a7de745 | 913 | * cache the uncompressed size away in the cnode |
b0d623f7 | 914 | */ |
0a7de745 | 915 | |
b0d623f7 A |
916 | if (!cnode_locked) { |
917 | /* | |
0a7de745 A |
918 | * we should never get here since the only place ret is set to FILE_IS_COMPRESSED |
919 | * is after the call to decmpfs_lock_compressed_data above | |
b0d623f7 A |
920 | */ |
921 | decmpfs_lock_compressed_data(cp, 1); | |
922 | cnode_locked = 1; | |
923 | } | |
0a7de745 | 924 | |
cb323159 A |
925 | if (vnode_isdir(vp)) { |
926 | decmpfs_cnode_set_vnode_cached_size(cp, 64); | |
927 | decmpfs_cnode_set_vnode_cached_nchildren(cp, decmpfs_get_directory_entries(hdr)); | |
928 | if (hdr->compression_type == DATALESS_PKG_CMPFS_TYPE) { | |
929 | decmpfs_cnode_set_vnode_cached_total_size(cp, DECMPFS_PKG_SIZE(hdr->_size)); | |
930 | } | |
931 | } else { | |
932 | decmpfs_cnode_set_vnode_cached_size(cp, hdr->uncompressed_size); | |
933 | } | |
b0d623f7 | 934 | decmpfs_cnode_set_vnode_state(cp, ret, 1); |
0a7de745 A |
935 | decmpfs_cnode_set_vnode_cmp_type(cp, hdr->compression_type, 1); |
936 | /* remember if the xattr's size was equal to the minimal xattr */ | |
937 | if (hdr->attr_size == sizeof(decmpfs_disk_header)) { | |
938 | decmpfs_cnode_set_vnode_minimal_xattr(cp, 1, 1); | |
939 | } | |
940 | if (ret == FILE_IS_COMPRESSED) { | |
941 | /* update the ubc's size for this file */ | |
942 | ubc_setsize(vp, hdr->uncompressed_size); | |
943 | ||
944 | /* update the decompression flags in the decmpfs cnode */ | |
945 | lck_rw_lock_shared(decompressorsLock); | |
946 | decmpfs_get_decompression_flags_func get_flags = decmp_get_func(vp, hdr->compression_type, get_flags); | |
947 | if (get_flags) { | |
948 | decompression_flags = get_flags(vp, decmpfs_ctx, hdr); | |
949 | } | |
950 | lck_rw_unlock_shared(decompressorsLock); | |
951 | decmpfs_cnode_set_decompression_flags(cp, decompression_flags); | |
952 | } | |
b0d623f7 A |
953 | } else { |
954 | /* we might have already taken the lock above; if so, skip taking it again by passing cnode_locked as the skiplock parameter */ | |
955 | decmpfs_cnode_set_vnode_state(cp, ret, cnode_locked); | |
956 | } | |
0a7de745 A |
957 | |
958 | if (cnode_locked) { | |
959 | decmpfs_unlock_compressed_data(cp, 1); | |
960 | } | |
961 | ||
962 | if (hdr) { | |
963 | FREE(hdr, M_TEMP); | |
964 | } | |
965 | /* | |
966 | * Trace the following parameters on return with event-id 0x03120014. | |
967 | * | |
968 | * @vp->v_id: vnode-id of the file being queried. | |
969 | * @return: set to 1 is file is compressed. | |
970 | */ | |
971 | switch (ret) { | |
972 | case FILE_IS_NOT_COMPRESSED: | |
973 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_FILE_IS_COMPRESSED, vp->v_id, 0); | |
974 | return 0; | |
975 | case FILE_IS_COMPRESSED: | |
976 | case FILE_IS_CONVERTING: | |
977 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_FILE_IS_COMPRESSED, vp->v_id, 1); | |
978 | return 1; | |
979 | default: | |
980 | /* unknown state, assume file is not compressed */ | |
981 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_FILE_IS_COMPRESSED, vp->v_id, 0); | |
982 | ErrorLogWithPath("unknown ret %d\n", ret); | |
983 | return 0; | |
984 | } | |
b0d623f7 A |
985 | } |
986 | ||
987 | int | |
988 | decmpfs_update_attributes(vnode_t vp, struct vnode_attr *vap) | |
989 | { | |
0a7de745 A |
990 | int error = 0; |
991 | ||
992 | if (VATTR_IS_ACTIVE(vap, va_flags)) { | |
993 | /* the BSD flags are being updated */ | |
994 | if (vap->va_flags & UF_COMPRESSED) { | |
995 | /* the compressed bit is being set, did it change? */ | |
996 | struct vnode_attr va_fetch; | |
997 | int old_flags = 0; | |
998 | VATTR_INIT(&va_fetch); | |
999 | VATTR_WANTED(&va_fetch, va_flags); | |
b0d623f7 | 1000 | error = vnode_getattr(vp, &va_fetch, decmpfs_ctx); |
0a7de745 A |
1001 | if (error) { |
1002 | return error; | |
1003 | } | |
1004 | ||
1005 | old_flags = va_fetch.va_flags; | |
1006 | ||
1007 | if (!(old_flags & UF_COMPRESSED)) { | |
1008 | /* | |
1009 | * Compression bit was turned on, make sure the file has the DECMPFS_XATTR_NAME attribute. | |
1010 | * This precludes anyone from using the UF_COMPRESSED bit for anything else, and it enforces | |
1011 | * an order of operation -- you must first do the setxattr and then the chflags. | |
1012 | */ | |
1013 | ||
b0d623f7 A |
1014 | if (VATTR_IS_ACTIVE(vap, va_data_size)) { |
1015 | /* | |
1016 | * don't allow the caller to set the BSD flag and the size in the same call | |
1017 | * since this doesn't really make sense | |
1018 | */ | |
1019 | vap->va_flags &= ~UF_COMPRESSED; | |
1020 | return 0; | |
1021 | } | |
0a7de745 A |
1022 | |
1023 | decmpfs_header *hdr = NULL; | |
1024 | error = decmpfs_fetch_compressed_header(vp, NULL, &hdr, 1); | |
1025 | if (error == 0) { | |
1026 | /* | |
cb323159 A |
1027 | * Allow the flag to be set since the decmpfs attribute |
1028 | * is present. | |
1029 | * | |
1030 | * If we're creating a dataless file we do not want to | |
1031 | * truncate it to zero which allows the file resolver to | |
1032 | * have more control over when truncation should happen. | |
1033 | * All other types of compressed files are truncated to | |
1034 | * zero. | |
0a7de745 | 1035 | */ |
cb323159 A |
1036 | if (!decmpfs_type_is_dataless(hdr->compression_type)) { |
1037 | VATTR_SET_ACTIVE(vap, va_data_size); | |
1038 | vap->va_data_size = 0; | |
1039 | } | |
0a7de745 A |
1040 | } else if (error == ERANGE) { |
1041 | /* the file had a decmpfs attribute but the type was out of range, so don't muck with the file's data size */ | |
1042 | } else { | |
1043 | /* no DECMPFS_XATTR_NAME attribute, so deny the update */ | |
b0d623f7 | 1044 | vap->va_flags &= ~UF_COMPRESSED; |
0a7de745 A |
1045 | } |
1046 | if (hdr) { | |
1047 | FREE(hdr, M_TEMP); | |
1048 | } | |
1049 | } | |
1050 | } | |
1051 | } | |
1052 | ||
1053 | return 0; | |
b0d623f7 A |
1054 | } |
1055 | ||
1056 | static int | |
1057 | wait_for_decompress(decmpfs_cnode *cp) | |
1058 | { | |
0a7de745 A |
1059 | int state; |
1060 | lck_mtx_lock(decompress_channel_mtx); | |
1061 | do { | |
1062 | state = decmpfs_fast_get_state(cp); | |
1063 | if (state != FILE_IS_CONVERTING) { | |
1064 | /* file is not decompressing */ | |
1065 | lck_mtx_unlock(decompress_channel_mtx); | |
1066 | return state; | |
1067 | } | |
1068 | msleep((caddr_t)&decompress_channel, decompress_channel_mtx, PINOD, "wait_for_decompress", NULL); | |
1069 | } while (1); | |
b0d623f7 A |
1070 | } |
1071 | ||
1072 | #pragma mark --- decmpfs hide query routines --- | |
1073 | ||
1074 | int | |
1075 | decmpfs_hides_rsrc(vfs_context_t ctx, decmpfs_cnode *cp) | |
1076 | { | |
1077 | /* | |
0a7de745 A |
1078 | * WARNING!!! |
1079 | * callers may (and do) pass NULL for ctx, so we should only use it | |
1080 | * for this equality comparison | |
1081 | * | |
1082 | * This routine should only be called after a file has already been through decmpfs_file_is_compressed | |
b0d623f7 | 1083 | */ |
0a7de745 A |
1084 | |
1085 | if (ctx == decmpfs_ctx) { | |
b0d623f7 | 1086 | return 0; |
0a7de745 A |
1087 | } |
1088 | ||
1089 | if (!decmpfs_fast_file_is_compressed(cp)) { | |
b0d623f7 | 1090 | return 0; |
0a7de745 A |
1091 | } |
1092 | ||
b0d623f7 A |
1093 | /* all compressed files hide their resource fork */ |
1094 | return 1; | |
1095 | } | |
1096 | ||
1097 | int | |
1098 | decmpfs_hides_xattr(vfs_context_t ctx, decmpfs_cnode *cp, const char *xattr) | |
1099 | { | |
1100 | /* | |
0a7de745 A |
1101 | * WARNING!!! |
1102 | * callers may (and do) pass NULL for ctx, so we should only use it | |
1103 | * for this equality comparison | |
1104 | * | |
1105 | * This routine should only be called after a file has already been through decmpfs_file_is_compressed | |
b0d623f7 | 1106 | */ |
0a7de745 A |
1107 | |
1108 | if (ctx == decmpfs_ctx) { | |
b0d623f7 | 1109 | return 0; |
0a7de745 A |
1110 | } |
1111 | if (strncmp(xattr, XATTR_RESOURCEFORK_NAME, sizeof(XATTR_RESOURCEFORK_NAME) - 1) == 0) { | |
b0d623f7 | 1112 | return decmpfs_hides_rsrc(ctx, cp); |
0a7de745 A |
1113 | } |
1114 | if (!decmpfs_fast_file_is_compressed(cp)) { | |
1115 | /* file is not compressed, so don't hide this xattr */ | |
b0d623f7 | 1116 | return 0; |
0a7de745 A |
1117 | } |
1118 | if (strncmp(xattr, DECMPFS_XATTR_NAME, sizeof(DECMPFS_XATTR_NAME) - 1) == 0) { | |
1119 | /* it's our xattr, so hide it */ | |
b0d623f7 | 1120 | return 1; |
0a7de745 | 1121 | } |
b0d623f7 A |
1122 | /* don't hide this xattr */ |
1123 | return 0; | |
1124 | } | |
1125 | ||
1126 | #pragma mark --- registration/validation routines --- | |
1127 | ||
0a7de745 A |
1128 | static inline int |
1129 | registration_valid(const decmpfs_registration *registration) | |
316670eb | 1130 | { |
0a7de745 | 1131 | return registration && ((registration->decmpfs_registration == DECMPFS_REGISTRATION_VERSION_V1) || (registration->decmpfs_registration == DECMPFS_REGISTRATION_VERSION_V3)); |
316670eb A |
1132 | } |
1133 | ||
b0d623f7 | 1134 | errno_t |
5ba3f43e | 1135 | register_decmpfs_decompressor(uint32_t compression_type, const decmpfs_registration *registration) |
b0d623f7 | 1136 | { |
0a7de745 A |
1137 | /* called by kexts to register decompressors */ |
1138 | ||
1139 | errno_t ret = 0; | |
1140 | int locked = 0; | |
1141 | char resourceName[80]; | |
1142 | ||
1143 | if ((compression_type >= CMP_MAX) || !registration_valid(registration)) { | |
1144 | ret = EINVAL; | |
1145 | goto out; | |
1146 | } | |
1147 | ||
1148 | lck_rw_lock_exclusive(decompressorsLock); locked = 1; | |
1149 | ||
1150 | /* make sure the registration for this type is zero */ | |
b0d623f7 A |
1151 | if (decompressors[compression_type] != NULL) { |
1152 | ret = EEXIST; | |
1153 | goto out; | |
1154 | } | |
0a7de745 A |
1155 | decompressors[compression_type] = registration; |
1156 | snprintf(resourceName, sizeof(resourceName), "com.apple.AppleFSCompression.Type%u", compression_type); | |
1157 | IOServicePublishResource(resourceName, TRUE); | |
1158 | ||
b0d623f7 | 1159 | out: |
0a7de745 A |
1160 | if (locked) { |
1161 | lck_rw_unlock_exclusive(decompressorsLock); | |
1162 | } | |
1163 | return ret; | |
b0d623f7 A |
1164 | } |
1165 | ||
1166 | errno_t | |
1167 | unregister_decmpfs_decompressor(uint32_t compression_type, decmpfs_registration *registration) | |
1168 | { | |
0a7de745 A |
1169 | /* called by kexts to unregister decompressors */ |
1170 | ||
1171 | errno_t ret = 0; | |
1172 | int locked = 0; | |
1173 | char resourceName[80]; | |
1174 | ||
1175 | if ((compression_type >= CMP_MAX) || !registration_valid(registration)) { | |
1176 | ret = EINVAL; | |
1177 | goto out; | |
1178 | } | |
1179 | ||
1180 | lck_rw_lock_exclusive(decompressorsLock); locked = 1; | |
1181 | if (decompressors[compression_type] != registration) { | |
1182 | ret = EEXIST; | |
1183 | goto out; | |
1184 | } | |
1185 | decompressors[compression_type] = NULL; | |
1186 | snprintf(resourceName, sizeof(resourceName), "com.apple.AppleFSCompression.Type%u", compression_type); | |
1187 | IOServicePublishResource(resourceName, FALSE); | |
1188 | ||
b0d623f7 | 1189 | out: |
0a7de745 A |
1190 | if (locked) { |
1191 | lck_rw_unlock_exclusive(decompressorsLock); | |
1192 | } | |
1193 | return ret; | |
b0d623f7 A |
1194 | } |
1195 | ||
1196 | static int | |
3e170ce0 | 1197 | compression_type_valid(vnode_t vp, decmpfs_header *hdr) |
b0d623f7 | 1198 | { |
0a7de745 A |
1199 | /* fast pre-check to determine if the given compressor has checked in */ |
1200 | int ret = 0; | |
1201 | ||
1202 | /* every compressor must have at least a fetch function */ | |
1203 | lck_rw_lock_shared(decompressorsLock); | |
1204 | if (decmp_get_func(vp, hdr->compression_type, fetch) != NULL) { | |
1205 | ret = 1; | |
1206 | } | |
1207 | lck_rw_unlock_shared(decompressorsLock); | |
1208 | ||
1209 | return ret; | |
b0d623f7 A |
1210 | } |
1211 | ||
1212 | #pragma mark --- compression/decompression routines --- | |
1213 | ||
1214 | static int | |
316670eb | 1215 | decmpfs_fetch_uncompressed_data(vnode_t vp, decmpfs_cnode *cp, decmpfs_header *hdr, off_t offset, user_ssize_t size, int nvec, decmpfs_vector *vec, uint64_t *bytes_read) |
b0d623f7 | 1216 | { |
0a7de745 A |
1217 | /* get the uncompressed bytes for the specified region of vp by calling out to the registered compressor */ |
1218 | ||
1219 | int err = 0; | |
1220 | ||
1221 | *bytes_read = 0; | |
1222 | ||
f427ee49 | 1223 | if (offset >= (off_t)hdr->uncompressed_size) { |
0a7de745 A |
1224 | /* reading past end of file; nothing to do */ |
1225 | err = 0; | |
1226 | goto out; | |
1227 | } | |
1228 | if (offset < 0) { | |
1229 | /* tried to read from before start of file */ | |
1230 | err = EINVAL; | |
1231 | goto out; | |
1232 | } | |
f427ee49 | 1233 | if (hdr->uncompressed_size - offset < size) { |
0a7de745 | 1234 | /* adjust size so we don't read past the end of the file */ |
f427ee49 | 1235 | size = (user_ssize_t)(hdr->uncompressed_size - offset); |
b0d623f7 | 1236 | } |
0a7de745 A |
1237 | if (size == 0) { |
1238 | /* nothing to read */ | |
1239 | err = 0; | |
1240 | goto out; | |
1241 | } | |
1242 | ||
1243 | /* | |
1244 | * Trace the following parameters on entry with event-id 0x03120008. | |
1245 | * | |
1246 | * @vp->v_id: vnode-id of the file being decompressed. | |
1247 | * @hdr->compression_type: compression type. | |
1248 | * @offset: offset from where to fetch uncompressed data. | |
1249 | * @size: amount of uncompressed data to fetch. | |
1250 | * | |
1251 | * Please NOTE: @offset and @size can overflow in theory but | |
1252 | * here it is safe. | |
1253 | */ | |
1254 | DECMPFS_EMIT_TRACE_ENTRY(DECMPDBG_FETCH_UNCOMPRESSED_DATA, vp->v_id, | |
1255 | hdr->compression_type, (int)offset, (int)size); | |
1256 | lck_rw_lock_shared(decompressorsLock); | |
1257 | decmpfs_fetch_uncompressed_data_func fetch = decmp_get_func(vp, hdr->compression_type, fetch); | |
1258 | if (fetch) { | |
b0d623f7 | 1259 | err = fetch(vp, decmpfs_ctx, hdr, offset, size, nvec, vec, bytes_read); |
316670eb | 1260 | lck_rw_unlock_shared(decompressorsLock); |
0a7de745 A |
1261 | if (err == 0) { |
1262 | uint64_t decompression_flags = decmpfs_cnode_get_decompression_flags(cp); | |
1263 | if (decompression_flags & DECMPFS_FLAGS_FORCE_FLUSH_ON_DECOMPRESS) { | |
1264 | #if !defined(__i386__) && !defined(__x86_64__) | |
1265 | int i; | |
1266 | for (i = 0; i < nvec; i++) { | |
f427ee49 A |
1267 | assert(vec[i].size >= 0 && vec[i].size <= UINT_MAX); |
1268 | flush_dcache64((addr64_t)(uintptr_t)vec[i].buf, (unsigned int)vec[i].size, FALSE); | |
0a7de745 | 1269 | } |
316670eb | 1270 | #endif |
0a7de745 A |
1271 | } |
1272 | } | |
1273 | } else { | |
1274 | err = ENOTSUP; | |
1275 | lck_rw_unlock_shared(decompressorsLock); | |
1276 | } | |
1277 | /* | |
1278 | * Trace the following parameters on return with event-id 0x03120008. | |
1279 | * | |
1280 | * @vp->v_id: vnode-id of the file being decompressed. | |
1281 | * @bytes_read: amount of uncompressed bytes fetched in bytes. | |
1282 | * @err: value returned from this function. | |
1283 | * | |
1284 | * Please NOTE: @bytes_read can overflow in theory but here it is safe. | |
1285 | */ | |
1286 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_FETCH_UNCOMPRESSED_DATA, vp->v_id, | |
1287 | (int)*bytes_read, err); | |
b0d623f7 | 1288 | out: |
0a7de745 | 1289 | return err; |
b0d623f7 A |
1290 | } |
1291 | ||
1292 | static kern_return_t | |
1293 | commit_upl(upl_t upl, upl_offset_t pl_offset, size_t uplSize, int flags, int abort) | |
1294 | { | |
0a7de745 | 1295 | kern_return_t kr = 0; |
fe8ab488 A |
1296 | |
1297 | #if CONFIG_IOSCHED | |
0a7de745 | 1298 | upl_unmark_decmp(upl); |
fe8ab488 | 1299 | #endif /* CONFIG_IOSCHED */ |
0a7de745 A |
1300 | |
1301 | /* commit the upl pages */ | |
1302 | if (abort) { | |
1303 | VerboseLog("aborting upl, flags 0x%08x\n", flags); | |
f427ee49 | 1304 | kr = ubc_upl_abort_range(upl, pl_offset, (upl_size_t)uplSize, flags); |
0a7de745 A |
1305 | if (kr != KERN_SUCCESS) { |
1306 | ErrorLog("ubc_upl_abort_range error %d\n", (int)kr); | |
1307 | } | |
1308 | } else { | |
1309 | VerboseLog("committing upl, flags 0x%08x\n", flags | UPL_COMMIT_CLEAR_DIRTY); | |
f427ee49 | 1310 | kr = ubc_upl_commit_range(upl, pl_offset, (upl_size_t)uplSize, flags | UPL_COMMIT_CLEAR_DIRTY | UPL_COMMIT_WRITTEN_BY_KERNEL); |
0a7de745 A |
1311 | if (kr != KERN_SUCCESS) { |
1312 | ErrorLog("ubc_upl_commit_range error %d\n", (int)kr); | |
1313 | } | |
1314 | } | |
1315 | return kr; | |
b0d623f7 A |
1316 | } |
1317 | ||
fe8ab488 | 1318 | |
b0d623f7 A |
1319 | errno_t |
1320 | decmpfs_pagein_compressed(struct vnop_pagein_args *ap, int *is_compressed, decmpfs_cnode *cp) | |
1321 | { | |
0a7de745 A |
1322 | /* handles a page-in request from vfs for a compressed file */ |
1323 | ||
1324 | int err = 0; | |
1325 | vnode_t vp = ap->a_vp; | |
1326 | upl_t pl = ap->a_pl; | |
b0d623f7 | 1327 | upl_offset_t pl_offset = ap->a_pl_offset; |
0a7de745 A |
1328 | off_t f_offset = ap->a_f_offset; |
1329 | size_t size = ap->a_size; | |
b0d623f7 | 1330 | int flags = ap->a_flags; |
0a7de745 A |
1331 | off_t uplPos = 0; |
1332 | user_ssize_t uplSize = 0; | |
f427ee49 | 1333 | size_t verify_block_size = 0; |
b0d623f7 | 1334 | void *data = NULL; |
0a7de745 A |
1335 | decmpfs_header *hdr = NULL; |
1336 | uint64_t cachedSize = 0; | |
b0d623f7 | 1337 | int cmpdata_locked = 0; |
f427ee49 A |
1338 | bool file_tail_page_valid = false; |
1339 | int num_valid_pages = 0; | |
1340 | int num_invalid_pages = 0; | |
0a7de745 A |
1341 | |
1342 | if (!decmpfs_trylock_compressed_data(cp, 0)) { | |
1343 | return EAGAIN; | |
1344 | } | |
1345 | cmpdata_locked = 1; | |
1346 | ||
1347 | ||
b0d623f7 | 1348 | if (flags & ~(UPL_IOSYNC | UPL_NOCOMMIT | UPL_NORDAHEAD)) { |
3e170ce0 | 1349 | DebugLogWithPath("pagein: unknown flags 0x%08x\n", (flags & ~(UPL_IOSYNC | UPL_NOCOMMIT | UPL_NORDAHEAD))); |
b0d623f7 | 1350 | } |
0a7de745 A |
1351 | |
1352 | err = decmpfs_fetch_compressed_header(vp, cp, &hdr, 0); | |
1353 | if (err != 0) { | |
1354 | goto out; | |
1355 | } | |
1356 | ||
1357 | cachedSize = hdr->uncompressed_size; | |
1358 | ||
1359 | if (!compression_type_valid(vp, hdr)) { | |
1360 | /* compressor not registered */ | |
1361 | err = ENOTSUP; | |
1362 | goto out; | |
1363 | } | |
fe8ab488 | 1364 | |
f427ee49 A |
1365 | /* |
1366 | * If the verify block size is larger than the page size, the UPL needs | |
1367 | * to be aligned to it, Since the UPL has been created by the filesystem, | |
1368 | * we will only check if the passed in UPL length conforms to the | |
1369 | * alignment requirements. | |
1370 | */ | |
1371 | err = VNOP_VERIFY(vp, f_offset, NULL, 0, &verify_block_size, | |
1372 | VNODE_VERIFY_DEFAULT, NULL); | |
1373 | if (err) { | |
1374 | goto out; | |
1375 | } else if (verify_block_size) { | |
1376 | if (verify_block_size & (verify_block_size - 1)) { | |
1377 | ErrorLogWithPath("verify block size is not power of 2, no verification will be done\n"); | |
1378 | err = EINVAL; | |
1379 | } else if (size % verify_block_size) { | |
1380 | ErrorLogWithPath("upl size is not a multiple of verify block size\n"); | |
1381 | err = EINVAL; | |
1382 | } | |
1383 | if (err) { | |
1384 | goto out; | |
1385 | } | |
1386 | } | |
1387 | ||
fe8ab488 A |
1388 | #if CONFIG_IOSCHED |
1389 | /* Mark the UPL as the requesting UPL for decompression */ | |
1390 | upl_mark_decmp(pl); | |
1391 | #endif /* CONFIG_IOSCHED */ | |
1392 | ||
0a7de745 | 1393 | /* map the upl so we can fetch into it */ |
b0d623f7 A |
1394 | kern_return_t kr = ubc_upl_map(pl, (vm_offset_t*)&data); |
1395 | if ((kr != KERN_SUCCESS) || (data == NULL)) { | |
fe8ab488 | 1396 | err = ENOSPC; |
39037602 | 1397 | data = NULL; |
fe8ab488 A |
1398 | #if CONFIG_IOSCHED |
1399 | upl_unmark_decmp(pl); | |
0a7de745 | 1400 | #endif /* CONFIG_IOSCHED */ |
b0d623f7 A |
1401 | goto out; |
1402 | } | |
0a7de745 A |
1403 | |
1404 | uplPos = f_offset; | |
1405 | uplSize = size; | |
1406 | ||
1407 | /* clip the size to the size of the file */ | |
1408 | if ((uint64_t)uplPos + uplSize > cachedSize) { | |
1409 | /* truncate the read to the size of the file */ | |
f427ee49 | 1410 | uplSize = (user_ssize_t)(cachedSize - uplPos); |
0a7de745 A |
1411 | } |
1412 | ||
1413 | /* do the fetch */ | |
1414 | decmpfs_vector vec; | |
1415 | ||
b0d623f7 | 1416 | decompress: |
0a7de745 | 1417 | /* the mapped data pointer points to the first page of the page list, so we want to start filling in at an offset of pl_offset */ |
f427ee49 A |
1418 | vec = (decmpfs_vector) { |
1419 | .buf = (char*)data + pl_offset, | |
1420 | .size = size, | |
1421 | }; | |
0a7de745 A |
1422 | |
1423 | uint64_t did_read = 0; | |
b0d623f7 | 1424 | if (decmpfs_fast_get_state(cp) == FILE_IS_CONVERTING) { |
3e170ce0 | 1425 | ErrorLogWithPath("unexpected pagein during decompress\n"); |
b0d623f7 | 1426 | /* |
0a7de745 A |
1427 | * if the file is converting, this must be a recursive call to pagein from underneath a call to decmpfs_decompress_file; |
1428 | * pretend that it succeeded but don't do anything since we're just going to write over the pages anyway | |
b0d623f7 A |
1429 | */ |
1430 | err = 0; | |
b0d623f7 | 1431 | } else { |
f427ee49 A |
1432 | if (!verify_block_size || (verify_block_size <= PAGE_SIZE)) { |
1433 | err = decmpfs_fetch_uncompressed_data(vp, cp, hdr, uplPos, uplSize, 1, &vec, &did_read); | |
1434 | } else { | |
1435 | off_t l_uplPos = uplPos; | |
1436 | off_t l_pl_offset = pl_offset; | |
1437 | user_ssize_t l_uplSize = uplSize; | |
1438 | upl_page_info_t *pl_info = ubc_upl_pageinfo(pl); | |
1439 | ||
1440 | err = 0; | |
1441 | /* | |
1442 | * When the system page size is less than the "verify block size", | |
1443 | * the UPL passed may not consist solely of absent pages. | |
1444 | * We have to detect the "absent" pages and only decompress | |
1445 | * into those absent/invalid page ranges. | |
1446 | * | |
1447 | * Things that will change in each iteration of the loop : | |
1448 | * | |
1449 | * l_pl_offset = where we are inside the UPL [0, caller_upl_created_size) | |
1450 | * l_uplPos = the file offset the l_pl_offset corresponds to. | |
1451 | * l_uplSize = the size of the upl still unprocessed; | |
1452 | * | |
1453 | * In this picture, we have to do the transfer on 2 ranges | |
1454 | * (One 2 page range and one 3 page range) and the loop | |
1455 | * below will skip the first two pages and then identify | |
1456 | * the next two as invalid and fill those in and | |
1457 | * then skip the next one and then do the last pages. | |
1458 | * | |
1459 | * uplPos(file_offset) | |
1460 | * | uplSize | |
1461 | * 0 V<--------------> file_size | |
1462 | * |---------------------------------------------------> | |
1463 | * | | |V|V|I|I|V|I|I|I| | |
1464 | * ^ | |
1465 | * | upl | |
1466 | * <-------------------> | |
1467 | * | | |
1468 | * pl_offset | |
1469 | * | |
1470 | * uplSize will be clipped in case the UPL range exceeds | |
1471 | * the file size. | |
1472 | * | |
1473 | */ | |
1474 | while (l_uplSize) { | |
1475 | uint64_t l_did_read = 0; | |
1476 | int pl_offset_pg = (int)(l_pl_offset / PAGE_SIZE); | |
1477 | int pages_left_in_upl; | |
1478 | int start_pg; | |
1479 | int last_pg; | |
1480 | ||
1481 | /* | |
1482 | * l_uplSize may start off less than the size of the upl, | |
1483 | * we have to round it up to PAGE_SIZE to calculate | |
1484 | * how many more pages are left. | |
1485 | */ | |
1486 | pages_left_in_upl = (int)(round_page((vm_offset_t)l_uplSize) / PAGE_SIZE); | |
1487 | ||
1488 | /* | |
1489 | * scan from the beginning of the upl looking for the first | |
1490 | * non-valid page.... this will become the first page in | |
1491 | * the request we're going to make to | |
1492 | * 'decmpfs_fetch_uncompressed_data'... if all | |
1493 | * of the pages are valid, we won't call through | |
1494 | * to 'decmpfs_fetch_uncompressed_data' | |
1495 | */ | |
1496 | for (start_pg = 0; start_pg < pages_left_in_upl; start_pg++) { | |
1497 | if (!upl_valid_page(pl_info, pl_offset_pg + start_pg)) { | |
1498 | break; | |
1499 | } | |
1500 | } | |
1501 | ||
1502 | num_valid_pages += start_pg; | |
1503 | ||
1504 | /* | |
1505 | * scan from the starting invalid page looking for | |
1506 | * a valid page before the end of the upl is | |
1507 | * reached, if we find one, then it will be the | |
1508 | * last page of the request to 'decmpfs_fetch_uncompressed_data' | |
1509 | */ | |
1510 | for (last_pg = start_pg; last_pg < pages_left_in_upl; last_pg++) { | |
1511 | if (upl_valid_page(pl_info, pl_offset_pg + last_pg)) { | |
1512 | break; | |
1513 | } | |
1514 | } | |
1515 | ||
1516 | if (start_pg < last_pg) { | |
1517 | off_t inval_offset = start_pg * PAGE_SIZE; | |
1518 | int inval_pages = last_pg - start_pg; | |
1519 | int inval_size = inval_pages * PAGE_SIZE; | |
1520 | decmpfs_vector l_vec; | |
1521 | ||
1522 | num_invalid_pages += inval_pages; | |
1523 | if (inval_offset) { | |
1524 | did_read += inval_offset; | |
1525 | l_pl_offset += inval_offset; | |
1526 | l_uplPos += inval_offset; | |
1527 | l_uplSize -= inval_offset; | |
1528 | } | |
1529 | ||
1530 | l_vec = (decmpfs_vector) { | |
1531 | .buf = (char*)data + l_pl_offset, | |
1532 | .size = inval_size, | |
1533 | }; | |
1534 | ||
1535 | err = decmpfs_fetch_uncompressed_data(vp, cp, hdr, l_uplPos, | |
1536 | MIN(l_uplSize, inval_size), 1, &l_vec, &l_did_read); | |
1537 | ||
1538 | if (!err && (l_did_read != inval_size) && (l_uplSize > inval_size)) { | |
1539 | ErrorLogWithPath("Unexpected size fetch of decompressed data, l_uplSize = %d, l_did_read = %d, inval_size = %d\n", | |
1540 | (int)l_uplSize, (int)l_did_read, (int)inval_size); | |
1541 | err = EINVAL; | |
1542 | } | |
1543 | } else { | |
1544 | /* no invalid pages left */ | |
1545 | l_did_read = l_uplSize; | |
1546 | if (uplSize < size) { | |
1547 | file_tail_page_valid = true; | |
1548 | } | |
1549 | } | |
1550 | ||
1551 | if (err) { | |
1552 | break; | |
1553 | } | |
1554 | ||
1555 | did_read += l_did_read; | |
1556 | l_pl_offset += l_did_read; | |
1557 | l_uplPos += l_did_read; | |
1558 | l_uplSize -= l_did_read; | |
1559 | } | |
1560 | } | |
0a7de745 A |
1561 | } |
1562 | if (err) { | |
1563 | DebugLogWithPath("decmpfs_fetch_uncompressed_data err %d\n", err); | |
1564 | int cmp_state = decmpfs_fast_get_state(cp); | |
1565 | if (cmp_state == FILE_IS_CONVERTING) { | |
1566 | DebugLogWithPath("cmp_state == FILE_IS_CONVERTING\n"); | |
1567 | cmp_state = wait_for_decompress(cp); | |
1568 | if (cmp_state == FILE_IS_COMPRESSED) { | |
1569 | DebugLogWithPath("cmp_state == FILE_IS_COMPRESSED\n"); | |
1570 | /* a decompress was attempted but it failed, let's try calling fetch again */ | |
1571 | goto decompress; | |
1572 | } | |
1573 | } | |
1574 | if (cmp_state == FILE_IS_NOT_COMPRESSED) { | |
1575 | DebugLogWithPath("cmp_state == FILE_IS_NOT_COMPRESSED\n"); | |
1576 | /* the file was decompressed after we started reading it */ | |
1577 | *is_compressed = 0; /* instruct caller to fall back to its normal path */ | |
1578 | } | |
1579 | } | |
1580 | ||
1581 | /* zero out whatever we didn't read, and zero out the end of the last page(s) */ | |
1582 | uint64_t total_size = (size + (PAGE_SIZE - 1)) & ~(PAGE_SIZE - 1); | |
f427ee49 A |
1583 | if (did_read < total_size && !(verify_block_size && err)) { |
1584 | uint64_t rounded_up_did_read = file_tail_page_valid ? (uint64_t)(round_page((vm_offset_t)did_read)) : did_read; | |
1585 | memset((char*)vec.buf + rounded_up_did_read, 0, (size_t)(total_size - rounded_up_did_read)); | |
1586 | } | |
1587 | ||
1588 | if (!err && verify_block_size) { | |
1589 | size_t cur_verify_block_size = verify_block_size; | |
1590 | ||
1591 | if ((err = VNOP_VERIFY(vp, uplPos, vec.buf, size, &cur_verify_block_size, 0, NULL))) { | |
1592 | ErrorLogWithPath("Verification failed with error %d, uplPos = %lld, uplSize = %d, did_read = %d, total_size = %d, valid_pages = %d, invalid_pages = %d, tail_page_valid = %d\n", | |
1593 | err, (long long)uplPos, (int)uplSize, (int)did_read, (int)total_size, num_valid_pages, num_invalid_pages, file_tail_page_valid); | |
1594 | } | |
1595 | /* XXX : If the verify block size changes, redo the read */ | |
0a7de745 A |
1596 | } |
1597 | ||
fe8ab488 A |
1598 | #if CONFIG_IOSCHED |
1599 | upl_unmark_decmp(pl); | |
0a7de745 A |
1600 | #endif /* CONFIG_IOSCHED */ |
1601 | ||
b0d623f7 | 1602 | kr = ubc_upl_unmap(pl); data = NULL; /* make sure to set data to NULL so we don't try to unmap again below */ |
0a7de745 A |
1603 | if (kr != KERN_SUCCESS) { |
1604 | ErrorLogWithPath("ubc_upl_unmap error %d\n", (int)kr); | |
1605 | } else { | |
1606 | if (!err) { | |
1607 | /* commit our pages */ | |
f427ee49 | 1608 | kr = commit_upl(pl, pl_offset, (size_t)total_size, UPL_COMMIT_FREE_ON_EMPTY, 0); |
0a7de745 A |
1609 | } |
1610 | } | |
1611 | ||
b0d623f7 | 1612 | out: |
0a7de745 A |
1613 | if (data) { |
1614 | ubc_upl_unmap(pl); | |
1615 | } | |
1616 | if (hdr) { | |
1617 | FREE(hdr, M_TEMP); | |
1618 | } | |
1619 | if (cmpdata_locked) { | |
1620 | decmpfs_unlock_compressed_data(cp, 0); | |
1621 | } | |
1622 | if (err) { | |
39037602 | 1623 | #if 0 |
0a7de745 A |
1624 | if (err != ENXIO && err != ENOSPC) { |
1625 | char *path; | |
1626 | MALLOC(path, char *, PATH_MAX, M_TEMP, M_WAITOK); | |
1627 | panic("%s: decmpfs_pagein_compressed: err %d", vnpath(vp, path, PATH_MAX), err); | |
1628 | FREE(path, M_TEMP); | |
1629 | } | |
39037602 | 1630 | #endif /* 0 */ |
0a7de745 A |
1631 | ErrorLogWithPath("err %d\n", err); |
1632 | } | |
b0d623f7 A |
1633 | return err; |
1634 | } | |
1635 | ||
/*
 * decmpfs_read_compressed
 *
 * Services a VFS read (ap->a_uio on ap->a_vp) from a decmpfs-compressed file.
 *
 * Outline, as implemented below:
 *   1. Take the compressed-data lock and clip the request to the cached
 *      uncompressed size from decmpfs_cnode_get_vnode_cached_size().
 *   2. Let cluster_copy_ubc_data() satisfy whatever it already has.
 *   3. Fetch the compression header, reject unsupported compression types
 *      with ENOTSUP, and let the decompressor's adjust_fetch hook (if any)
 *      move/resize the region to fetch.
 *   4. Ask VNOP_VERIFY for a verify block size; a power-of-two size larger
 *      than PAGE_SIZE becomes the alignment used for the region.
 *   5. Walk the aligned region in chunks of at most MAX_UPL_SIZE_BYTES:
 *      create and map a UPL, decompress into it, zero the unread tail,
 *      optionally verify, copy the overlapping bytes into the uio, then
 *      commit (or abort) the UPL.
 *
 * ap:            read arguments; only a_uio and a_vp are used here.
 * is_compressed: set to 0 when the file turns out to have been decompressed
 *                while the read was in progress, telling the caller to fall
 *                back to its normal read path.
 * cp:            decmpfs state for the vnode.
 *
 * Returns 0 on success or an errno value.
 */
0a7de745 | 1636 | errno_t
b0d623f7 A |
1637 | decmpfs_read_compressed(struct vnop_read_args *ap, int *is_compressed, decmpfs_cnode *cp) | |
1638 | { | |
0a7de745 A |
1639 | /* handles a read request from vfs for a compressed file */ | |
1640 | ||
1641 | uio_t uio = ap->a_uio; | |
1642 | vnode_t vp = ap->a_vp; | |
1643 | int err = 0; | |
1644 | int countInt = 0; | |
1645 | off_t uplPos = 0; | |
1646 | user_ssize_t uplSize = 0; | |
1647 | user_ssize_t uplRemaining = 0; | |
1648 | off_t curUplPos = 0; | |
1649 | user_ssize_t curUplSize = 0; | |
1650 | kern_return_t kr = KERN_SUCCESS; | |
1651 | int abort_read = 0; | |
1652 | void *data = NULL; | |
1653 | uint64_t did_read = 0; | |
1654 | upl_t upl = NULL; | |
1655 | upl_page_info_t *pli = NULL; | |
1656 | decmpfs_header *hdr = NULL; | |
1657 | uint64_t cachedSize = 0; | |
1658 | off_t uioPos = 0; | |
1659 | user_ssize_t uioRemaining = 0; | |
f427ee49 A |
1660 | size_t verify_block_size = 0; | |
1661 | size_t alignment_size = PAGE_SIZE; | |
b0d623f7 | 1662 | int cmpdata_locked = 0;
0a7de745 | 1663 |
/* lock mode argument is 0 here and 1 in decmpfs_decompress_file; presumably shared vs. exclusive -- TODO confirm */
b0d623f7 | 1664 | decmpfs_lock_compressed_data(cp, 0); cmpdata_locked = 1;
0a7de745 A |
1665 | ||
1666 | uplPos = uio_offset(uio); | |
1667 | uplSize = uio_resid(uio); | |
1668 | VerboseLogWithPath("uplPos %lld uplSize %lld\n", uplPos, uplSize); | |
1669 | ||
1670 | cachedSize = decmpfs_cnode_get_vnode_cached_size(cp); | |
1671 | ||
1672 | if ((uint64_t)uplPos + uplSize > cachedSize) { | |
1673 | /* truncate the read to the size of the file */ | |
f427ee49 | 1674 | uplSize = (user_ssize_t)(cachedSize - uplPos);
0a7de745 A |
1675 | } | |
1676 | ||
1677 | /* give the cluster layer a chance to fill in whatever it already has */ | |
f427ee49 | 1678 | countInt = (uplSize > INT_MAX) ? INT_MAX : (int)uplSize;
0a7de745 A |
1679 | err = cluster_copy_ubc_data(vp, uio, &countInt, 0); | |
1680 | if (err != 0) { | |
1681 | goto out; | |
1682 | } | |
1683 | ||
1684 | /* figure out what's left */ | |
1685 | uioPos = uio_offset(uio); | |
1686 | uioRemaining = uio_resid(uio); | |
1687 | if ((uint64_t)uioPos + uioRemaining > cachedSize) { | |
1688 | /* truncate the read to the size of the file */ | |
f427ee49 | 1689 | uioRemaining = (user_ssize_t)(cachedSize - uioPos);
0a7de745 A |
1690 | } | |
1691 | ||
1692 | if (uioRemaining <= 0) { | |
1693 | /* nothing left */ | |
1694 | goto out; | |
1695 | } | |
1696 | ||
1697 | err = decmpfs_fetch_compressed_header(vp, cp, &hdr, 0); | |
1698 | if (err != 0) { | |
1699 | goto out; | |
1700 | } | |
1701 | if (!compression_type_valid(vp, hdr)) { | |
1702 | err = ENOTSUP; | |
1703 | goto out; | |
1704 | } | |
1705 | ||
1706 | uplPos = uioPos; | |
1707 | uplSize = uioRemaining; | |
b0d623f7 | 1708 | #if COMPRESSION_DEBUG
0a7de745 | 1709 | DebugLogWithPath("uplPos %lld uplSize %lld\n", (uint64_t)uplPos, (uint64_t)uplSize);
b0d623f7 | 1710 | #endif
0a7de745 A |
1711 | ||
/* the decompressor table is consulted under the shared decompressorsLock */
1712 | lck_rw_lock_shared(decompressorsLock); | |
1713 | decmpfs_adjust_fetch_region_func adjust_fetch = decmp_get_func(vp, hdr->compression_type, adjust_fetch); | |
1714 | if (adjust_fetch) { | |
1715 | /* give the compressor a chance to adjust the portion of the file that we read */ | |
b0d623f7 | 1716 | adjust_fetch(vp, decmpfs_ctx, hdr, &uplPos, &uplSize);
0a7de745 A |
1717 | VerboseLogWithPath("adjusted uplPos %lld uplSize %lld\n", (uint64_t)uplPos, (uint64_t)uplSize); | |
1718 | } | |
1719 | lck_rw_unlock_shared(decompressorsLock); | |
1720 | ||
1721 | /* clip the adjusted size to the size of the file */ | |
1722 | if ((uint64_t)uplPos + uplSize > cachedSize) { | |
1723 | /* truncate the read to the size of the file */ | |
f427ee49 | 1724 | uplSize = (user_ssize_t)(cachedSize - uplPos);
0a7de745 A |
1725 | } | |
1726 | ||
1727 | if (uplSize <= 0) { | |
1728 | /* nothing left */ | |
1729 | goto out; | |
1730 | } | |
1731 | ||
1732 | /* | |
1733 | * since we're going to create a upl for the given region of the file, | |
1734 | * make sure we're on page boundaries | |
1735 | */ | |
1736 | ||
f427ee49 A |
1737 | /* If the verify block size is larger than the page size, the UPL needs to be aligned to it */ | |
1738 | err = VNOP_VERIFY(vp, uplPos, NULL, 0, &verify_block_size, VNODE_VERIFY_DEFAULT, NULL); | |
1739 | if (err) { | |
1740 | goto out; | |
1741 | } else if (verify_block_size) { | |
1742 | if (verify_block_size & (verify_block_size - 1)) { | |
1743 | ErrorLogWithPath("verify block size is not power of 2, no verification will be done\n"); | |
1744 | verify_block_size = 0; | |
1745 | } else if (verify_block_size > PAGE_SIZE) { | |
1746 | alignment_size = verify_block_size; | |
1747 | } | |
1748 | } | |
1749 | ||
1750 | if (uplPos & (alignment_size - 1)) { | |
0a7de745 | 1751 | /* round position down to an alignment_size boundary, growing the size by the same amount */
f427ee49 A |
1752 | uplSize += (uplPos & (alignment_size - 1)); | |
1753 | uplPos &= ~(alignment_size - 1); | |
0a7de745 | 1754 | }
f427ee49 A |
1755 | ||
1756 | /* round size up to a multiple of alignment_size */ | |
1757 | uplSize = (uplSize + (alignment_size - 1)) & ~(alignment_size - 1); | |
0a7de745 A |
1758 | ||
1759 | VerboseLogWithPath("new uplPos %lld uplSize %lld\n", (uint64_t)uplPos, (uint64_t)uplSize); | |
fe8ab488 | 1760 |
0a7de745 A |
1761 | uplRemaining = uplSize; | |
1762 | curUplPos = uplPos; | |
1763 | curUplSize = 0; | |
fe8ab488 | 1764 |
/* one iteration per UPL; curUplSize is 0 on the first pass so curUplPos starts at uplPos */
0a7de745 A |
1765 | while (uplRemaining > 0) { | |
1766 | /* start after the last upl */ | |
1767 | curUplPos += curUplSize; | |
1768 | ||
1769 | /* clip to max upl size */ | |
1770 | curUplSize = uplRemaining; | |
1771 | if (curUplSize > MAX_UPL_SIZE_BYTES) { | |
1772 | curUplSize = MAX_UPL_SIZE_BYTES; | |
1773 | } | |
1774 | ||
1775 | /* create the upl */ | |
f427ee49 | 1776 | kr = ubc_create_upl_kernel(vp, curUplPos, (int)curUplSize, &upl, &pli, UPL_SET_LITE, VM_KERN_MEMORY_FILE);
0a7de745 A |
1777 | if (kr != KERN_SUCCESS) { | |
1778 | ErrorLogWithPath("ubc_create_upl error %d\n", (int)kr); | |
1779 | err = EINVAL; | |
1780 | goto out; | |
1781 | } | |
1782 | VerboseLogWithPath("curUplPos %lld curUplSize %lld\n", (uint64_t)curUplPos, (uint64_t)curUplSize); | |
1783 | ||
1784 | #if CONFIG_IOSCHED | |
1785 | /* Mark the UPL as the requesting UPL for decompression */ | |
1786 | upl_mark_decmp(upl); | |
1787 | #endif /* CONFIG_IOSCHED */ | |
1788 | ||
1789 | /* map the upl */ | |
1790 | kr = ubc_upl_map(upl, (vm_offset_t*)&data); | |
1791 | if (kr != KERN_SUCCESS) { | |
/* the UPL is aborted before bailing out so it is not left pending */
1792 | commit_upl(upl, 0, curUplSize, UPL_ABORT_FREE_ON_EMPTY, 1); | |
39037602 | 1793 | #if 0
0a7de745 A |
1794 | char *path; | |
1795 | MALLOC(path, char *, PATH_MAX, M_TEMP, M_WAITOK); | |
1796 | panic("%s: decmpfs_read_compressed: ubc_upl_map error %d", vnpath(vp, path, PATH_MAX), (int)kr); | |
1797 | FREE(path, M_TEMP); | |
39037602 | 1798 | #else /* 0 */
0a7de745 | 1799 | ErrorLogWithPath("ubc_upl_map kr=0x%x\n", (int)kr);
39037602 | 1800 | #endif /* 0 */
0a7de745 A |
1801 | err = EINVAL; | |
1802 | goto out; | |
1803 | } | |
1804 | ||
1805 | /* make sure the map succeeded */ | |
1806 | if (!data) { | |
1807 | commit_upl(upl, 0, curUplSize, UPL_ABORT_FREE_ON_EMPTY, 1); | |
1808 | ||
1809 | ErrorLogWithPath("ubc_upl_map mapped null\n"); | |
1810 | err = EINVAL; | |
1811 | goto out; | |
1812 | } | |
1813 | ||
1814 | /* fetch uncompressed data into the mapped upl */ | |
1815 | decmpfs_vector vec; | |
/* retry target: re-entered when a concurrent conversion attempt ended with the file still compressed */
1816 | decompress: | |
1817 | vec = (decmpfs_vector){ .buf = data, .size = curUplSize }; | |
1818 | err = decmpfs_fetch_uncompressed_data(vp, cp, hdr, curUplPos, curUplSize, 1, &vec, &did_read); | |
1819 | if (err) { | |
1820 | ErrorLogWithPath("decmpfs_fetch_uncompressed_data err %d\n", err); | |
1821 | ||
1822 | /* maybe the file is converting to decompressed */ | |
1823 | int cmp_state = decmpfs_fast_get_state(cp); | |
1824 | if (cmp_state == FILE_IS_CONVERTING) { | |
1825 | ErrorLogWithPath("cmp_state == FILE_IS_CONVERTING\n"); | |
1826 | cmp_state = wait_for_decompress(cp); | |
1827 | if (cmp_state == FILE_IS_COMPRESSED) { | |
1828 | ErrorLogWithPath("cmp_state == FILE_IS_COMPRESSED\n"); | |
1829 | /* a decompress was attempted but it failed, let's try fetching again */ | |
1830 | goto decompress; | |
1831 | } | |
1832 | } | |
1833 | if (cmp_state == FILE_IS_NOT_COMPRESSED) { | |
1834 | ErrorLogWithPath("cmp_state == FILE_IS_NOT_COMPRESSED\n"); | |
1835 | /* the file was decompressed after we started reading it */ | |
1836 | abort_read = 1; /* we're not going to commit our data */ | |
1837 | *is_compressed = 0; /* instruct caller to fall back to its normal path */ | |
1838 | } | |
/* kr assigned here is overwritten by ubc_upl_unmap() below; did_read = 0 makes the memset below zero the whole UPL */
/*
 * NOTE(review): if the fetch failed and the state is not FILE_IS_NOT_COMPRESSED,
 * abort_read stays 0, so the zero-filled UPL is copied to the uio and committed
 * below, and err is replaced by the result of cluster_copy_upl_data().
 * Confirm that this is the intended handling of a fetch failure.
 */
1839 | kr = KERN_FAILURE; | |
1840 | did_read = 0; | |
1841 | } | |
f427ee49 | 1842 |
0a7de745 | 1843 | /* zero out everything in this UPL past the bytes the fetch produced */
f427ee49 A |
1844 | memset((char*)data + did_read, 0, (size_t)(curUplSize - did_read)); | |
1845 | if (!err && verify_block_size) { | |
1846 | size_t cur_verify_block_size = verify_block_size; | |
1847 | ||
1848 | if ((err = VNOP_VERIFY(vp, curUplPos, data, curUplSize, &cur_verify_block_size, 0, NULL))) { | |
1849 | ErrorLogWithPath("Verification failed with error %d\n", err); | |
1850 | abort_read = 1; | |
1851 | } | |
1852 | /* XXX : If the verify block size changes, redo the read */ | |
1853 | } | |
1854 | ||
0a7de745 A |
1855 | kr = ubc_upl_unmap(upl); | |
1856 | if (kr == KERN_SUCCESS) { | |
1857 | if (abort_read) { | |
b0d623f7 | 1858 | kr = commit_upl(upl, 0, curUplSize, UPL_ABORT_FREE_ON_EMPTY, 1);
0a7de745 A |
1859 | } else { | |
1860 | VerboseLogWithPath("uioPos %lld uioRemaining %lld\n", (uint64_t)uioPos, (uint64_t)uioRemaining); | |
1861 | if (uioRemaining) { | |
/* uplOff: where the caller's next byte sits inside this UPL */
1862 | off_t uplOff = uioPos - curUplPos; | |
1863 | if (uplOff < 0) { | |
1864 | ErrorLogWithPath("uplOff %lld should never be negative\n", (int64_t)uplOff); | |
1865 | err = EINVAL; | |
f427ee49 A |
1866 | } else if (uplOff > INT_MAX) { | |
1867 | ErrorLogWithPath("uplOff %lld too large\n", (int64_t)uplOff); | |
1868 | err = EINVAL; | |
0a7de745 A |
1869 | } else { | |
/* count: bytes of this UPL that lie at or after uioPos */
1870 | off_t count = curUplPos + curUplSize - uioPos; | |
1871 | if (count < 0) { | |
1872 | /* this upl is entirely before the uio */ | |
1873 | } else { | |
1874 | if (count > uioRemaining) { | |
1875 | count = uioRemaining; | |
1876 | } | |
f427ee49 A |
1877 | int icount = (count > INT_MAX) ? INT_MAX : (int)count; | |
1878 | int io_resid = icount; | |
1879 | err = cluster_copy_upl_data(uio, upl, (int)uplOff, &io_resid); | |
/* io_resid is used as "bytes not copied", so the difference is what reached the uio */
1880 | int copied = icount - io_resid; | |
0a7de745 A |
1881 | VerboseLogWithPath("uplOff %lld count %lld copied %lld\n", (uint64_t)uplOff, (uint64_t)count, (uint64_t)copied); | |
1882 | if (err) { | |
1883 | ErrorLogWithPath("cluster_copy_upl_data err %d\n", err); | |
1884 | } | |
1885 | uioPos += copied; | |
1886 | uioRemaining -= copied; | |
1887 | } | |
1888 | } | |
1889 | } | |
/* the UPL is committed even when the copy reported an error; the error is acted on right after */
b0d623f7 | 1890 | kr = commit_upl(upl, 0, curUplSize, UPL_COMMIT_FREE_ON_EMPTY | UPL_COMMIT_INACTIVATE, 0);
0a7de745 A |
1891 | if (err) { | |
1892 | goto out; | |
1893 | } | |
1894 | } | |
1895 | } else { | |
1896 | ErrorLogWithPath("ubc_upl_unmap error %d\n", (int)kr); | |
1897 | } | |
1898 | ||
/*
 * NOTE(review): abort_read is never cleared, so once it is set every later UPL
 * in this loop is aborted too, and err from this iteration is overwritten by
 * the next decmpfs_fetch_uncompressed_data() call.
 */
1899 | uplRemaining -= curUplSize; | |
1900 | } | |
1901 | ||
b0d623f7 | 1902 | out:
fe8ab488 | 1903 |
0a7de745 A |
1904 | if (hdr) { | |
1905 | FREE(hdr, M_TEMP); | |
1906 | } | |
1907 | if (cmpdata_locked) { | |
1908 | decmpfs_unlock_compressed_data(cp, 0); | |
1909 | } | |
1910 | if (err) {/* something went wrong */ | |
1911 | ErrorLogWithPath("err %d\n", err); | |
1912 | return err; | |
1913 | } | |
1914 | ||
b0d623f7 | 1915 | #if COMPRESSION_DEBUG
0a7de745 A |
1916 | uplSize = uio_resid(uio); | |
1917 | if (uplSize) { | |
1918 | VerboseLogWithPath("still %lld bytes to copy\n", uplSize); | |
1919 | } | |
b0d623f7 | 1920 | #endif
0a7de745 | 1921 | return 0;
b0d623f7 A |
1922 | } | |
1923 | ||
1924 | int | |
1925 | decmpfs_free_compressed_data(vnode_t vp, decmpfs_cnode *cp) | |
1926 | { | |
0a7de745 A |
1927 | /* |
1928 | * call out to the decompressor to free remove any data associated with this compressed file | |
1929 | * then delete the file's compression xattr | |
1930 | */ | |
1931 | decmpfs_header *hdr = NULL; | |
1932 | ||
1933 | /* | |
1934 | * Trace the following parameters on entry with event-id 0x03120010. | |
1935 | * | |
1936 | * @vp->v_id: vnode-id of the file for which to free compressed data. | |
1937 | */ | |
1938 | DECMPFS_EMIT_TRACE_ENTRY(DECMPDBG_FREE_COMPRESSED_DATA, vp->v_id); | |
1939 | ||
1940 | int err = decmpfs_fetch_compressed_header(vp, cp, &hdr, 0); | |
1941 | if (err) { | |
1942 | ErrorLogWithPath("decmpfs_fetch_compressed_header err %d\n", err); | |
1943 | } else { | |
1944 | lck_rw_lock_shared(decompressorsLock); | |
1945 | decmpfs_free_compressed_data_func free_data = decmp_get_func(vp, hdr->compression_type, free_data); | |
1946 | if (free_data) { | |
b0d623f7 | 1947 | err = free_data(vp, decmpfs_ctx, hdr); |
0a7de745 A |
1948 | } else { |
1949 | /* nothing to do, so no error */ | |
1950 | err = 0; | |
1951 | } | |
1952 | lck_rw_unlock_shared(decompressorsLock); | |
1953 | ||
1954 | if (err != 0) { | |
1955 | ErrorLogWithPath("decompressor err %d\n", err); | |
1956 | } | |
1957 | } | |
1958 | /* | |
1959 | * Trace the following parameters on return with event-id 0x03120010. | |
1960 | * | |
1961 | * @vp->v_id: vnode-id of the file for which to free compressed data. | |
1962 | * @err: value returned from this function. | |
1963 | */ | |
1964 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_FREE_COMPRESSED_DATA, vp->v_id, err); | |
1965 | ||
1966 | /* delete the xattr */ | |
b0d623f7 | 1967 | err = vn_removexattr(vp, DECMPFS_XATTR_NAME, 0, decmpfs_ctx); |
0a7de745 A |
1968 | if (err != 0) { |
1969 | goto out; | |
1970 | } | |
1971 | ||
b0d623f7 | 1972 | out: |
0a7de745 A |
1973 | if (hdr) { |
1974 | FREE(hdr, M_TEMP); | |
1975 | } | |
1976 | return err; | |
b0d623f7 A |
1977 | } |
1978 | ||
1979 | #pragma mark --- file conversion routines --- | |
1980 | ||
1981 | static int | |
1982 | unset_compressed_flag(vnode_t vp) | |
1983 | { | |
0a7de745 A |
1984 | int err = 0; |
1985 | struct vnode_attr va; | |
1986 | int new_bsdflags = 0; | |
1987 | ||
1988 | VATTR_INIT(&va); | |
1989 | VATTR_WANTED(&va, va_flags); | |
b0d623f7 | 1990 | err = vnode_getattr(vp, &va, decmpfs_ctx); |
0a7de745 A |
1991 | |
1992 | if (err != 0) { | |
1993 | ErrorLogWithPath("vnode_getattr err %d\n", err); | |
1994 | } else { | |
1995 | new_bsdflags = va.va_flags & ~UF_COMPRESSED; | |
1996 | ||
1997 | VATTR_INIT(&va); | |
1998 | VATTR_SET(&va, va_flags, new_bsdflags); | |
b0d623f7 | 1999 | err = vnode_setattr(vp, &va, decmpfs_ctx); |
0a7de745 A |
2000 | if (err != 0) { |
2001 | ErrorLogWithPath("vnode_setattr err %d\n", err); | |
2002 | } | |
2003 | } | |
2004 | return err; | |
b0d623f7 A |
2005 | } |
2006 | ||
/*
 * decmpfs_decompress_file
 *
 * Converts a compressed file into an uncompressed one by decompressing up to
 * toSize bytes and writing them into the data fork with VNOP_WRITE.
 *
 * vp:            vnode of the file to convert.
 * cp:            decmpfs state for vp.
 * toSize:        number of bytes to decompress; -1 means the header's
 *                uncompressed_size, 0 skips decompression entirely, and
 *                values larger than uncompressed_size are clamped to it.
 * truncate_okay: when nonzero, a failed VNOP_WRITE is followed by
 *                vnode_setsize(vp, 0, ...) to discard what was written.
 * skiplock:      when nonzero the compressed-data lock is not taken here
 *                (per the trace comment below, it is already held).
 *
 * Data is moved through a temporary buffer of at most 64 KiB. On success the
 * UF_COMPRESSED flag is cleared, the compressed data is freed and the state
 * becomes FILE_IS_NOT_COMPRESSED. On failure the state is reset to
 * FILE_TYPE_UNKNOWN and, if uncompressed_size is nonzero, the UBC size is set
 * to 0 and then back to uncompressed_size. Whenever the state is updated,
 * waiters on decompress_channel are woken.
 *
 * Returns 0 on success (including when the file was already decompressed),
 * otherwise an errno value.
 */
2007 | int | |
2008 | decmpfs_decompress_file(vnode_t vp, decmpfs_cnode *cp, off_t toSize, int truncate_okay, int skiplock) | |
2009 | { | |
2010 | /* convert a compressed file to an uncompressed file */ | |
0a7de745 | 2011 |
b0d623f7 A |
2012 | int err = 0; | |
2013 | char *data = NULL; | |
2014 | uio_t uio_w = 0; | |
2015 | off_t offset = 0; | |
2016 | uint32_t old_state = 0; | |
2017 | uint32_t new_state = 0; | |
2018 | int update_file_state = 0; | |
f427ee49 | 2019 | size_t allocSize = 0;
d9a64523 | 2020 | decmpfs_header *hdr = NULL;
b0d623f7 A |
2021 | int cmpdata_locked = 0; | |
2022 | off_t remaining = 0; | |
2023 | uint64_t uncompressed_size = 0; | |
d9a64523 A |
2024 | ||
2025 | /* | |
2026 | * Trace the following parameters on entry with event-id 0x03120000. | |
2027 | * | |
2028 | * @vp->v_id: vnode-id of the file being decompressed. | |
2029 | * @toSize: uncompress given bytes of the file. | |
2030 | * @truncate_okay: on error it is OK to truncate. | |
2031 | * @skiplock: compressed data is locked, skip locking again. | |
2032 | * | |
2033 | * Please NOTE: @toSize can overflow in theory but here it is safe. | |
2034 | */ | |
2035 | DECMPFS_EMIT_TRACE_ENTRY(DECMPDBG_DECOMPRESS_FILE, vp->v_id, | |
0a7de745 A |
2036 | (int)toSize, truncate_okay, skiplock); | |
2037 | ||
b0d623f7 A |
2038 | if (!skiplock) { | |
2039 | decmpfs_lock_compressed_data(cp, 1); cmpdata_locked = 1; | |
2040 | } | |
0a7de745 | 2041 |
/* re-entered from the FILE_TYPE_UNKNOWN case after the state has been refreshed */
b0d623f7 A |
2042 | decompress: | |
2043 | old_state = decmpfs_fast_get_state(cp); | |
0a7de745 A |
2044 | ||
2045 | switch (old_state) { | |
2046 | case FILE_IS_NOT_COMPRESSED: | |
2047 | { | |
2048 | /* someone else decompressed the file */ | |
2049 | err = 0; | |
2050 | goto out; | |
2051 | } | |
2052 | ||
2053 | case FILE_TYPE_UNKNOWN: | |
2054 | { | |
2055 | /* the file is in an unknown state, so update the state and retry */ | |
2056 | (void)decmpfs_file_is_compressed(vp, cp); | |
2057 | ||
/* NOTE(review): no retry bound here; this relies on the call above moving the state off FILE_TYPE_UNKNOWN -- confirm */
2058 | /* try again */ | |
2059 | goto decompress; | |
2060 | } | |
2061 | ||
2062 | case FILE_IS_COMPRESSED: | |
2063 | { | |
2064 | /* the file is compressed, so decompress it */ | |
2065 | break; | |
2066 | } | |
2067 | ||
2068 | default: | |
2069 | { | |
2070 | /* | |
2071 | * this shouldn't happen since multiple calls to decmpfs_decompress_file lock each other out, | |
2072 | * and when decmpfs_decompress_file returns, the state should always be set back to | |
2073 | * FILE_IS_NOT_COMPRESSED or FILE_TYPE_UNKNOWN | |
2074 | */ | |
2075 | err = EINVAL; | |
2076 | goto out; | |
b0d623f7 | 2077 | }
0a7de745 A |
2078 | } | |
2079 | ||
2080 | err = decmpfs_fetch_compressed_header(vp, cp, &hdr, 0); | |
b0d623f7 A |
2081 | if (err != 0) { | |
2082 | goto out; | |
2083 | } | |
0a7de745 | 2084 |
/* remembered so the failure path at "out" can restore the UBC size */
b0d623f7 | 2085 | uncompressed_size = hdr->uncompressed_size;
0a7de745 | 2086 | if (toSize == -1) {
b0d623f7 | 2087 | toSize = hdr->uncompressed_size;
0a7de745 A |
2088 | } | |
2089 | ||
b0d623f7 A |
2090 | if (toSize == 0) { | |
2091 | /* special case truncating the file to zero bytes */ | |
2092 | goto nodecmp; | |
2093 | } else if ((uint64_t)toSize > hdr->uncompressed_size) { | |
2094 | /* the caller is trying to grow the file, so we should decompress all the data */ | |
2095 | toSize = hdr->uncompressed_size; | |
2096 | } | |
0a7de745 | 2097 |
/* bounce buffer: at most 64 KiB, smaller when the whole request is smaller */
f427ee49 | 2098 | allocSize = MIN(64 * 1024, (size_t)toSize);
b0d623f7 A |
2099 | MALLOC(data, char *, allocSize, M_TEMP, M_WAITOK); | |
2100 | if (!data) { | |
2101 | err = ENOMEM; | |
2102 | goto out; | |
2103 | } | |
0a7de745 | 2104 |
b0d623f7 A |
2105 | uio_w = uio_create(1, 0LL, UIO_SYSSPACE, UIO_WRITE); | |
2106 | if (!uio_w) { | |
2107 | err = ENOMEM; | |
2108 | goto out; | |
2109 | } | |
2110 | uio_w->uio_flags |= UIO_FLAGS_IS_COMPRESSED_FILE; | |
0a7de745 | 2111 |
b0d623f7 | 2112 | remaining = toSize;
0a7de745 | 2113 |
b0d623f7 A |
2114 | /* tell the buffer cache that this is an empty file */ | |
2115 | ubc_setsize(vp, 0); | |
0a7de745 | 2116 |
b0d623f7 A |
2117 | /* if we got here, we need to decompress the file */ | |
2118 | decmpfs_cnode_set_vnode_state(cp, FILE_IS_CONVERTING, 1); | |
0a7de745 A |
2119 | ||
2120 | while (remaining > 0) { | |
b0d623f7 | 2121 | /* loop decompressing data from the file and writing it into the data fork */
0a7de745 | 2122 |
b0d623f7 | 2123 | uint64_t bytes_read = 0;
f427ee49 | 2124 | decmpfs_vector vec = { .buf = data, .size = (user_ssize_t)MIN(allocSize, remaining) };
316670eb | 2125 | err = decmpfs_fetch_uncompressed_data(vp, cp, hdr, offset, vec.size, 1, &vec, &bytes_read);
b0d623f7 | 2126 | if (err != 0) {
3e170ce0 | 2127 | ErrorLogWithPath("decmpfs_fetch_uncompressed_data err %d\n", err);
/* NOTE(review): jumps straight to out, so the truncate_okay handling below is skipped for fetch failures */
b0d623f7 A |
2128 | goto out; | |
2129 | } | |
0a7de745 | 2130 |
b0d623f7 A |
2131 | if (bytes_read == 0) { | |
2132 | /* we're done reading data */ | |
2133 | break; | |
2134 | } | |
0a7de745 | 2135 |
/* re-aim the single-iovec write uio at the chunk just decompressed */
b0d623f7 | 2136 | uio_reset(uio_w, offset, UIO_SYSSPACE, UIO_WRITE);
f427ee49 | 2137 | err = uio_addiov(uio_w, CAST_USER_ADDR_T(data), (user_size_t)bytes_read);
b0d623f7 | 2138 | if (err != 0) {
3e170ce0 | 2139 | ErrorLogWithPath("uio_addiov err %d\n", err);
b0d623f7 A |
2140 | err = ENOMEM; | |
2141 | goto out; | |
2142 | } | |
0a7de745 | 2143 |
b0d623f7 A |
2144 | err = VNOP_WRITE(vp, uio_w, 0, decmpfs_ctx); | |
2145 | if (err != 0) { | |
2146 | /* if the write failed, truncate the file to zero bytes */ | |
3e170ce0 | 2147 | ErrorLogWithPath("VNOP_WRITE err %d\n", err);
b0d623f7 A |
2148 | break; | |
2149 | } | |
2150 | offset += bytes_read; | |
2151 | remaining -= bytes_read; | |
2152 | } | |
0a7de745 | 2153 |
b0d623f7 A |
2154 | if (err == 0) { | |
/* a short result (fetch returned 0 bytes early) is treated as an error */
2155 | if (offset != toSize) { | |
3e170ce0 | 2156 | ErrorLogWithPath("file decompressed to %lld instead of %lld\n", offset, toSize);
b0d623f7 A |
2157 | err = EINVAL; | |
2158 | goto out; | |
2159 | } | |
2160 | } | |
0a7de745 | 2161 |
b0d623f7 A |
2162 | if (err == 0) { | |
2163 | /* sync the data and metadata */ | |
2164 | err = VNOP_FSYNC(vp, MNT_WAIT, decmpfs_ctx); | |
2165 | if (err != 0) { | |
3e170ce0 | 2166 | ErrorLogWithPath("VNOP_FSYNC err %d\n", err);
b0d623f7 A |
2167 | goto out; | |
2168 | } | |
2169 | } | |
0a7de745 | 2170 |
/* as written, only a VNOP_WRITE failure (the break above) reaches this block; the other failures jump to out directly */
b0d623f7 A |
2171 | if (err != 0) { | |
2172 | /* write, setattr, or fsync failed */ | |
3e170ce0 | 2173 | ErrorLogWithPath("aborting decompress, err %d\n", err);
b0d623f7 A |
2174 | if (truncate_okay) { | |
2175 | /* truncate anything we might have written */ | |
2176 | int error = vnode_setsize(vp, 0, 0, decmpfs_ctx); | |
3e170ce0 | 2177 | ErrorLogWithPath("vnode_setsize err %d\n", error);
b0d623f7 A |
2178 | } | |
2179 | goto out; | |
2180 | } | |
0a7de745 | 2181 |
b0d623f7 A |
2182 | nodecmp: | |
2183 | /* if we're truncating the file to zero bytes, we'll skip ahead to here */ | |
0a7de745 | 2184 |
b0d623f7 A |
2185 | /* unset the compressed flag */ | |
2186 | unset_compressed_flag(vp); | |
0a7de745 | 2187 |
b0d623f7 A |
2188 | /* free the compressed data associated with this file */ | |
2189 | err = decmpfs_free_compressed_data(vp, cp); | |
2190 | if (err != 0) { | |
3e170ce0 | 2191 | ErrorLogWithPath("decmpfs_free_compressed_data err %d\n", err);
b0d623f7 | 2192 | }
0a7de745 | 2193 |
b0d623f7 | 2194 | /*
0a7de745 A |
2195 | * even if free_compressed_data or vnode_getattr/vnode_setattr failed, return success | |
2196 | * since we succeeded in writing all of the file data to the data fork | |
b0d623f7 A |
2197 | */ | |
2198 | err = 0; | |
0a7de745 | 2199 |
b0d623f7 A |
2200 | /* if we got this far, the file was successfully decompressed */ | |
2201 | update_file_state = 1; | |
2202 | new_state = FILE_IS_NOT_COMPRESSED; | |
0a7de745 | 2203 |
b0d623f7 A |
2204 | #if COMPRESSION_DEBUG | |
2205 | { | |
2206 | uint64_t filesize = 0; | |
2207 | vnsize(vp, &filesize); | |
3e170ce0 | 2208 | DebugLogWithPath("new file size %lld\n", filesize);
b0d623f7 A |
2209 | } | |
2210 | #endif | |
0a7de745 | 2211 |
/* common exit: release temporaries, publish the final state, drop the lock if it was taken here */
b0d623f7 | 2212 | out:
0a7de745 A |
2213 | if (hdr) { | |
2214 | FREE(hdr, M_TEMP); | |
2215 | } | |
2216 | if (data) { | |
2217 | FREE(data, M_TEMP); | |
2218 | } | |
2219 | if (uio_w) { | |
2220 | uio_free(uio_w); | |
2221 | } | |
2222 | ||
b0d623f7 A |
2223 | if (err != 0) { | |
2224 | /* if there was a failure, reset compression flags to unknown and clear the buffer cache data */ | |
2225 | update_file_state = 1; | |
2226 | new_state = FILE_TYPE_UNKNOWN; | |
2227 | if (uncompressed_size) { | |
2228 | ubc_setsize(vp, 0); | |
2229 | ubc_setsize(vp, uncompressed_size); | |
0a7de745 | 2230 | }
b0d623f7 | 2231 | }
0a7de745 | 2232 |
b0d623f7 A |
2233 | if (update_file_state) { | |
/* the state change and the wakeup are done together under decompress_channel_mtx */
2234 | lck_mtx_lock(decompress_channel_mtx); | |
2235 | decmpfs_cnode_set_vnode_state(cp, new_state, 1); | |
2236 | wakeup((caddr_t)&decompress_channel); /* wake up anyone who might have been waiting for decompression */ | |
2237 | lck_mtx_unlock(decompress_channel_mtx); | |
2238 | } | |
0a7de745 A |
2239 | ||
2240 | if (cmpdata_locked) { | |
2241 | decmpfs_unlock_compressed_data(cp, 1); | |
2242 | } | |
d9a64523 A |
2243 | /* | |
2244 | * Trace the following parameters on return with event-id 0x03120000. | |
2245 | * | |
2246 | * @vp->v_id: vnode-id of the file being decompressed. | |
2247 | * @err: value returned from this function. | |
2248 | */ | |
2249 | DECMPFS_EMIT_TRACE_RETURN(DECMPDBG_DECOMPRESS_FILE, vp->v_id, err); | |
b0d623f7 A |
2250 | return err; | |
2251 | } | |
2252 | ||
2253 | #pragma mark --- Type1 compressor --- | |
2254 | ||
2255 | /* | |
0a7de745 | 2256 | * The "Type1" compressor stores the data fork directly in the compression xattr |
b0d623f7 A |
2257 | */ |
2258 | ||
2259 | static int | |
2260 | decmpfs_validate_compressed_file_Type1(__unused vnode_t vp, __unused vfs_context_t ctx, decmpfs_header *hdr) | |
2261 | { | |
0a7de745 A |
2262 | int err = 0; |
2263 | ||
2264 | if (hdr->uncompressed_size + sizeof(decmpfs_disk_header) != (uint64_t)hdr->attr_size) { | |
2265 | err = EINVAL; | |
2266 | goto out; | |
2267 | } | |
b0d623f7 | 2268 | out: |
0a7de745 | 2269 | return err; |
b0d623f7 A |
2270 | } |
2271 | ||
2272 | static int | |
2273 | decmpfs_fetch_uncompressed_data_Type1(__unused vnode_t vp, __unused vfs_context_t ctx, decmpfs_header *hdr, off_t offset, user_ssize_t size, int nvec, decmpfs_vector *vec, uint64_t *bytes_read) | |
2274 | { | |
0a7de745 A |
2275 | int err = 0; |
2276 | int i; | |
2277 | user_ssize_t remaining; | |
2278 | ||
2279 | if (hdr->uncompressed_size + sizeof(decmpfs_disk_header) != (uint64_t)hdr->attr_size) { | |
2280 | err = EINVAL; | |
2281 | goto out; | |
2282 | } | |
2283 | ||
b0d623f7 | 2284 | #if COMPRESSION_DEBUG |
0a7de745 A |
2285 | static int dummy = 0; // prevent syslog from coalescing printfs |
2286 | DebugLogWithPath("%d memcpy %lld at %lld\n", dummy++, size, (uint64_t)offset); | |
b0d623f7 | 2287 | #endif |
0a7de745 A |
2288 | |
2289 | remaining = size; | |
2290 | for (i = 0; (i < nvec) && (remaining > 0); i++) { | |
2291 | user_ssize_t curCopy = vec[i].size; | |
2292 | if (curCopy > remaining) { | |
2293 | curCopy = remaining; | |
2294 | } | |
2295 | memcpy(vec[i].buf, hdr->attr_bytes + offset, curCopy); | |
2296 | offset += curCopy; | |
2297 | remaining -= curCopy; | |
2298 | } | |
2299 | ||
2300 | if ((bytes_read) && (err == 0)) { | |
2301 | *bytes_read = (size - remaining); | |
2302 | } | |
2303 | ||
b0d623f7 | 2304 | out: |
0a7de745 | 2305 | return err; |
b0d623f7 A |
2306 | } |
2307 | ||
5ba3f43e | 2308 | SECURITY_READ_ONLY_EARLY(static decmpfs_registration) Type1Reg = |
b0d623f7 | 2309 | { |
0a7de745 A |
2310 | .decmpfs_registration = DECMPFS_REGISTRATION_VERSION, |
2311 | .validate = decmpfs_validate_compressed_file_Type1, | |
2312 | .adjust_fetch = NULL,/* no adjust necessary */ | |
2313 | .fetch = decmpfs_fetch_uncompressed_data_Type1, | |
2314 | .free_data = NULL,/* no free necessary */ | |
2315 | .get_flags = NULL/* no flags */ | |
b0d623f7 A |
2316 | }; |
2317 | ||
2318 | #pragma mark --- decmpfs initialization --- | |
2319 | ||
0a7de745 A |
2320 | void |
2321 | decmpfs_init() | |
b0d623f7 | 2322 | { |
0a7de745 A |
2323 | static int done = 0; |
2324 | if (done) { | |
2325 | return; | |
2326 | } | |
2327 | ||
b0d623f7 | 2328 | decmpfs_ctx = vfs_context_create(vfs_context_kernel()); |
0a7de745 A |
2329 | |
2330 | lck_grp_attr_t *attr = lck_grp_attr_alloc_init(); | |
2331 | decmpfs_lockgrp = lck_grp_alloc_init("VFSCOMP", attr); | |
2332 | lck_grp_attr_free(attr); | |
2333 | decompressorsLock = lck_rw_alloc_init(decmpfs_lockgrp, NULL); | |
2334 | decompress_channel_mtx = lck_mtx_alloc_init(decmpfs_lockgrp, NULL); | |
2335 | ||
2336 | register_decmpfs_decompressor(CMP_Type1, &Type1Reg); | |
2337 | ||
2338 | done = 1; | |
b0d623f7 | 2339 | } |
39037602 | 2340 | #endif /* FS_COMPRESSION */ |