/*
 * Copyright (c) 1999-2008 Apple Inc. All rights reserved.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
 *
 * This file contains Original Code and/or Modifications of Original Code
 * as defined in and that are subject to the Apple Public Source License
 * Version 2.0 (the 'License'). You may not use this file except in
 * compliance with the License. The rights granted to you under the License
 * may not be used to create, or enable the creation or redistribution of,
 * unlawful or unlicensed copies of an Apple operating system, or to
 * circumvent, violate, or enable the circumvention or violation of, any
 * terms of an Apple operating system software license agreement.
 *
 * Please obtain a copy of the License at
 * http://www.opensource.apple.com/apsl/ and read it before using this file.
 *
 * The Original Code and all software distributed under the License are
 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
 * Please see the License for the specific language governing rights and
 * limitations under the License.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
 */
/*
 *	Author:	Umesh Vaishampayan [umeshv@apple.com]
 *		05-Aug-1999	umeshv	Created.
 *
 *	Functions related to Unified Buffer cache.
 *
 *	Caller of UBC functions MUST have a valid reference on the vnode.
 *
 */
#include <sys/types.h>
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/mount_internal.h>
#include <sys/vnode_internal.h>
#include <sys/ubc_internal.h>
#include <sys/ucred.h>
#include <sys/proc_internal.h>
#include <sys/kauth.h>
#include <sys/codesign.h>

#include <mach/mach_types.h>
#include <mach/memory_object_types.h>
#include <mach/memory_object_control.h>
#include <mach/vm_map.h>
#include <mach/mach_vm.h>

#include <kern/kern_types.h>
#include <kern/kalloc.h>
#include <kern/zalloc.h>
#include <kern/thread.h>
#include <vm/vm_kern.h>
#include <vm/vm_protos.h> /* last */

#include <libkern/crypto/sha1.h>

#include <security/mac_framework.h>
/* XXX These should be in a BSD accessible Mach header, but aren't. */
extern kern_return_t memory_object_pages_resident(memory_object_control_t,
						  boolean_t *);
extern kern_return_t memory_object_signed(memory_object_control_t control,
					  boolean_t is_signed);
extern void Debugger(const char *message);
/* XXX no one uses this interface! */
kern_return_t ubc_page_op_with_control(
	memory_object_control_t	 control,
	off_t			 f_offset,
	int			 ops,
	ppnum_t			 *phys_entryp,
	int			 *flagsp);

#if DIAGNOSTIC
#if defined(assert)
#undef assert
#endif
#define assert(cond)    \
    ((void) ((cond) ? 0 : panic("Assert failed: %s", # cond)))
#else
#include <kern/assert.h>
#endif /* DIAGNOSTIC */
static int ubc_info_init_internal(struct vnode *vp, int withfsize, off_t filesize);
static int ubc_umcallback(vnode_t, void *);
static int ubc_msync_internal(vnode_t, off_t, off_t, off_t *, int, int *);
static void ubc_cs_free(struct ubc_info *uip);

struct zone	*ubc_info_zone;
/*
 * Routines to navigate code signing data structures in the kernel...
 */
static boolean_t
cs_valid_range(
	const void *start,
	const void *end,
	const void *lower_bound,
	const void *upper_bound)
{
	if (upper_bound < lower_bound ||
	    end < start) {
		return FALSE;
	}

	if (start < lower_bound ||
	    end > upper_bound) {
		return FALSE;
	}

	return TRUE;
}
/*
 * Magic numbers used by Code Signing
 */
enum {
	CSMAGIC_REQUIREMENT = 0xfade0c00,		/* single Requirement blob */
	CSMAGIC_REQUIREMENTS = 0xfade0c01,		/* Requirements vector (internal requirements) */
	CSMAGIC_CODEDIRECTORY = 0xfade0c02,		/* CodeDirectory blob */
	CSMAGIC_EMBEDDED_SIGNATURE = 0xfade0cc0,	/* embedded form of signature data */
	CSMAGIC_EMBEDDED_SIGNATURE_OLD = 0xfade0b02,	/* XXX */
	CSMAGIC_DETACHED_SIGNATURE = 0xfade0cc1,	/* multi-arch collection of embedded signatures */

	CSSLOT_CODEDIRECTORY = 0,			/* slot index for CodeDirectory */
};

static const uint32_t supportsScatter = 0x20100;	// first version to support scatter option
/*
 * Structure of an embedded-signature SuperBlob
 */
typedef struct __BlobIndex {
	uint32_t type;			/* type of entry */
	uint32_t offset;		/* offset of entry */
} CS_BlobIndex;

typedef struct __SuperBlob {
	uint32_t magic;			/* magic number */
	uint32_t length;		/* total length of SuperBlob */
	uint32_t count;			/* number of index entries following */
	CS_BlobIndex index[];		/* (count) entries */
	/* followed by Blobs in no particular order as indicated by offsets in index */
} CS_SuperBlob;

struct Scatter {
	uint32_t count;			// number of pages; zero for sentinel (only)
	uint32_t base;			// first page number
	uint64_t targetOffset;		// offset in target
	uint64_t spare;			// reserved
};
/*
 * C form of a CodeDirectory.
 */
typedef struct __CodeDirectory {
	uint32_t magic;			/* magic number (CSMAGIC_CODEDIRECTORY) */
	uint32_t length;		/* total length of CodeDirectory blob */
	uint32_t version;		/* compatibility version */
	uint32_t flags;			/* setup and mode flags */
	uint32_t hashOffset;		/* offset of hash slot element at index zero */
	uint32_t identOffset;		/* offset of identifier string */
	uint32_t nSpecialSlots;		/* number of special hash slots */
	uint32_t nCodeSlots;		/* number of ordinary (code) hash slots */
	uint32_t codeLimit;		/* limit to main image signature range */
	uint8_t hashSize;		/* size of each hash in bytes */
	uint8_t hashType;		/* type of hash (cdHashType* constants) */
	uint8_t spare1;			/* unused (must be zero) */
	uint8_t pageSize;		/* log2(page size in bytes); 0 => infinite */
	uint32_t spare2;		/* unused (must be zero) */
	/* Version 0x20100 */
	uint32_t scatterOffset;		/* offset of optional scatter vector */
	/* followed by dynamic content as located by offset fields above */
} CS_CodeDirectory;
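
/*
 * Illustrative sketch added in editing, not part of the original source:
 * all multi-byte CodeDirectory fields are big-endian, so the SHA-1 slot
 * covering code page `n` sits at a fixed offset from the blob start.  A
 * hypothetical helper (no scatter vector, no bounds checks) would be:
 *
 *	static const unsigned char *
 *	cd_hash_for_page(const CS_CodeDirectory *cd, uint32_t n)
 *	{
 *		if (n >= ntohl(cd->nCodeSlots))
 *			return NULL;
 *		return (const unsigned char *)cd + ntohl(cd->hashOffset) +
 *		    n * SHA1_RESULTLEN;
 *	}
 *
 * hashes(), below, is the real lookup: it adds range validation against
 * the blob bounds and handles the scatter vector added in version 0x20100.
 */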
/*
 * Locate the CodeDirectory from an embedded signature blob
 */
static const CS_CodeDirectory *
findCodeDirectory(
	const CS_SuperBlob *embedded,
	char *lower_bound,
	char *upper_bound)
{
	const CS_CodeDirectory *cd = NULL;

	if (embedded &&
	    cs_valid_range(embedded, embedded + 1, lower_bound, upper_bound) &&
	    ntohl(embedded->magic) == CSMAGIC_EMBEDDED_SIGNATURE) {
		const CS_BlobIndex *limit;
		const CS_BlobIndex *p;

		limit = &embedded->index[ntohl(embedded->count)];
		if (!cs_valid_range(&embedded->index[0], limit,
				    lower_bound, upper_bound)) {
			return NULL;
		}
		for (p = embedded->index; p < limit; ++p) {
			if (ntohl(p->type) == CSSLOT_CODEDIRECTORY) {
				const unsigned char *base;

				base = (const unsigned char *)embedded;
				cd = (const CS_CodeDirectory *)(base + ntohl(p->offset));
				break;
			}
		}
	} else {
		/*
		 * Detached signatures come as a bare CS_CodeDirectory,
		 * without a blob.
		 */
		cd = (const CS_CodeDirectory *) embedded;
	}

	if (cd &&
	    cs_valid_range(cd, cd + 1, lower_bound, upper_bound) &&
	    cs_valid_range(cd, (const char *) cd + ntohl(cd->length),
			   lower_bound, upper_bound) &&
	    cs_valid_range(cd, (const char *) cd + ntohl(cd->hashOffset),
			   lower_bound, upper_bound) &&
	    cs_valid_range(cd, (const char *) cd +
			   ntohl(cd->hashOffset) +
			   (ntohl(cd->nCodeSlots) * SHA1_RESULTLEN),
			   lower_bound, upper_bound) &&
	    ntohl(cd->magic) == CSMAGIC_CODEDIRECTORY) {
		return cd;
	}

	// not found or not a valid code directory
	return NULL;
}
/*
 * Locating a page hash
 */
static const unsigned char *
hashes(
	const CS_CodeDirectory *cd,
	unsigned page,
	char *lower_bound,
	char *upper_bound)
{
	const unsigned char *base, *top, *hash;
	uint32_t nCodeSlots = ntohl(cd->nCodeSlots);

	assert(cs_valid_range(cd, cd + 1, lower_bound, upper_bound));

	if ((ntohl(cd->version) >= supportsScatter) && (ntohl(cd->scatterOffset))) {
		/* Get first scatter struct */
		const struct Scatter *scatter = (const struct Scatter *)
			((const char *)cd + ntohl(cd->scatterOffset));
		uint32_t hashindex = 0, scount, sbase = 0;
		/* iterate all scatter structs */
		do {
			if ((const char *)scatter > (const char *)cd + ntohl(cd->length)) {
				printf("CODE SIGNING: Scatter extends past Code Directory\n");
				return NULL;
			}

			scount = ntohl(scatter->count);
			uint32_t new_base = ntohl(scatter->base);

			/* last scatter? */
			if (scount == 0) {
				return NULL;
			}

			if ((hashindex > 0) && (new_base <= sbase)) {
				printf("CODE SIGNING: unordered Scatter, prev base %d, cur base %d\n",
				       sbase, new_base);
				return NULL;	/* unordered scatter array */
			}
			sbase = new_base;

			/* this scatter beyond page we're looking for? */
			if (sbase > page) {
				return NULL;
			}

			if (sbase + scount >= page) {
				/* Found the scatter struct that is
				 * referencing our page */

				/* base = address of first hash covered by scatter */
				base = (const unsigned char *)cd + ntohl(cd->hashOffset) +
					hashindex * SHA1_RESULTLEN;
				/* top = address of first hash after this scatter */
				top = base + scount * SHA1_RESULTLEN;
				if (!cs_valid_range(base, top, lower_bound,
						    upper_bound) ||
				    hashindex > nCodeSlots) {
					return NULL;
				}

				break;
			}

			/* this scatter struct is before the page we're looking
			 * for. Iterate. */
			hashindex += scount;
			scatter++;
		} while (1);

		hash = base + (page - sbase) * SHA1_RESULTLEN;
	} else {
		base = (const unsigned char *)cd + ntohl(cd->hashOffset);
		top = base + nCodeSlots * SHA1_RESULTLEN;
		if (!cs_valid_range(base, top, lower_bound, upper_bound) ||
		    page > nCodeSlots) {
			return NULL;
		}
		assert(page < nCodeSlots);

		hash = base + page * SHA1_RESULTLEN;
	}

	if (!cs_valid_range(hash, hash + SHA1_RESULTLEN,
			    lower_bound, upper_bound)) {
		hash = NULL;
	}

	return hash;
}
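
/*
 * Illustrative sketch added in editing, not part of the original source:
 * a caller validating code page `pg` would chain the two lookups above.
 * Here blob_base, lower, upper, and pg are hypothetical locals, assuming
 * the signature blob has already been copied into kernel memory bounded
 * by [lower, upper):
 *
 *	const CS_CodeDirectory *cd;
 *	const unsigned char *slot;
 *
 *	cd = findCodeDirectory((const CS_SuperBlob *)blob_base, lower, upper);
 *	if (cd != NULL &&
 *	    (slot = hashes(cd, pg, lower, upper)) != NULL) {
 *		... compare slot[0..SHA1_RESULTLEN-1] against a freshly
 *		    computed SHA-1 of the page ...
 *	}
 *
 * Both helpers return NULL rather than trusting any offset that escapes
 * the blob; every dereference is guarded by cs_valid_range().
 */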
/*
 * End of routines to navigate code signing data structures in the kernel.
 */

/*
 * ubc_init
 *
 * Initialization of the zone for Unified Buffer Cache.
 *
 * Parameters:	(void)
 *
 * Returns:	(void)
 *
 * Implicit returns:
 *		ubc_info_zone(global)	initialized for subsequent allocations
 */
__private_extern__ void
ubc_init(void)
{
	int	i;

	i = (vm_size_t) sizeof (struct ubc_info);

	ubc_info_zone = zinit (i, 10000*i, 8192, "ubc_info zone");

	zone_change(ubc_info_zone, Z_NOENCRYPT, TRUE);
}
/*
 * ubc_info_init
 *
 * Allocate and attach an empty ubc_info structure to a vnode
 *
 * Parameters:	vp			Pointer to the vnode
 *
 * Returns:	0			Success
 *		vnode_size:ENOMEM	Not enough space
 *		vnode_size:???		Other error from vnode_getattr
 */
int
ubc_info_init(struct vnode *vp)
{
	return(ubc_info_init_internal(vp, 0, 0));
}
/*
 * ubc_info_init_withsize
 *
 * Allocate and attach a sized ubc_info structure to a vnode
 *
 * Parameters:	vp			Pointer to the vnode
 *		filesize		The size of the file
 *
 * Returns:	0			Success
 *		vnode_size:ENOMEM	Not enough space
 *		vnode_size:???		Other error from vnode_getattr
 */
int
ubc_info_init_withsize(struct vnode *vp, off_t filesize)
{
	return(ubc_info_init_internal(vp, 1, filesize));
}
/*
 * ubc_info_init_internal
 *
 * Allocate and attach a ubc_info structure to a vnode
 *
 * Parameters:	vp			Pointer to the vnode
 *		withfsize{0,1}		Zero if the size should be obtained
 *					from the vnode; otherwise, use filesize
 *		filesize		The size of the file, if withfsize == 1
 *
 * Returns:	0			Success
 *		vnode_size:ENOMEM	Not enough space
 *		vnode_size:???		Other error from vnode_getattr
 *
 * Notes:	We call a blocking zalloc(), and the zone was created as an
 *		expandable and collectable zone, so if no memory is available,
 *		it is possible for zalloc() to block indefinitely.  zalloc()
 *		may also panic if the zone of zones is exhausted, since it's
 *		NOT expandable.
 *
 *		We unconditionally call vnode_pager_setup(), even if this is
 *		a reuse of a ubc_info; in that case, we should probably assert
 *		that it does not already have a pager association, but do not.
 *
 *		Since memory_object_create_named() can only fail from receiving
 *		an invalid pager argument, the explicit check and panic is
 *		merely precautionary.
 */
static int
ubc_info_init_internal(vnode_t vp, int withfsize, off_t filesize)
{
	register struct ubc_info	*uip;
	void *				pager;
	int				error = 0;
	kern_return_t			kret;
	memory_object_control_t		control;

	uip = vp->v_ubcinfo;

	/*
	 * If there is not already a ubc_info attached to the vnode, we
	 * attach one; otherwise, we will reuse the one that's there.
	 */
	if (uip == UBC_INFO_NULL) {

		uip = (struct ubc_info *) zalloc(ubc_info_zone);
		bzero((char *)uip, sizeof(struct ubc_info));

		uip->ui_vnode = vp;
		uip->ui_flags = UI_INITED;
		uip->ui_ucred = NOCRED;
	}
	assert(uip->ui_flags != UI_NONE);
	assert(uip->ui_vnode == vp);

	/* now set this ubc_info in the vnode */
	vp->v_ubcinfo = uip;

	/*
	 * Allocate a pager object for this vnode
	 *
	 * XXX The value of the pager parameter is currently ignored.
	 * XXX Presumably, this API changed to avoid the race between
	 * XXX setting the pager and the UI_HASPAGER flag.
	 */
	pager = (void *)vnode_pager_setup(vp, uip->ui_pager);
	assert(pager);

	/*
	 * Explicitly set the pager into the ubc_info, after setting the
	 * UI_HASPAGER flag.
	 */
	SET(uip->ui_flags, UI_HASPAGER);
	uip->ui_pager = pager;

	/*
	 * Note: We can not use VNOP_GETATTR() to get accurate
	 * value of ui_size because this may be an NFS vnode, and
	 * nfs_getattr() can call vinvalbuf(); if this happens,
	 * ubc_info is not set up to deal with that event.
	 */

	/*
	 * create a vnode - vm_object association
	 * memory_object_create_named() creates a "named" reference on the
	 * memory object we hold this reference as long as the vnode is
	 * "alive."  Since memory_object_create_named() took its own reference
	 * on the vnode pager we passed it, we can drop the reference
	 * vnode_pager_setup() returned here.
	 */
	kret = memory_object_create_named(pager,
		(memory_object_size_t)uip->ui_size, &control);
	vnode_pager_deallocate(pager);
	if (kret != KERN_SUCCESS)
		panic("ubc_info_init: memory_object_create_named returned %d", kret);

	assert(control);
	uip->ui_control = control;		/* cache the value of the mo control */
	SET(uip->ui_flags, UI_HASOBJREF);	/* with a named reference */

	if (withfsize == 0) {
		/* initialize the size */
		error = vnode_size(vp, &uip->ui_size, vfs_context_current());
		if (error)
			uip->ui_size = 0;
	} else {
		uip->ui_size = filesize;
	}
	vp->v_lflag |= VNAMED_UBC;	/* vnode has a named ubc reference */

	return (error);
}
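
/*
 * Illustrative sketch added in editing, not part of the original source:
 * a filesystem that already knows the file size when it finishes creating
 * a vnode can avoid the vnode_size() round trip by using the sized
 * variant.  The helper name fs_vget_done is hypothetical:
 *
 *	static int
 *	fs_vget_done(vnode_t vp, off_t size)
 *	{
 *		if (vnode_isreg(vp))
 *			return (ubc_info_init_withsize(vp, size));
 *		return (0);
 *	}
 *
 * Callers that cannot know the size up front use ubc_info_init(); both
 * paths funnel into ubc_info_init_internal() above.
 */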
/*
 * ubc_info_free
 *
 * Free a ubc_info structure
 *
 * Parameters:	uip			A pointer to the ubc_info to free
 *
 * Returns:	(void)
 *
 * Notes:	If there is a credential that has subsequently been associated
 *		with the ubc_info via a call to ubc_setcred(), the reference
 *		to the credential is dropped.
 *
 *		It's actually impossible for a ubc_info.ui_control to take the
 *		value MEMORY_OBJECT_CONTROL_NULL.
 */
static void
ubc_info_free(struct ubc_info *uip)
{
	if (IS_VALID_CRED(uip->ui_ucred)) {
		kauth_cred_unref(&uip->ui_ucred);
	}

	if (uip->ui_control != MEMORY_OBJECT_CONTROL_NULL)
		memory_object_control_deallocate(uip->ui_control);

	cluster_release(uip);
	ubc_cs_free(uip);

	zfree(ubc_info_zone, uip);
	return;
}


void
ubc_info_deallocate(struct ubc_info *uip)
{
	ubc_info_free(uip);
}
/*
 * ubc_setsize
 *
 * Tell the VM that the size of the file represented by the vnode has
 * changed
 *
 * Parameters:	vp			The vp whose backing file size is
 *					being changed
 *		nsize			The new size of the backing file
 *
 * Returns:	1			Success
 *		0			Failure
 *
 * Notes:	This function will indicate failure if the new size that's
 *		being attempted to be set is negative.
 *
 *		This function will fail if there is no ubc_info currently
 *		associated with the vnode.
 *
 *		This function will indicate success if the new size is the
 *		same or larger than the old size (in this case, the remainder
 *		of the file will require modification or use of an existing upl
 *		to access successfully).
 *
 *		This function will fail if the new file size is smaller, and
 *		the memory region being invalidated was unable to actually be
 *		invalidated and/or the last page could not be flushed, if the
 *		new size is not aligned to a page boundary.  This is usually
 *		indicative of an I/O error.
 */
int
ubc_setsize(struct vnode *vp, off_t nsize)
{
	off_t osize;	/* ui_size before change */
	off_t lastpg, olastpgend, lastoff;
	struct ubc_info *uip;
	memory_object_control_t control;
	kern_return_t kret = KERN_SUCCESS;

	if (nsize < (off_t)0)
		return (0);

	if (!UBCINFOEXISTS(vp))
		return (0);

	uip = vp->v_ubcinfo;
	osize = uip->ui_size;
	/*
	 * Update the size before flushing the VM
	 */
	uip->ui_size = nsize;

	if (nsize >= osize) {	/* Nothing more to do */
		lock_vnode_and_post(vp, NOTE_EXTEND);
		return (1);	/* return success */
	}

	/*
	 * When the file shrinks, invalidate the pages beyond the
	 * new size. Also get rid of garbage beyond nsize on the
	 * last page. The ui_size already has the nsize, so any
	 * subsequent page-in will zero-fill the tail properly
	 */
	lastpg = trunc_page_64(nsize);
	olastpgend = round_page_64(osize);
	control = uip->ui_control;
	assert(control);
	lastoff = (nsize & PAGE_MASK_64);

	if (lastoff) {
		upl_t		upl;
		upl_page_info_t	*pl;

		/*
		 * new EOF ends up in the middle of a page;
		 * zero the tail of this page if it's currently
		 * present in the cache
		 */
		kret = ubc_create_upl(vp, lastpg, PAGE_SIZE, &upl, &pl, UPL_SET_LITE);

		if (kret != KERN_SUCCESS)
			panic("ubc_setsize: ubc_create_upl (error = %d)\n", kret);

		if (upl_valid_page(pl, 0))
			cluster_zero(upl, (uint32_t)lastoff, PAGE_SIZE - (uint32_t)lastoff, NULL);

		ubc_upl_abort_range(upl, 0, PAGE_SIZE, UPL_ABORT_FREE_ON_EMPTY);

		lastpg += PAGE_SIZE_64;
	}
	if (olastpgend > lastpg) {
		int	flags;

		if (lastpg == 0)
			flags = MEMORY_OBJECT_DATA_FLUSH_ALL;
		else
			flags = MEMORY_OBJECT_DATA_FLUSH;
		/*
		 * invalidate the pages beyond the new EOF page
		 */
		kret = memory_object_lock_request(control,
						  (memory_object_offset_t)lastpg,
						  (memory_object_size_t)(olastpgend - lastpg), NULL, NULL,
						  MEMORY_OBJECT_RETURN_NONE, flags, VM_PROT_NO_CHANGE);
		if (kret != KERN_SUCCESS)
			printf("ubc_setsize: invalidate failed (error = %d)\n", kret);
	}
	return ((kret == KERN_SUCCESS) ? 1 : 0);
}
/*
 * ubc_getsize
 *
 * Get the size of the file associated with the specified vnode
 *
 * Parameters:	vp			The vnode whose size is of interest
 *
 * Returns:	0			There is no ubc_info associated with
 *					this vnode, or the size is zero
 *		!0			The size of the file
 *
 * Notes:	Using this routine, it is not possible for a caller to
 *		successfully distinguish between a vnode associated with a zero
 *		length file, and a vnode with no associated ubc_info.  The
 *		caller therefore needs to not care, or needs to ensure that
 *		they have previously successfully called ubc_info_init() or
 *		ubc_info_init_withsize().
 */
off_t
ubc_getsize(struct vnode *vp)
{
	/* people depend on the side effect of this working this way
	 * as they call this for directories
	 */
	if (!UBCINFOEXISTS(vp))
		return ((off_t)0);
	return (vp->v_ubcinfo->ui_size);
}
/*
 * ubc_umount
 *
 * Call ubc_sync_range(vp, 0, EOF, UBC_PUSHALL) on all the vnodes for this
 * mount point
 *
 * Parameters:	mp			The mount point
 *
 * Returns:	0			Success
 *
 * Notes:	There is no failure indication for this function.
 *
 *		This function is used in the unmount path; since it may block
 *		I/O indefinitely, it should not be used in the forced unmount
 *		path, since a device unavailability could also block that
 *		I/O indefinitely.
 *
 *		Because there is no device ejection interlock on USB, FireWire,
 *		or similar devices, it's possible that an ejection that begins
 *		subsequent to the vnode_iterate() completing, either on one of
 *		those devices, or a network mount for which the server quits
 *		responding, etc., may cause the caller to block indefinitely.
 */
__private_extern__ int
ubc_umount(struct mount *mp)
{
	vnode_iterate(mp, 0, ubc_umcallback, 0);
	return(0);
}
/*
 * ubc_umcallback
 *
 * Used by ubc_umount() as an internal implementation detail; see ubc_umount()
 * and vnode_iterate() for details of implementation.
 */
static int
ubc_umcallback(vnode_t vp, __unused void * args)
{

	if (UBCINFOEXISTS(vp)) {

		(void) ubc_msync(vp, (off_t)0, ubc_getsize(vp), NULL, UBC_PUSHALL);
	}
	return (VNODE_RETURNED);
}
/*
 * ubc_getcred
 *
 * Get the credentials currently active for the ubc_info associated with the
 * vnode.
 *
 * Parameters:	vp			The vnode whose ubc_info credentials
 *					are to be retrieved
 *
 * Returns:	!NOCRED			The credentials
 *		NOCRED			If there is no ubc_info for the vnode,
 *					or if there is one, but it has not had
 *					any credentials associated with it via
 *					a call to ubc_setcred()
 */
kauth_cred_t
ubc_getcred(struct vnode *vp)
{
	if (UBCINFOEXISTS(vp))
		return (vp->v_ubcinfo->ui_ucred);

	return (NOCRED);
}
/*
 * ubc_setthreadcred
 *
 * If they are not already set, set the credentials of the ubc_info structure
 * associated with the vnode to those of the supplied thread; otherwise leave
 * them alone.
 *
 * Parameters:	vp			The vnode whose ubc_info creds are to
 *					be set
 *		p			The process whose credentials are to
 *					be used, if not running on an assumed
 *					identity
 *		thread			The thread whose credentials are to
 *					be used
 *
 * Returns:	1			This vnode has no associated ubc_info
 *		0			Success
 *
 * Notes:	This function takes a proc parameter to account for bootstrap
 *		issues where a task or thread may call this routine, either
 *		before credentials have been initialized by bsd_init(), or if
 *		there is no BSD info associated with a mach thread yet.  This
 *		is known to happen in both the initial swap and memory mapping
 *		paths.
 *
 *		This function is generally used only in the following cases:
 *
 *		o	a memory mapped file via the mmap() system call
 *		o	a memory mapped file via the deprecated map_fd() call
 *		o	a swap store backing file
 *		o	subsequent to a successful write via vn_write()
 *
 *		The information is then used by the NFS client in order to
 *		cons up a wire message in either the page-in or page-out path.
 *
 *		There are two potential problems with the use of this API:
 *
 *		o	Because the write path only sets it on a successful
 *			write, there is a race window between setting the
 *			credential and its use to evict the pages to the
 *			remote file server
 *
 *		o	Because a page-in may occur prior to a write, the
 *			credential may not be set at this time, if the page-in
 *			is not the result of a mapping established via mmap()
 *
 *		In both these cases, this will be triggered from the paging
 *		path, which will instead use the credential of the current
 *		process, which in this case is either the dynamic_pager or
 *		the kernel task, both of which utilize "root" credentials.
 *
 *		This may potentially permit operations to occur which should
 *		be denied, or it may cause to be denied operations which
 *		should be permitted, depending on the configuration of the NFS
 *		server.
 */
int
ubc_setthreadcred(struct vnode *vp, proc_t p, thread_t thread)
{
	struct ubc_info *uip;
	kauth_cred_t credp;
	struct uthread *uthread = get_bsdthread_info(thread);

	if (!UBCINFOEXISTS(vp))
		return (1);

	vnode_lock(vp);

	uip = vp->v_ubcinfo;
	credp = uip->ui_ucred;

	if (!IS_VALID_CRED(credp)) {
		/* use per-thread cred, if assumed identity, else proc cred */
		if (uthread == NULL || (uthread->uu_flag & UT_SETUID) == 0) {
			uip->ui_ucred = kauth_cred_proc_ref(p);
		} else {
			uip->ui_ucred = uthread->uu_ucred;
			kauth_cred_ref(uip->ui_ucred);
		}
	}
	vnode_unlock(vp);

	return (0);
}
/*
 * ubc_setcred
 *
 * If they are not already set, set the credentials of the ubc_info structure
 * associated with the vnode to those of the process; otherwise leave them
 * alone.
 *
 * Parameters:	vp			The vnode whose ubc_info creds are to
 *					be set
 *		p			The process whose credentials are to
 *					be used
 *
 * Returns:	0			This vnode has no associated ubc_info
 *		1			Success
 *
 * Notes:	The return values for this function are inverted from nearly
 *		all other uses in the kernel.
 *
 *		See also ubc_setthreadcred(), above.
 *
 *		This function is considered deprecated, and generally should
 *		not be used, as it is incompatible with per-thread credentials;
 *		it exists for legacy KPI reasons.
 *
 * DEPRECATION:	ubc_setcred() is being deprecated. Please use
 *		ubc_setthreadcred() instead.
 */
int
ubc_setcred(struct vnode *vp, proc_t p)
{
	struct ubc_info *uip;
	kauth_cred_t credp;

	/* If there is no ubc_info, deny the operation */
	if ( !UBCINFOEXISTS(vp))
		return (0);

	/*
	 * Check to see if there is already a credential reference in the
	 * ubc_info; if there is not, take one on the supplied credential.
	 */
	vnode_lock(vp);
	uip = vp->v_ubcinfo;
	credp = uip->ui_ucred;
	if (!IS_VALID_CRED(credp)) {
		uip->ui_ucred = kauth_cred_proc_ref(p);
	}
	vnode_unlock(vp);

	return (1);
}
/*
 * ubc_getpager
 *
 * Get the pager associated with the ubc_info associated with the vnode.
 *
 * Parameters:	vp			The vnode to obtain the pager from
 *
 * Returns:	!VNODE_PAGER_NULL	The memory_object_t for the pager
 *		VNODE_PAGER_NULL	There is no ubc_info for this vnode
 *
 * Notes:	For each vnode that has a ubc_info associated with it, that
 *		ubc_info SHALL have a pager associated with it, so in the
 *		normal case, it's impossible to return VNODE_PAGER_NULL for
 *		a vnode with an associated ubc_info.
 */
__private_extern__ memory_object_t
ubc_getpager(struct vnode *vp)
{
	if (UBCINFOEXISTS(vp))
		return (vp->v_ubcinfo->ui_pager);

	return (0);
}
/*
 * ubc_getobject
 *
 * Get the memory object control associated with the ubc_info associated with
 * the vnode
 *
 * Parameters:	vp			The vnode to obtain the memory object
 *					control from
 *
 * Returns:	!MEMORY_OBJECT_CONTROL_NULL
 *					The memory object control
 *		MEMORY_OBJECT_CONTROL_NULL
 *					There is no ubc_info for this vnode
 *
 * Notes:	Historically, if the flags were not "do not reactivate", this
 *		function would look up the memory object using the pager if
 *		it did not exist (this could be the case if the vnode had
 *		been previously reactivated).  The flags would also permit a
 *		hold to be requested, which would have created an object
 *		reference, if one had not already existed.  This usage is
 *		deprecated, as it would permit a race between finding and
 *		taking the reference vs. a single reference being dropped in
 *		another thread.
 */
memory_object_control_t
ubc_getobject(struct vnode *vp, __unused int flags)
{
	if (UBCINFOEXISTS(vp))
		return((vp->v_ubcinfo->ui_control));

	return (MEMORY_OBJECT_CONTROL_NULL);
}
/*
 * ubc_blktooff
 *
 * Convert a given block number to a memory backing object (file) offset for a
 * given vnode
 *
 * Parameters:	vp			The vnode in which the block is located
 *		blkno			The block number to convert
 *
 * Returns:	!-1			The offset into the backing object
 *		-1			There is no ubc_info associated with
 *					the vnode
 *		-1			An error occurred in the underlying VFS
 *					while translating the block to an
 *					offset; the most likely cause is that
 *					the caller specified a block past the
 *					end of the file, but this could also be
 *					any other error from VNOP_BLKTOOFF().
 *
 * Note:	Representing the error in band loses some information, but does
 *		not occlude a valid offset, since an off_t of -1 is normally
 *		used to represent EOF.  If we had a more reliable constant in
 *		our header files for it (i.e. explicitly cast to an off_t), we
 *		would use it here instead.
 */
off_t
ubc_blktooff(vnode_t vp, daddr64_t blkno)
{
	off_t file_offset = -1;
	int error;

	if (UBCINFOEXISTS(vp)) {
		error = VNOP_BLKTOOFF(vp, blkno, &file_offset);
		if (error)
			file_offset = -1;
	}

	return (file_offset);
}
/*
 * ubc_offtoblk
 *
 * Convert a given offset in a memory backing object into a block number for a
 * given vnode
 *
 * Parameters:	vp			The vnode in which the offset is
 *					located
 *		offset			The offset into the backing object
 *
 * Returns:	!-1			The returned block number
 *		-1			There is no ubc_info associated with
 *					the vnode
 *		-1			An error occurred in the underlying VFS
 *					while translating the offset to a
 *					block number; the most likely cause is
 *					that the caller specified an offset
 *					past the end of the file, but this
 *					could also be any other error from
 *					VNOP_OFFTOBLK().
 *
 * Note:	Representing the error in band loses some information, but does
 *		not occlude a valid block number, since block numbers exceed
 *		the valid range for offsets, due to their relative sizes.  If
 *		we had a more reliable constant than -1 in our header files
 *		for it (i.e. explicitly cast to a daddr64_t), we would use it
 *		here instead.
 */
daddr64_t
ubc_offtoblk(vnode_t vp, off_t offset)
{
	daddr64_t blkno = -1;
	int error = 0;

	if (UBCINFOEXISTS(vp)) {
		error = VNOP_OFFTOBLK(vp, offset, &blkno);
		if (error)
			blkno = -1;
	}

	return (blkno);
}
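
/*
 * Illustrative sketch added in editing, not part of the original source:
 * because both conversions report errors in band as -1, a cautious round
 * trip between them looks like this (f_offset is a hypothetical local):
 *
 *	daddr64_t blk;
 *	off_t off;
 *
 *	blk = ubc_offtoblk(vp, f_offset);
 *	if (blk != (daddr64_t)-1) {
 *		off = ubc_blktooff(vp, blk);
 *		if (off != (off_t)-1) {
 *			... off is the file offset of the block that
 *			    holds f_offset, per the filesystem's VNOPs ...
 *		}
 *	}
 */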
/*
 * ubc_pages_resident
 *
 * Determine whether or not a given vnode has pages resident via the memory
 * object control associated with the ubc_info associated with the vnode
 *
 * Parameters:	vp			The vnode we want to know about
 *
 * Returns:	1			Yes
 *		0			No
 */
int
ubc_pages_resident(vnode_t vp)
{
	kern_return_t	kret;
	boolean_t	has_pages_resident;

	if (!UBCINFOEXISTS(vp))
		return (0);

	/*
	 * The following call may fail if an invalid ui_control is specified,
	 * or if there is no VM object associated with the control object.  In
	 * either case, reacting to it as if there were no pages resident will
	 * result in correct behavior.
	 */
	kret = memory_object_pages_resident(vp->v_ubcinfo->ui_control, &has_pages_resident);

	if (kret != KERN_SUCCESS)
		return (0);

	if (has_pages_resident == TRUE)
		return (1);

	return (0);
}
/*
 * ubc_sync_range
 *
 * Clean and/or invalidate a range in the memory object that backs this vnode
 *
 * Parameters:	vp			The vnode whose associated ubc_info's
 *					associated memory object is to have a
 *					range invalidated within it
 *		beg_off			The start of the range, as an offset
 *		end_off			The end of the range, as an offset
 *		flags			See ubc_msync_internal()
 *
 * Returns:	1			Success
 *		0			Failure
 *
 * Notes:	see ubc_msync_internal() for more detailed information.
 *
 * DEPRECATED:	This interface is obsolete due to a failure to return error
 *		information needed in order to correct failures.  The currently
 *		recommended interface is ubc_msync().
 */
int
ubc_sync_range(vnode_t vp, off_t beg_off, off_t end_off, int flags)
{
	return (ubc_msync_internal(vp, beg_off, end_off, NULL, flags, NULL));
}
/*
 * ubc_msync
 *
 * Clean and/or invalidate a range in the memory object that backs this vnode
 *
 * Parameters:	vp			The vnode whose associated ubc_info's
 *					associated memory object is to have a
 *					range invalidated within it
 *		beg_off			The start of the range, as an offset
 *		end_off			The end of the range, as an offset
 *		resid_off		The address of an off_t supplied by the
 *					caller; may be set to NULL to ignore
 *		flags			See ubc_msync_internal()
 *
 * Returns:	0			Success
 *		!0			Failure; an errno is returned
 *
 * Implicit Returns:
 *		*resid_off, modified	If non-NULL, the contents are ALWAYS
 *					modified; they are initialized to the
 *					beg_off, and in case of an I/O error,
 *					the difference between beg_off and the
 *					current value will reflect what was
 *					able to be written before the error
 *					occurred.  If no error is returned, the
 *					value of the resid_off is undefined; do
 *					NOT use it in place of end_off if you
 *					intend to increment from the end of the
 *					last call and call iteratively.
 *
 * Notes:	see ubc_msync_internal() for more detailed information.
 */
int
ubc_msync(vnode_t vp, off_t beg_off, off_t end_off, off_t *resid_off, int flags)
{
	int retval;
	int io_errno = 0;

	if (resid_off)
		*resid_off = beg_off;

	retval = ubc_msync_internal(vp, beg_off, end_off, resid_off, flags, &io_errno);

	if (retval == 0 && io_errno == 0)
		return (EINVAL);
	return (io_errno);
}
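
/*
 * Illustrative sketch added in editing, not part of the original source:
 * a caller holding an I/O reference who wants every dirty page of the
 * file on stable storage before proceeding would typically combine
 * UBC_PUSHDIRTY with UBC_SYNC and check the returned errno:
 *
 *	off_t resid = 0;
 *	int err;
 *
 *	err = ubc_msync(vp, (off_t)0, ubc_getsize(vp), &resid,
 *	    UBC_PUSHDIRTY | UBC_SYNC);
 *	if (err)
 *		... resid reflects how far the push got before the error ...
 *
 * Note the EINVAL conversion above: a zero return from
 * ubc_msync_internal() with no recorded I/O error becomes EINVAL.
 */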
/*
 * ubc_msync_internal
 *
 * Clean and/or invalidate a range in the memory object that backs this vnode
 *
 * Parameters:	vp			The vnode whose associated ubc_info's
 *					associated memory object is to have a
 *					range invalidated within it
 *		beg_off			The start of the range, as an offset
 *		end_off			The end of the range, as an offset
 *		resid_off		The address of an off_t supplied by the
 *					caller; may be set to NULL to ignore
 *		flags			MUST contain at least one of the flags
 *					UBC_INVALIDATE, UBC_PUSHDIRTY, or
 *					UBC_PUSHALL; if UBC_PUSHDIRTY is used,
 *					UBC_SYNC may also be specified to cause
 *					this function to block until the
 *					operation is complete.  The behavior
 *					of UBC_SYNC is otherwise undefined.
 *		io_errno		The address of an int to contain the
 *					errno from a failed I/O operation, if
 *					one occurs; may be set to NULL to
 *					ignore
 *
 * Returns:	1			Success
 *		0			Failure
 *
 * Implicit Returns:
 *		*resid_off, modified	The contents of this offset MAY be
 *					modified; in case of an I/O error, the
 *					difference between beg_off and the
 *					current value will reflect what was
 *					able to be written before the error
 *					occurred.
 *		*io_errno, modified	The contents of this offset are set to
 *					an errno, if an error occurs; if the
 *					caller supplies an io_errno parameter,
 *					they should be careful to initialize it
 *					to 0 before calling this function to
 *					enable them to distinguish an error
 *					with a valid *resid_off from an invalid
 *					one, and to avoid potentially falsely
 *					reporting an error, depending on use.
 *
 * Notes:	If there is no ubc_info associated with the vnode supplied,
 *		this function immediately returns success.
 *
 *		If the value of end_off is less than or equal to beg_off, this
 *		function immediately returns success; that is, end_off is NOT
 *		inclusive.
 *
 *		IMPORTANT: one of the flags UBC_INVALIDATE, UBC_PUSHDIRTY, or
 *		UBC_PUSHALL MUST be specified; that is, it is NOT possible to
 *		attempt to block on in-progress I/O by calling this function
 *		with UBC_PUSHDIRTY, and then later call it with just UBC_SYNC
 *		in order to block pending on the I/O already in progress.
 *
 *		The start offset is truncated to the page boundary and the
 *		size is adjusted to include the last page in the range; that
 *		is, end_off on exactly a page boundary will not change if it
 *		is rounded, and the range of bytes written will be from the
 *		truncated beg_off to the rounded (end_off - 1).
 */
static int
ubc_msync_internal(vnode_t vp, off_t beg_off, off_t end_off, off_t *resid_off, int flags, int *io_errno)
{
	memory_object_size_t	tsize;
	kern_return_t		kret;
	int request_flags = 0;
	int flush_flags = MEMORY_OBJECT_RETURN_NONE;

	if ( !UBCINFOEXISTS(vp))
		return (0);
	if ((flags & (UBC_INVALIDATE | UBC_PUSHDIRTY | UBC_PUSHALL)) == 0)
		return (0);
	if (end_off <= beg_off)
		return (1);

	if (flags & UBC_INVALIDATE)
		/*
		 * discard the resident pages
		 */
		request_flags = (MEMORY_OBJECT_DATA_FLUSH | MEMORY_OBJECT_DATA_NO_CHANGE);

	if (flags & UBC_SYNC)
		/*
		 * wait for all the I/O to complete before returning
		 */
		request_flags |= MEMORY_OBJECT_IO_SYNC;

	if (flags & UBC_PUSHDIRTY)
		/*
		 * we only return the dirty pages in the range
		 */
		flush_flags = MEMORY_OBJECT_RETURN_DIRTY;

	if (flags & UBC_PUSHALL)
		/*
		 * then return all the interesting pages in the range (both
		 * dirty and precious) to the pager
		 */
		flush_flags = MEMORY_OBJECT_RETURN_ALL;

	beg_off = trunc_page_64(beg_off);
	end_off = round_page_64(end_off);
	tsize   = (memory_object_size_t)end_off - beg_off;

	/* flush and/or invalidate pages in the range requested */
	kret = memory_object_lock_request(vp->v_ubcinfo->ui_control,
					  beg_off, tsize,
					  (memory_object_offset_t *)resid_off,
					  io_errno, flush_flags, request_flags,
					  VM_PROT_NO_CHANGE);

	return ((kret == KERN_SUCCESS) ? 1 : 0);
}
/*
 * ubc_map
 *
 * Explicitly map a vnode that has an associated ubc_info, and add a reference
 * to it for the ubc system, if there isn't one already, so it will not be
 * recycled while it's in use, and set flags on the ubc_info to indicate that
 * we have done this
 *
 * Parameters:	vp			The vnode to map
 *		flags			The mapping flags for the vnode; this
 *					will be a combination of one or more of
 *					PROT_READ, PROT_WRITE, and PROT_EXEC
 *
 * Returns:	0			Success
 *		EPERM			Permission was denied
 *
 * Notes:	An I/O reference on the vnode must already be held on entry
 *
 *		If there is no ubc_info associated with the vnode, this function
 *		will return success.
 *
 *		If a permission error occurs, this function will return
 *		failure; all other failures will cause this function to return
 *		success.
 *
 *		IMPORTANT: This is an internal use function, and its symbols
 *		are not exported, hence its error checking is not very robust.
 *		It is primarily used by:
 *
 *		o	mmap(), when mapping a file
 *		o	The deprecated map_fd() interface, when mapping a file
 *		o	When mapping a shared file (a shared library in the
 *			shared segment region)
 *		o	When loading a program image during the exec process
 *
 *		...all of these uses ignore the return code, and any fault that
 *		results later because of a failure is handled in the fix-up path
 *		of the fault handler.  The interface exists primarily as a
 *		performance hint.
 *
 *		Given that third party implementation of the type of interfaces
 *		that would use this function, such as alternative executable
 *		formats, etc., are unsupported, this function is not exported
 *		for general use.
 *
 *		The extra reference is held until the VM system unmaps the
 *		vnode from its own context to maintain a vnode reference in
 *		cases like open()/mmap()/close(), which leave the backing
 *		object referenced by a mapped memory region in a process
 *		address space.
 */
__private_extern__ int
ubc_map(vnode_t vp, int flags)
{
	struct ubc_info *uip;
	int error = 0;
	int need_ref = 0;
	int need_wakeup = 0;

	if (UBCINFOEXISTS(vp)) {

		vnode_lock(vp);
		uip = vp->v_ubcinfo;

		while (ISSET(uip->ui_flags, UI_MAPBUSY)) {
			SET(uip->ui_flags, UI_MAPWAITING);
			(void) msleep(&uip->ui_flags, &vp->v_lock,
				      PRIBIO, "ubc_map", NULL);
		}
		SET(uip->ui_flags, UI_MAPBUSY);
		vnode_unlock(vp);

		error = VNOP_MMAP(vp, flags, vfs_context_current());

		if (error != EPERM)
			error = 0;

		vnode_lock_spin(vp);

		if (error == 0) {
			if ( !ISSET(uip->ui_flags, UI_ISMAPPED))
				need_ref = 1;
			SET(uip->ui_flags, (UI_WASMAPPED | UI_ISMAPPED));
		}
		CLR(uip->ui_flags, UI_MAPBUSY);

		if (ISSET(uip->ui_flags, UI_MAPWAITING)) {
			CLR(uip->ui_flags, UI_MAPWAITING);
			need_wakeup = 1;
		}
		vnode_unlock(vp);

		if (need_wakeup)
			wakeup(&uip->ui_flags);

		if (need_ref)
			vnode_ref(vp);
	}
	return (error);
}
/*
 * ubc_destroy_named
 *
 * Destroy the named memory object associated with the ubc_info control object
 * associated with the designated vnode, if there is a ubc_info associated
 * with the vnode, and a control object is associated with it
 *
 * Parameters:	vp			The designated vnode
 *
 * Returns:	(void)
 *
 * Notes:	This function is called on vnode termination for all vnodes,
 *		and must therefore not assume that there is a ubc_info that is
 *		associated with the vnode, nor that there is a control object
 *		associated with the ubc_info.
 *
 *		If all the conditions necessary are present, this function
 *		calls memory_object_destroy(), which will in turn end up
 *		calling ubc_unmap() to release any vnode references that were
 *		established via ubc_map().
 *
 * IMPORTANT:	This is an internal use function that is used
 *		exclusively by the internal use function vclean().
 */
__private_extern__ void
ubc_destroy_named(vnode_t vp)
{
	memory_object_control_t control;
	struct ubc_info *uip;
	kern_return_t kret;

	if (UBCINFOEXISTS(vp)) {
		uip = vp->v_ubcinfo;

		/* Terminate the memory object */
		control = ubc_getobject(vp, UBC_HOLDOBJECT);
		if (control != MEMORY_OBJECT_CONTROL_NULL) {
			kret = memory_object_destroy(control, 0);
			if (kret != KERN_SUCCESS)
				panic("ubc_destroy_named: memory_object_destroy failed");
		}
	}
}
/*
 * ubc_isinuse
 *
 * Determine whether or not a vnode is currently in use by ubc at a level in
 * excess of the requested busycount
 *
 * Parameters:	vp			The vnode to check
 *		busycount		The threshold busy count, used to bias
 *					the count usually already held by the
 *					caller to avoid races
 *
 * Returns:	1			The vnode is in use over the threshold
 *		0			The vnode is not in use over the
 *					threshold
 *
 * Notes:	Because the vnode is only held locked while actually asking
 *		the use count, this function only represents a snapshot of the
 *		current state of the vnode.  If more accurate information is
 *		required, an additional busycount should be held by the caller
 *		and a non-zero busycount used.
 *
 *		If there is no ubc_info associated with the vnode, this
 *		function will report that the vnode is not in use by ubc.
 */
int
ubc_isinuse(struct vnode *vp, int busycount)
{
	if ( !UBCINFOEXISTS(vp))
		return (0);
	return(ubc_isinuse_locked(vp, busycount, 0));
}
/*
 * ubc_isinuse_locked
 *
 * Determine whether or not a vnode is currently in use by ubc at a level in
 * excess of the requested busycount
 *
 * Parameters:	vp			The vnode to check
 *		busycount		The threshold busy count, used to bias
 *					the count usually already held by the
 *					caller to avoid races
 *		locked			True if the vnode is already locked by
 *					the caller
 *
 * Returns:	1			The vnode is in use over the threshold
 *		0			The vnode is not in use over the
 *					threshold
 *
 * Notes:	If the vnode is not locked on entry, it is locked while
 *		actually asking the use count.  If this is the case, this
 *		function only represents a snapshot of the current state of
 *		the vnode.  If more accurate information is required, the
 *		vnode lock should be held by the caller, otherwise an
 *		additional busycount should be held by the caller and a
 *		non-zero busycount used.
 *
 *		If there is no ubc_info associated with the vnode, this
 *		function will report that the vnode is not in use by ubc.
 */
int
ubc_isinuse_locked(struct vnode *vp, int busycount, int locked)
{
	int retval = 0;


	if (!locked)
		vnode_lock_spin(vp);

	if ((vp->v_usecount - vp->v_kusecount) > busycount)
		retval = 1;

	if (!locked)
		vnode_unlock(vp);
	return (retval);
}
/*
 * ubc_unmap
 *
 * Reverse the effects of a ubc_map() call for a given vnode
 *
 * Parameters:	vp			vnode to unmap from ubc
 *
 * Returns:	(void)
 *
 * Notes:	This is an internal use function used by vnode_pager_unmap().
 *		It will attempt to obtain a reference on the supplied vnode,
 *		and if it can do so, and there is an associated ubc_info, and
 *		the flags indicate that it was mapped via ubc_map(), then the
 *		flag is cleared, the mapping removed, and the reference taken
 *		by ubc_map() is released.
 *
 * IMPORTANT:	This MUST only be called by the VM
 *		to prevent race conditions.
 */
__private_extern__ void
ubc_unmap(struct vnode *vp)
{
	struct ubc_info *uip;
	int	need_rele = 0;
	int	need_wakeup = 0;

	if (vnode_getwithref(vp))
		return;

	if (UBCINFOEXISTS(vp)) {

		vnode_lock(vp);
		uip = vp->v_ubcinfo;

		while (ISSET(uip->ui_flags, UI_MAPBUSY)) {
			SET(uip->ui_flags, UI_MAPWAITING);
			(void) msleep(&uip->ui_flags, &vp->v_lock,
				      PRIBIO, "ubc_unmap", NULL);
		}
		SET(uip->ui_flags, UI_MAPBUSY);

		if (ISSET(uip->ui_flags, UI_ISMAPPED)) {
			CLR(uip->ui_flags, UI_ISMAPPED);
			need_rele = 1;
		}
		vnode_unlock(vp);

		if (need_rele) {
			(void)VNOP_MNOMAP(vp, vfs_context_current());
			vnode_rele(vp);
		}
		vnode_lock_spin(vp);

		CLR(uip->ui_flags, UI_MAPBUSY);

		if (ISSET(uip->ui_flags, UI_MAPWAITING)) {
			CLR(uip->ui_flags, UI_MAPWAITING);
			need_wakeup = 1;
		}
		vnode_unlock(vp);

		if (need_wakeup)
			wakeup(&uip->ui_flags);
	}
	/*
	 * the drop of the vnode ref will cleanup
	 */
	vnode_put(vp);
}
/*
 * ubc_page_op
 *
 * Manipulate individual page state for a vnode with an associated ubc_info
 * with an associated memory object control.
 *
 * Parameters:	vp			The vnode backing the page
 *		f_offset		A file offset interior to the page
 *		ops			The operations to perform, as a bitmap
 *					(see below for more information)
 *		phys_entryp		The address of a ppnum_t; may be NULL
 *					to ignore
 *		flagsp			A pointer to an int to contain flags;
 *					may be NULL to ignore
 *
 * Returns:	KERN_SUCCESS		Success
 *		KERN_INVALID_ARGUMENT	If the memory object control has no VM
 *					object associated
 *		KERN_INVALID_OBJECT	If UPL_POP_PHYSICAL and the object is
 *					not physically contiguous
 *		KERN_INVALID_OBJECT	If !UPL_POP_PHYSICAL and the object is
 *					physically contiguous
 *		KERN_FAILURE		If the page cannot be looked up
 *
 * Implicit Returns:
 *		*phys_entryp (modified)	If phys_entryp is non-NULL and
 *					UPL_POP_PHYSICAL
 *		*flagsp (modified)	If flagsp is non-NULL and there was
 *					!UPL_POP_PHYSICAL and a KERN_SUCCESS
 *
 * Notes:	For object boundaries, it is considerably more efficient to
 *		ensure that f_offset is in fact on a page boundary, as this
 *		will avoid internal use of the hash table to identify the
 *		page, and would therefore skip a number of early optimizations.
 *		Since this is a page operation anyway, the caller should try
 *		to pass only a page aligned offset because of this.
 *
 *		*flagsp may be modified even if this function fails.  If it is
 *		modified, it will contain the condition of the page before the
 *		requested operation was attempted; these will only include the
 *		bitmap flags, and not the UPL_POP_PHYSICAL, UPL_POP_DUMP,
 *		UPL_POP_SET, or UPL_POP_CLR bits.
 *
 *		The flags field may contain a specific operation, such as
 *		UPL_POP_PHYSICAL or UPL_POP_DUMP:
 *
 *		o	UPL_POP_PHYSICAL	Fail if not contiguous; if
 *						*phys_entryp and successful, set
 *						*phys_entryp
 *		o	UPL_POP_DUMP		Dump the specified page
 *
 *		Otherwise, it is treated as a bitmap of one or more page
 *		operations to perform on the final memory object; allowable
 *		bit values are:
 *
 *		o	UPL_POP_DIRTY		The page is dirty
 *		o	UPL_POP_PAGEOUT		The page is paged out
 *		o	UPL_POP_PRECIOUS	The page is precious
 *		o	UPL_POP_ABSENT		The page is absent
 *		o	UPL_POP_BUSY		The page is busy
 *
 *		If the page status is only being queried and not modified, then
 *		no other bits should be specified.  However, if it is being
 *		modified, exactly ONE of the following bits should be set:
 *
 *		o	UPL_POP_SET		Set the current bitmap bits
 *		o	UPL_POP_CLR		Clear the current bitmap bits
 *
 *		Thus to effect a combination of setting and clearing, it may be
 *		necessary to call this function twice.  If this is done, the
 *		set should be used before the clear, since clearing may trigger
 *		a wakeup on the destination page, and if the page is backed by
 *		an encrypted swap file, setting will trigger the decryption
 *		needed before the wakeup occurs.
 */
kern_return_t
ubc_page_op(
	struct vnode	*vp,
	off_t		f_offset,
	int		ops,
	ppnum_t		*phys_entryp,
	int		*flagsp)
{
	memory_object_control_t	control;

	control = ubc_getobject(vp, UBC_FLAGS_NONE);
	if (control == MEMORY_OBJECT_CONTROL_NULL)
		return KERN_INVALID_ARGUMENT;

	return (memory_object_page_op(control,
				      (memory_object_offset_t)f_offset,
				      ops,
				      phys_entryp,
				      flagsp));
}
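
/*
 * Illustrative sketch added in editing, not part of the original source:
 * querying, without modifying, the state of the page containing f_offset.
 * Per the notes above, no UPL_POP_SET or UPL_POP_CLR bit is passed when
 * only reading state (f_offset is a hypothetical local):
 *
 *	int pg_flags = 0;
 *
 *	if (ubc_page_op(vp, f_offset, 0, NULL, &pg_flags) == KERN_SUCCESS) {
 *		if (pg_flags & UPL_POP_DIRTY)
 *			... the page is resident and dirty ...
 *	}
 */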
/*
 * ubc_range_op
 *
 * Manipulate page state for a range of memory for a vnode with an associated
 * ubc_info with an associated memory object control, when page level state is
 * not required to be returned from the call (i.e. there are no phys_entryp or
 * flagsp parameters to this call, and it takes a range which may contain
 * multiple pages, rather than an offset interior to a single page).
 *
 * Parameters:	vp			The vnode backing the page
 *		f_offset_beg		A file offset interior to the start page
 *		f_offset_end		A file offset interior to the end page
 *		ops			The operations to perform, as a bitmap
 *					(see below for more information)
 *		range			The address of an int; may be NULL to
 *					ignore
 *
 * Returns:	KERN_SUCCESS		Success
 *		KERN_INVALID_ARGUMENT	If the memory object control has no VM
 *					object associated
 *		KERN_INVALID_OBJECT	If the object is physically contiguous
 *
 * Implicit Returns:
 *		*range (modified)	If range is non-NULL, its contents will
 *					be modified to contain the number of
 *					bytes successfully operated upon.
 *
 * Notes:	IMPORTANT: This function cannot be used on a range that
 *		consists of physically contiguous pages.
 *
 *		For object boundaries, it is considerably more efficient to
 *		ensure that f_offset_beg and f_offset_end are in fact on page
 *		boundaries, as this will avoid internal use of the hash table
 *		to identify the page, and would therefore skip a number of
 *		early optimizations.  Since this is an operation on a set of
 *		pages anyway, the caller should try to pass only page aligned
 *		offsets because of this.
 *
 *		*range will be modified only if this function succeeds.
 *
 *		The flags field MUST contain a specific operation; allowable
 *		values are:
 *
 *		o	UPL_ROP_ABSENT	Returns the extent of the range
 *				presented which is absent, starting
 *				with the start address presented
 *
 *		o	UPL_ROP_PRESENT	Returns the extent of the range
 *				presented which is present (resident),
 *				starting with the start address
 *				presented
 *
 *		o	UPL_ROP_DUMP	Dump the pages which are found in the
 *				target object for the target range.
 *
 *		IMPORTANT: For UPL_ROP_ABSENT and UPL_ROP_PRESENT; if there are
 *		multiple regions in the range, only the first matching region
 *		is returned.
 */
kern_return_t
ubc_range_op(
	struct vnode	*vp,
	off_t		f_offset_beg,
	off_t		f_offset_end,
	int		ops,
	int		*range)
{
	memory_object_control_t	control;

	control = ubc_getobject(vp, UBC_FLAGS_NONE);
	if (control == MEMORY_OBJECT_CONTROL_NULL)
		return KERN_INVALID_ARGUMENT;

	return (memory_object_range_op(control,
				       (memory_object_offset_t)f_offset_beg,
				       (memory_object_offset_t)f_offset_end,
				       ops,
				       range));
}
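
/*
 * Illustrative sketch added in editing, not part of the original source:
 * measuring how much of [beg, end) is already resident, starting at beg.
 * Only the first matching region is counted, per the IMPORTANT note above
 * (beg and end are hypothetical locals):
 *
 *	int resident_bytes = 0;
 *
 *	if (ubc_range_op(vp, beg, end, UPL_ROP_PRESENT,
 *	    &resident_bytes) == KERN_SUCCESS) {
 *		... the first resident run covers resident_bytes bytes ...
 *	}
 */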
/*
 * ubc_create_upl
 *
 * Given a vnode, cause the population of a portion of the vm_object; based on
 * the nature of the request, the pages returned may contain valid data, or
 * they may be uninitialized.
 *
 * Parameters:	vp			The vnode from which to create the upl
 *		f_offset		The start offset into the backing store
 *					represented by the vnode
 *		bufsize			The size of the upl to create
 *		uplp			Pointer to the upl_t to receive the
 *					created upl; MUST NOT be NULL
 *		plp			Pointer to receive the internal page
 *					list for the created upl; MAY be NULL
 *					to ignore
 *
 * Returns:	KERN_SUCCESS		The requested upl has been created
 *		KERN_INVALID_ARGUMENT	The bufsize argument is not an even
 *					multiple of the page size
 *		KERN_INVALID_ARGUMENT	There is no ubc_info associated with
 *					the vnode, or there is no memory object
 *					control associated with the ubc_info
 *	memory_object_upl_request:KERN_INVALID_VALUE
 *					The supplied upl_flags argument is
 *					invalid
 *
 * Implicit Returns:
 *		*plp (modified)		If non-NULL, the value of *plp will be
 *					modified to point to the internal page
 *					list; this modification may occur even
 *					if this function is unsuccessful, in
 *					which case the contents may be invalid
 *
 * Note:	If successful, the returned *uplp MUST subsequently be freed
 *		via a call to ubc_upl_commit(), ubc_upl_commit_range(),
 *		ubc_upl_abort(), or ubc_upl_abort_range().
 */
kern_return_t
ubc_create_upl(
	struct vnode	*vp,
	off_t		f_offset,
	int		bufsize,
	upl_t		*uplp,
	upl_page_info_t	**plp,
	int		uplflags)
{
	memory_object_control_t	control;
	kern_return_t		kr;

	if (plp != NULL)
		*plp = NULL;
	*uplp = NULL;

	if (bufsize & 0xfff)
		return KERN_INVALID_ARGUMENT;

	if (uplflags & (UPL_UBC_MSYNC | UPL_UBC_PAGEOUT | UPL_UBC_PAGEIN)) {

		if (uplflags & UPL_UBC_MSYNC) {
			uplflags &= UPL_RET_ONLY_DIRTY;

			uplflags |= UPL_COPYOUT_FROM | UPL_CLEAN_IN_PLACE |
				    UPL_SET_INTERNAL | UPL_SET_LITE;

		} else if (uplflags & UPL_UBC_PAGEOUT) {
			uplflags &= UPL_RET_ONLY_DIRTY;

			if (uplflags & UPL_RET_ONLY_DIRTY)
				uplflags |= UPL_NOBLOCK;

			uplflags |= UPL_FOR_PAGEOUT | UPL_CLEAN_IN_PLACE |
				    UPL_COPYOUT_FROM | UPL_SET_INTERNAL | UPL_SET_LITE;
		} else {
			uplflags |= UPL_RET_ONLY_ABSENT | UPL_NOBLOCK |
				    UPL_NO_SYNC | UPL_CLEAN_IN_PLACE |
				    UPL_SET_INTERNAL | UPL_SET_LITE;
		}
	} else {
		uplflags &= ~UPL_FOR_PAGEOUT;

		if (uplflags & UPL_WILL_BE_DUMPED) {
			uplflags &= ~UPL_WILL_BE_DUMPED;
			uplflags |= (UPL_NO_SYNC|UPL_SET_INTERNAL);
		} else
			uplflags |= (UPL_NO_SYNC|UPL_CLEAN_IN_PLACE|UPL_SET_INTERNAL);
	}
	control = ubc_getobject(vp, UBC_FLAGS_NONE);
	if (control == MEMORY_OBJECT_CONTROL_NULL)
		return KERN_INVALID_ARGUMENT;

	kr = memory_object_upl_request(control, f_offset, bufsize, uplp, NULL, NULL, uplflags);
	if (kr == KERN_SUCCESS && plp != NULL)
		*plp = UPL_GET_INTERNAL_PAGE_LIST(*uplp);
	return kr;
}
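
/*
 * Illustrative sketch added in editing, not part of the original source:
 * a page-in style request for one page, followed by the mandatory release.
 * Every successfully created upl MUST be consumed by exactly one commit or
 * abort variant (f_offset is a hypothetical local):
 *
 *	upl_t upl;
 *	upl_page_info_t *pl;
 *	kern_return_t kr;
 *
 *	kr = ubc_create_upl(vp, f_offset, PAGE_SIZE, &upl, &pl,
 *	    UPL_UBC_PAGEIN);
 *	if (kr == KERN_SUCCESS) {
 *		... fill the absent pages ...
 *		ubc_upl_commit_range(upl, 0, PAGE_SIZE,
 *		    UPL_COMMIT_FREE_ON_EMPTY);
 *	}
 */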
/*
 * ubc_upl_maxbufsize
 *
 * Return the maximum bufsize ubc_create_upl( ) will take.
 *
 * Parameters:	(void)
 *
 * Returns:	maximum size buffer (in bytes) ubc_create_upl( ) will take.
 */
upl_size_t
ubc_upl_maxbufsize(
	void)
{
	return(MAX_UPL_SIZE * PAGE_SIZE);
}
/*
 * ubc_upl_map
 *
 * Map the page list associated with the supplied upl into the kernel virtual
 * address space at the virtual address indicated by the dst_addr argument;
 * the entire upl is mapped
 *
 * Parameters:	upl			The upl to map
 *		dst_addr		The address at which to map the upl
 *
 * Returns:	KERN_SUCCESS		The upl has been mapped
 *		KERN_INVALID_ARGUMENT	The upl is UPL_NULL
 *		KERN_FAILURE		The upl is already mapped
 *	vm_map_enter:KERN_INVALID_ARGUMENT
 *					A failure code from vm_map_enter() due
 *					to an invalid argument
 */
kern_return_t
ubc_upl_map(
	upl_t		upl,
	vm_offset_t	*dst_addr)
{
	return (vm_upl_map(kernel_map, upl, dst_addr));
}
/*
 * ubc_upl_unmap
 *
 * Unmap the page list associated with the supplied upl from the kernel virtual
 * address space; the entire upl is unmapped.
 *
 * Parameters:	upl			The upl to unmap
 *
 * Returns:	KERN_SUCCESS		The upl has been unmapped
 *		KERN_FAILURE		The upl is not currently mapped
 *		KERN_INVALID_ARGUMENT	If the upl is UPL_NULL
 */
kern_return_t
ubc_upl_unmap(
	upl_t	upl)
{
	return(vm_upl_unmap(kernel_map, upl));
}
/*
 * ubc_upl_commit
 *
 * Commit the contents of the upl to the backing store
 *
 * Parameters:	upl			The upl to commit
 *
 * Returns:	KERN_SUCCESS		The upl has been committed
 *		KERN_INVALID_ARGUMENT	The supplied upl was UPL_NULL
 *		KERN_FAILURE		The supplied upl does not represent
 *					device memory, and the offset plus the
 *					size would exceed the actual size of
 *					the upl
 *
 * Notes:	In practice, the only return value for this function should be
 *		KERN_SUCCESS, unless there has been data structure corruption;
 *		since the upl is deallocated regardless of success or failure,
 *		there's really nothing to do about this other than panic.
 *
 *		IMPORTANT: Use of this function should not be mixed with use of
 *		ubc_upl_commit_range(), due to the unconditional deallocation
 *		by this function.
 */
kern_return_t
ubc_upl_commit(
	upl_t		upl)
{
	upl_page_info_t	*pl;
	kern_return_t	kr;

	pl = UPL_GET_INTERNAL_PAGE_LIST(upl);
	kr = upl_commit(upl, pl, MAX_UPL_SIZE);
	upl_deallocate(upl);
	return kr;
}
/*
 * ubc_upl_commit_range
 *
 * Commit the contents of the specified range of the upl to the backing store
 *
 * Parameters:	upl			The upl to commit
 *		offset			The offset into the upl
 *		size			The size of the region to be committed,
 *					starting at the specified offset
 *		flags			commit type (see below)
 *
 * Returns:	KERN_SUCCESS		The range has been committed
 *		KERN_INVALID_ARGUMENT	The supplied upl was UPL_NULL
 *		KERN_FAILURE		The supplied upl does not represent
 *					device memory, and the offset plus the
 *					size would exceed the actual size of
 *					the upl
 *
 * Notes:	IMPORTANT: If the commit is successful, and the object is now
 *		empty, the upl will be deallocated.  Since the caller cannot
 *		check that this is the case, the UPL_COMMIT_FREE_ON_EMPTY flag
 *		should generally only be used when the offset is 0 and the size
 *		is equal to the upl size.
 *
 *		The flags argument is a bitmap of flags on the range of pages in
 *		the upl to be committed; allowable flags are:
 *
 *		o	UPL_COMMIT_FREE_ON_EMPTY	Free the upl when it is
 *							both empty and has been
 *							successfully committed
 *		o	UPL_COMMIT_CLEAR_DIRTY		Clear each page's dirty
 *							bit; will prevent a
 *							later pageout
 *		o	UPL_COMMIT_SET_DIRTY		Set each page's dirty
 *							bit; will cause a later
 *							pageout
 *		o	UPL_COMMIT_INACTIVATE		Clear each page's
 *							reference bit; the page
 *							will not be accessed
 *		o	UPL_COMMIT_ALLOW_ACCESS		Unbusy each page; pages
 *							become busy when an
 *							IOMemoryDescriptor is
 *							mapped or redirected,
 *							and we have to wait for
 *							the I/O to complete
 *
 *		The flag UPL_COMMIT_NOTIFY_EMPTY is used internally, and should
 *		not be specified by the caller.
 *
 *		The UPL_COMMIT_CLEAR_DIRTY and UPL_COMMIT_SET_DIRTY flags are
 *		mutually exclusive, and should not be combined.
 */
kern_return_t
ubc_upl_commit_range(
	upl_t		upl,
	upl_offset_t	offset,
	upl_size_t	size,
	int		flags)
{
	upl_page_info_t	*pl;
	boolean_t	empty;
	kern_return_t	kr;

	if (flags & UPL_COMMIT_FREE_ON_EMPTY)
		flags |= UPL_COMMIT_NOTIFY_EMPTY;

	if (flags & UPL_COMMIT_KERNEL_ONLY_FLAGS) {
		return KERN_INVALID_ARGUMENT;
	}

	pl = UPL_GET_INTERNAL_PAGE_LIST(upl);

	kr = upl_commit_range(upl, offset, size, flags,
			      pl, MAX_UPL_SIZE, &empty);

	if((flags & UPL_COMMIT_FREE_ON_EMPTY) && empty)
		upl_deallocate(upl);

	return kr;
}
/*
 * ubc_upl_abort_range
 *
 * Abort the contents of the specified range of the specified upl
 *
 * Parameters:	upl			The upl to abort
 *		offset			The offset into the upl
 *		size			The size of the region to be aborted,
 *					starting at the specified offset
 *		abort_flags		abort type (see below)
 *
 * Returns:	KERN_SUCCESS		The range has been aborted
 *		KERN_INVALID_ARGUMENT	The supplied upl was UPL_NULL
 *		KERN_FAILURE		The supplied upl does not represent
 *					device memory, and the offset plus the
 *					size would exceed the actual size of
 *					the upl
 *
 * Notes:	IMPORTANT: If the abort is successful, and the object is now
 *		empty, the upl will be deallocated.  Since the caller cannot
 *		check that this is the case, the UPL_ABORT_FREE_ON_EMPTY flag
 *		should generally only be used when the offset is 0 and the size
 *		is equal to the upl size.
 *
 *		The abort_flags argument is a bitmap of flags on the range of
 *		pages in the upl to be aborted; allowable flags are:
 *
 *		o	UPL_ABORT_FREE_ON_EMPTY	Free the upl when it is both
 *						empty and has been successfully
 *						aborted
 *		o	UPL_ABORT_RESTART	The operation must be restarted
 *		o	UPL_ABORT_UNAVAILABLE	The pages are unavailable
 *		o	UPL_ABORT_ERROR		An I/O error occurred
 *		o	UPL_ABORT_DUMP_PAGES	Just free the pages
 *		o	UPL_ABORT_NOTIFY_EMPTY	RESERVED
 *		o	UPL_ABORT_ALLOW_ACCESS	RESERVED
 *
 *		The UPL_ABORT_NOTIFY_EMPTY is an internal use flag and should
 *		not be specified by the caller.  It is intended to fulfill the
 *		same role as UPL_COMMIT_NOTIFY_EMPTY does in the function
 *		ubc_upl_commit_range(), but is never referenced internally.
 *
 *		The UPL_ABORT_ALLOW_ACCESS is defined, but neither set nor
 *		referenced; do not use it.
 */
kern_return_t
ubc_upl_abort_range(
	upl_t		upl,
	upl_offset_t	offset,
	upl_size_t	size,
	int		abort_flags)
{
	kern_return_t	kr;
	boolean_t	empty = FALSE;

	if (abort_flags & UPL_ABORT_FREE_ON_EMPTY)
		abort_flags |= UPL_ABORT_NOTIFY_EMPTY;

	kr = upl_abort_range(upl, offset, size, abort_flags, &empty);

	if((abort_flags & UPL_ABORT_FREE_ON_EMPTY) && empty)
		upl_deallocate(upl);

	return kr;
}
/*
 * ubc_upl_abort
 *
 * Abort the contents of the specified upl
 *
 * Parameters:	upl			The upl to abort
 *		abort_type		abort type (see below)
 *
 * Returns:	KERN_SUCCESS		The upl has been aborted
 *		KERN_INVALID_ARGUMENT	The supplied upl was UPL_NULL
 *		KERN_FAILURE		The supplied upl does not represent
 *					device memory
 *
 * Notes:	IMPORTANT: This function always deallocates the upl after the
 *		abort, whether or not the abort itself succeeds, so the caller
 *		must not use the upl again after this call.
 *
 *		The abort_type is a bitmap of flags on the range of
 *		pages in the upl to be aborted; allowable flags are:
 *
 *		o UPL_ABORT_FREE_ON_EMPTY	Free the upl when it is both
 *						empty and has been successfully
 *						aborted
 *		o UPL_ABORT_RESTART		The operation must be restarted
 *		o UPL_ABORT_UNAVAILABLE		The pages are unavailable
 *		o UPL_ABORT_ERROR		An I/O error occurred
 *		o UPL_ABORT_DUMP_PAGES		Just free the pages
 *		o UPL_ABORT_NOTIFY_EMPTY	RESERVED
 *		o UPL_ABORT_ALLOW_ACCESS	RESERVED
 *
 *		The UPL_ABORT_NOTIFY_EMPTY flag is for internal use and should
 *		not be specified by the caller.  It is intended to fulfill the
 *		same role as UPL_COMMIT_NOTIFY_EMPTY does in the function
 *		ubc_upl_commit_range(), but is never referenced internally.
 *
 *		The UPL_ABORT_ALLOW_ACCESS flag is defined, but neither set
 *		nor referenced; do not use it.
 */
kern_return_t
ubc_upl_abort(
	upl_t			upl,
	int			abort_type)
{
	kern_return_t	kr;

	kr = upl_abort(upl, abort_type);
	upl_deallocate(upl);

	return kr;
}

/*
 * ubc_upl_pageinfo
 *
 * Retrieve the internal page list for the specified upl
 *
 * Parameters:	upl			The upl to obtain the page list from
 *
 * Returns:	!NULL			The (upl_page_info_t *) for the page
 *					list internal to the upl
 *		NULL			Error/no page list associated
 *
 * Notes:	IMPORTANT: This function is only valid on internal objects
 *		where the list request was made with the UPL_INTERNAL flag.
 *
 *		This function is a utility helper function, since some callers
 *		may not have direct access to the header defining the macro,
 *		due to abstraction layering constraints.
 */
upl_page_info_t *
ubc_upl_pageinfo(
	upl_t		upl)
{
	return (UPL_GET_INTERNAL_PAGE_LIST(upl));
}
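
/*
 * Example: walking the internal page list.  This is an illustrative
 * sketch only (not part of the original source); it assumes the upl
 * carries an internal page list (UPL_INTERNAL) and relies on the
 * upl_page_info accessor macros from <mach/memory_object_types.h>.
 */
#if 0	/* illustrative sketch */
static int
example_count_valid_pages(upl_t upl, int page_count)
{
	upl_page_info_t	*pl;
	int		i, valid = 0;

	pl = ubc_upl_pageinfo(upl);
	if (pl == NULL)
		return 0;	/* no internal page list */
	for (i = 0; i < page_count; i++) {
		if (UPL_VALID_PAGE(pl, i))
			valid++;
	}
	return valid;
}
#endif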

int
UBCINFOEXISTS(struct vnode * vp)
{
	return((vp) && ((vp)->v_type == VREG) && ((vp)->v_ubcinfo != UBC_INFO_NULL));
}

/*
 * CODE SIGNING
 */
#define CS_BLOB_PAGEABLE 0
static volatile SInt32 cs_blob_size = 0;
static volatile SInt32 cs_blob_count = 0;
static SInt32 cs_blob_size_peak = 0;
static UInt32 cs_blob_size_max = 0;
static SInt32 cs_blob_count_peak = 0;

int cs_validation = 1;

SYSCTL_INT(_vm, OID_AUTO, cs_validation, CTLFLAG_RW, &cs_validation, 0, "Do validate code signatures");
SYSCTL_INT(_vm, OID_AUTO, cs_blob_count, CTLFLAG_RD, &cs_blob_count, 0, "Current number of code signature blobs");
SYSCTL_INT(_vm, OID_AUTO, cs_blob_size, CTLFLAG_RD, &cs_blob_size, 0, "Current size of all code signature blobs");
SYSCTL_INT(_vm, OID_AUTO, cs_blob_count_peak, CTLFLAG_RD, &cs_blob_count_peak, 0, "Peak number of code signature blobs");
SYSCTL_INT(_vm, OID_AUTO, cs_blob_size_peak, CTLFLAG_RD, &cs_blob_size_peak, 0, "Peak size of code signature blobs");
SYSCTL_INT(_vm, OID_AUTO, cs_blob_size_max, CTLFLAG_RD, &cs_blob_size_max, 0, "Size of biggest code signature blob");

kern_return_t
ubc_cs_blob_allocate(
	vm_offset_t	*blob_addr_p,
	vm_size_t	*blob_size_p)
{
	kern_return_t	kr;

#if CS_BLOB_PAGEABLE
	*blob_size_p = round_page(*blob_size_p);
	kr = kmem_alloc(kernel_map, blob_addr_p, *blob_size_p);
#else	/* CS_BLOB_PAGEABLE */
	*blob_addr_p = (vm_offset_t) kalloc(*blob_size_p);
	if (*blob_addr_p == 0) {
		kr = KERN_NO_SPACE;
	} else {
		kr = KERN_SUCCESS;
	}
#endif	/* CS_BLOB_PAGEABLE */

	return kr;
}

void
ubc_cs_blob_deallocate(
	vm_offset_t	blob_addr,
	vm_size_t	blob_size)
{
#if CS_BLOB_PAGEABLE
	kmem_free(kernel_map, blob_addr, blob_size);
#else	/* CS_BLOB_PAGEABLE */
	kfree((void *) blob_addr, blob_size);
#endif	/* CS_BLOB_PAGEABLE */
}
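
/*
 * Example: the two routines above must be used as a pair, since the
 * backing allocator (kmem_alloc vs. kalloc) is chosen at compile time
 * by CS_BLOB_PAGEABLE.  Illustrative sketch only (not part of the
 * original source); note that the size may be rounded up in place.
 */
#if 0	/* illustrative sketch */
static int
example_blob_buffer(vm_size_t len)
{
	vm_offset_t	addr;
	vm_size_t	alloc_size = len;

	/* alloc_size may come back rounded up to a page boundary */
	if (ubc_cs_blob_allocate(&addr, &alloc_size) != KERN_SUCCESS)
		return ENOMEM;
	/* ... fill the buffer with the signature data ... */
	ubc_cs_blob_deallocate(addr, alloc_size);
	return 0;
}
#endif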

int
ubc_cs_blob_add(
	struct vnode	*vp,
	cpu_type_t	cputype,
	off_t		base_offset,
	vm_address_t	addr,
	vm_size_t	size)
{
	kern_return_t		kr;
	struct ubc_info		*uip;
	struct cs_blob		*blob, *oblob;
	int			error;
	ipc_port_t		blob_handle;
	memory_object_size_t	blob_size;
	const CS_CodeDirectory	*cd;
	off_t			blob_start_offset, blob_end_offset;
	SHA1_CTX		sha1ctxt;

	blob_handle = IPC_PORT_NULL;

	blob = (struct cs_blob *) kalloc(sizeof (struct cs_blob));
	if (blob == NULL) {
		return ENOMEM;
	}

#if CS_BLOB_PAGEABLE
	/* get a memory entry on the blob */
	blob_size = (memory_object_size_t) size;
	kr = mach_make_memory_entry_64(kernel_map,
				       &blob_size,
				       addr,
				       VM_PROT_READ,
				       &blob_handle,
				       IPC_PORT_NULL);
	if (kr != KERN_SUCCESS) {
		error = ENOMEM;
		blob_handle = IPC_PORT_NULL;
		goto out;
	}
	if (memory_object_round_page(blob_size) !=
	    (memory_object_size_t) round_page(size)) {
		printf("ubc_cs_blob_add: size mismatch 0x%llx 0x%lx !?\n",
		       blob_size, (size_t)size);
		panic("XXX FBDP size mismatch 0x%llx 0x%lx\n", blob_size, (size_t)size);
		error = EINVAL;
		goto out;
	}
#else	/* CS_BLOB_PAGEABLE */
	blob_size = (memory_object_size_t) size;
	blob_handle = IPC_PORT_NULL;
#endif	/* CS_BLOB_PAGEABLE */

	/* fill in the new blob */
	blob->csb_cpu_type = cputype;
	blob->csb_base_offset = base_offset;
	blob->csb_mem_size = size;
	blob->csb_mem_offset = 0;
	blob->csb_mem_handle = blob_handle;
	blob->csb_mem_kaddr = addr;

	/*
	 * Validate the blob's contents
	 */
	cd = findCodeDirectory(
		(const CS_SuperBlob *) addr,
		(char *) addr,
		(char *) addr + blob->csb_mem_size);
	if (cd == NULL) {
		/* no code directory => useless blob ! */
		blob->csb_flags = 0;
		blob->csb_start_offset = 0;
		blob->csb_end_offset = 0;
	} else {
		const unsigned char *sha1_base;
		int sha1_size;

		blob->csb_flags = ntohl(cd->flags) | CS_VALID;
		blob->csb_end_offset = round_page(ntohl(cd->codeLimit));
		if ((ntohl(cd->version) >= supportsScatter) &&
		    (ntohl(cd->scatterOffset))) {
			const struct Scatter *scatter = (const struct Scatter*)
				((const char*)cd + ntohl(cd->scatterOffset));
			blob->csb_start_offset = ntohl(scatter->base) * PAGE_SIZE;
		} else {
			blob->csb_start_offset = (blob->csb_end_offset -
						  (ntohl(cd->nCodeSlots) * PAGE_SIZE));
		}

		/* compute the blob's SHA1 hash */
		sha1_base = (const unsigned char *) cd;
		sha1_size = ntohl(cd->length);
		SHA1Init(&sha1ctxt);
		SHA1Update(&sha1ctxt, sha1_base, sha1_size);
		SHA1Final(blob->csb_sha1, &sha1ctxt);
	}

	/*
	 * Let policy module check whether the blob's signature is accepted.
	 */
	error = mac_vnode_check_signature(vp, blob->csb_sha1, (void*)addr, size);
	if (error)
		goto out;

	/*
	 * Validate the blob's coverage
	 */
	blob_start_offset = blob->csb_base_offset + blob->csb_start_offset;
	blob_end_offset = blob->csb_base_offset + blob->csb_end_offset;

	if (blob_start_offset >= blob_end_offset ||
	    blob_start_offset < 0 ||
	    blob_end_offset <= 0) {
		/* reject empty or backwards blob */
		error = EINVAL;
		goto out;
	}

	vnode_lock(vp);
	if (! UBCINFOEXISTS(vp)) {
		vnode_unlock(vp);
		error = ENOENT;
		goto out;
	}
	uip = vp->v_ubcinfo;

	/* check if this new blob overlaps with an existing blob */
	for (oblob = uip->cs_blobs;
	     oblob != NULL;
	     oblob = oblob->csb_next) {
		off_t oblob_start_offset, oblob_end_offset;

		oblob_start_offset = (oblob->csb_base_offset +
				      oblob->csb_start_offset);
		oblob_end_offset = (oblob->csb_base_offset +
				    oblob->csb_end_offset);
		if (blob_start_offset >= oblob_end_offset ||
		    blob_end_offset <= oblob_start_offset) {
			/* no conflict with this existing blob */
		} else {
			/* conflict ! */
			if (blob_start_offset == oblob_start_offset &&
			    blob_end_offset == oblob_end_offset &&
			    blob->csb_mem_size == oblob->csb_mem_size &&
			    blob->csb_flags == oblob->csb_flags &&
			    (blob->csb_cpu_type == CPU_TYPE_ANY ||
			     oblob->csb_cpu_type == CPU_TYPE_ANY ||
			     blob->csb_cpu_type == oblob->csb_cpu_type) &&
			    !bcmp(blob->csb_sha1,
				  oblob->csb_sha1,
				  SHA1_RESULTLEN)) {
				/*
				 * We already have this blob:
				 * we'll return success but
				 * throw away the new blob.
				 */
				if (oblob->csb_cpu_type == CPU_TYPE_ANY) {
					/*
					 * The old blob matches this one
					 * but doesn't have any CPU type.
					 * Update it with whatever the caller
					 * provided this time.
					 */
					oblob->csb_cpu_type = cputype;
				}
				vnode_unlock(vp);
				error = EAGAIN;
				goto out;
			} else {
				/* different blob: reject the new one */
				vnode_unlock(vp);
				error = EALREADY;
				goto out;
			}
		}
	}

	/* mark this vnode's VM object as having "signed pages" */
	kr = memory_object_signed(uip->ui_control, TRUE);
	if (kr != KERN_SUCCESS) {
		vnode_unlock(vp);
		error = ENOENT;
		goto out;
	}

	/*
	 * Add this blob to the list of blobs for this vnode.
	 * We always add at the front of the list and we never remove a
	 * blob from the list, so ubc_cs_get_blobs() can return whatever
	 * the top of the list was and that list will remain valid
	 * while we validate a page, even after we release the vnode's lock.
	 */
	blob->csb_next = uip->cs_blobs;
	uip->cs_blobs = blob;

	OSAddAtomic(+1, &cs_blob_count);
	if (cs_blob_count > cs_blob_count_peak) {
		cs_blob_count_peak = cs_blob_count; /* XXX atomic ? */
	}
	OSAddAtomic((SInt32) +blob->csb_mem_size, &cs_blob_size);
	if ((SInt32) cs_blob_size > cs_blob_size_peak) {
		cs_blob_size_peak = (SInt32) cs_blob_size; /* XXX atomic ? */
	}
	if ((UInt32) blob->csb_mem_size > cs_blob_size_max) {
		cs_blob_size_max = (UInt32) blob->csb_mem_size;
	}

	if (cs_debug) {
		proc_t p;

		p = current_proc();
		printf("CODE SIGNING: proc %d(%s) "
		       "loaded %s signatures for file (%s) "
		       "range 0x%llx:0x%llx flags 0x%x\n",
		       p->p_pid, p->p_comm,
		       blob->csb_cpu_type == -1 ? "detached" : "embedded",
		       vnode_name(vp),
		       blob->csb_base_offset + blob->csb_start_offset,
		       blob->csb_base_offset + blob->csb_end_offset,
		       blob->csb_flags);
	}

	vnode_unlock(vp);

	error = 0;	/* success ! */

out:
	if (error) {
		/* we failed; release what we allocated */
		if (blob) {
			kfree(blob, sizeof (*blob));
			blob = NULL;
		}
		if (blob_handle != IPC_PORT_NULL) {
			mach_memory_entry_port_release(blob_handle);
			blob_handle = IPC_PORT_NULL;
		}
	}

	if (error == EAGAIN) {
		/*
		 * See above:  error is EAGAIN if we were asked
		 * to add an existing blob again.  We cleaned the new
		 * blob and we want to return success.
		 */
		error = 0;
		/*
		 * Since we're not failing, consume the data we received.
		 */
		ubc_cs_blob_deallocate(addr, size);
	}

	return error;
}
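
/*
 * Example: ownership of "addr" across ubc_cs_blob_add().  On success
 * the buffer belongs to the UBC layer (it is either kept in the new
 * blob or, in the duplicate/EAGAIN case, already deallocated before
 * success is returned); on failure the caller must release it.
 * Illustrative sketch only (not part of the original source), loosely
 * following how a loader would hand off a signature buffer:
 */
#if 0	/* illustrative sketch */
static int
example_load_signature(struct vnode *vp, cpu_type_t cputype,
		       off_t base_offset, vm_address_t addr, vm_size_t size)
{
	int	error;

	error = ubc_cs_blob_add(vp, cputype, base_offset, addr, size);
	if (error) {
		/* the buffer is still ours: release it */
		ubc_cs_blob_deallocate(addr, size);
	}
	return error;
}
#endif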

struct cs_blob *
ubc_cs_blob_get(
	struct vnode	*vp,
	cpu_type_t	cputype,
	off_t		offset)
{
	struct ubc_info	*uip;
	struct cs_blob	*blob;
	off_t		offset_in_blob;

	vnode_lock_spin(vp);

	if (! UBCINFOEXISTS(vp)) {
		blob = NULL;
		goto out;
	}

	uip = vp->v_ubcinfo;
	for (blob = uip->cs_blobs;
	     blob != NULL;
	     blob = blob->csb_next) {
		if (cputype != -1 && blob->csb_cpu_type == cputype) {
			break;
		}
		if (offset != -1) {
			offset_in_blob = offset - blob->csb_base_offset;
			if (offset_in_blob >= blob->csb_start_offset &&
			    offset_in_blob < blob->csb_end_offset) {
				/* our offset is covered by this blob */
				break;
			}
		}
	}

out:
	vnode_unlock(vp);

	return blob;
}
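
/*
 * Example: asking whether a vnode carries a signature blob covering a
 * given file offset.  Illustrative sketch only (not part of the
 * original source); pass -1 for whichever selector (cputype or offset)
 * should not participate in the match.
 */
#if 0	/* illustrative sketch */
static boolean_t
example_has_signature_at(struct vnode *vp, off_t file_offset)
{
	/* cputype == -1: match by offset coverage only */
	return ubc_cs_blob_get(vp, -1, file_offset) != NULL;
}
#endif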

static void
ubc_cs_free(
	struct ubc_info	*uip)
{
	struct cs_blob	*blob, *next_blob;

	for (blob = uip->cs_blobs;
	     blob != NULL;
	     blob = next_blob) {
		next_blob = blob->csb_next;
		if (blob->csb_mem_kaddr != 0) {
			ubc_cs_blob_deallocate(blob->csb_mem_kaddr,
					       blob->csb_mem_size);
			blob->csb_mem_kaddr = 0;
		}
		if (blob->csb_mem_handle != IPC_PORT_NULL) {
			mach_memory_entry_port_release(blob->csb_mem_handle);
		}
		blob->csb_mem_handle = IPC_PORT_NULL;
		OSAddAtomic(-1, &cs_blob_count);
		OSAddAtomic((SInt32) -blob->csb_mem_size, &cs_blob_size);
		kfree(blob, sizeof (*blob));
	}
	uip->cs_blobs = NULL;
}

struct cs_blob *
ubc_get_cs_blobs(
	struct vnode	*vp)
{
	struct ubc_info	*uip;
	struct cs_blob	*blobs;

	/*
	 * No need to take the vnode lock here.  The caller must be holding
	 * a reference on the vnode (via a VM mapping or open file descriptor),
	 * so the vnode will not go away.  The ubc_info stays until the vnode
	 * goes away.  And we only modify "blobs" by adding to the head of the
	 * list.
	 * The ubc_info could go away entirely if the vnode gets reclaimed as
	 * part of a forced unmount.  In the case of a code-signature validation
	 * during a page fault, the "paging_in_progress" reference on the VM
	 * object guarantees that the vnode pager (and the ubc_info) won't go
	 * away during the fault.
	 * Other callers need to protect against vnode reclaim by holding the
	 * vnode lock, for example.
	 */

	if (! UBCINFOEXISTS(vp)) {
		blobs = NULL;
		goto out;
	}

	uip = vp->v_ubcinfo;
	blobs = uip->cs_blobs;

out:
	return blobs;
}
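
/*
 * Example: consuming the blob list under the contract described above.
 * Illustrative sketch only (not part of the original source); the
 * caller is assumed to hold a reference that keeps the vnode, and thus
 * the ubc_info, alive while the list is walked.
 */
#if 0	/* illustrative sketch */
static int
example_count_blobs(struct vnode *vp)
{
	struct cs_blob	*blob;
	int		n = 0;

	for (blob = ubc_get_cs_blobs(vp);
	     blob != NULL;
	     blob = blob->csb_next) {
		n++;
	}
	return n;
}
#endif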

unsigned long cs_validate_page_no_hash = 0;
unsigned long cs_validate_page_bad_hash = 0;

boolean_t
cs_validate_page(
	void			*_blobs,
	memory_object_offset_t	page_offset,
	const void		*data,
	boolean_t		*tainted)
{
	SHA1_CTX		sha1ctxt;
	unsigned char		actual_hash[SHA1_RESULTLEN];
	unsigned char		expected_hash[SHA1_RESULTLEN];
	boolean_t		found_hash;
	struct cs_blob		*blobs, *blob;
	const CS_CodeDirectory	*cd;
	const CS_SuperBlob	*embedded;
	const unsigned char	*hash;
	boolean_t		validated;
	off_t			offset;	/* page offset in the file */
	size_t			size;
	off_t			codeLimit = 0;
	char			*lower_bound, *upper_bound;
	vm_offset_t		kaddr, blob_addr;
	vm_size_t		ksize;
	kern_return_t		kr;

	offset = page_offset;

	/* retrieve the expected hash */
	found_hash = FALSE;
	blobs = (struct cs_blob *) _blobs;

	for (blob = blobs;
	     blob != NULL;
	     blob = blob->csb_next) {
		offset = page_offset - blob->csb_base_offset;
		if (offset < blob->csb_start_offset ||
		    offset >= blob->csb_end_offset) {
			/* our page is not covered by this blob */
			continue;
		}

		/* map the blob in the kernel address space */
		kaddr = blob->csb_mem_kaddr;
		if (kaddr == 0) {
			ksize = (vm_size_t) (blob->csb_mem_size +
					     blob->csb_mem_offset);
			kr = vm_map(kernel_map,
				    &kaddr,
				    ksize,
				    0,
				    VM_FLAGS_ANYWHERE,
				    blob->csb_mem_handle,
				    0,
				    TRUE,
				    VM_PROT_READ,
				    VM_PROT_READ,
				    VM_INHERIT_NONE);
			if (kr != KERN_SUCCESS) {
				/* XXX FBDP what to do !? */
				printf("cs_validate_page: failed to map blob, "
				       "size=0x%lx kr=0x%x\n",
				       (size_t)blob->csb_mem_size, kr);
				break;
			}
		}
		blob_addr = kaddr + blob->csb_mem_offset;

		lower_bound = CAST_DOWN(char *, blob_addr);
		upper_bound = lower_bound + blob->csb_mem_size;

		embedded = (const CS_SuperBlob *) blob_addr;
		cd = findCodeDirectory(embedded, lower_bound, upper_bound);
		if (cd != NULL) {
			if (cd->pageSize != PAGE_SHIFT ||
			    cd->hashType != 0x1 ||
			    cd->hashSize != SHA1_RESULTLEN) {
				/* bogus blob ? */
				continue;
			}

			offset = page_offset - blob->csb_base_offset;
			if (offset < blob->csb_start_offset ||
			    offset >= blob->csb_end_offset) {
				/* our page is not covered by this blob */
				continue;
			}

			codeLimit = ntohl(cd->codeLimit);
			hash = hashes(cd, atop(offset),
				      lower_bound, upper_bound);
			if (hash != NULL) {
				bcopy(hash, expected_hash,
				      sizeof (expected_hash));
				found_hash = TRUE;
			}

			break;
		}
	}

	if (found_hash == FALSE) {
		/*
		 * We can't verify this page because there is no signature
		 * for it (yet).  It's possible that this part of the object
		 * is not signed, or that signatures for that part have not
		 * been loaded yet.
		 * Report that the page has not been validated and let the
		 * caller decide if it wants to accept it or not.
		 */
		cs_validate_page_no_hash++;
		if (cs_debug > 1) {
			printf("CODE SIGNING: cs_validate_page: "
			       "off 0x%llx: no hash to validate !?\n",
			       page_offset);
		}
		validated = FALSE;
		*tainted = FALSE;
	} else {
		const uint32_t *asha1, *esha1;

		size = PAGE_SIZE;
		if ((off_t)(offset + size) > codeLimit) {
			/* partial page at end of segment */
			assert(offset < codeLimit);
			size = (size_t) (codeLimit & PAGE_MASK);
		}

		/* compute the actual page's SHA1 hash */
		SHA1Init(&sha1ctxt);
		SHA1UpdateUsePhysicalAddress(&sha1ctxt, data, size);
		SHA1Final(actual_hash, &sha1ctxt);

		asha1 = (const uint32_t *) actual_hash;
		esha1 = (const uint32_t *) expected_hash;

		if (bcmp(expected_hash, actual_hash, SHA1_RESULTLEN) != 0) {
			if (cs_debug) {
				printf("CODE SIGNING: cs_validate_page: "
				       "off 0x%llx size 0x%lx: "
				       "actual [0x%x 0x%x 0x%x 0x%x 0x%x] != "
				       "expected [0x%x 0x%x 0x%x 0x%x 0x%x]\n",
				       page_offset, size,
				       asha1[0], asha1[1], asha1[2],
				       asha1[3], asha1[4],
				       esha1[0], esha1[1], esha1[2],
				       esha1[3], esha1[4]);
			}
			cs_validate_page_bad_hash++;
			*tainted = TRUE;
		} else {
			if (cs_debug > 1) {
				printf("CODE SIGNING: cs_validate_page: "
				       "off 0x%llx size 0x%lx: SHA1 OK\n",
				       page_offset, size);
			}
			*tainted = FALSE;
		}
		validated = TRUE;
	}

	return validated;
}

int
ubc_cs_getcdhash(
	vnode_t		vp,
	off_t		offset,
	unsigned char	*cdhash)
{
	struct cs_blob	*blobs, *blob;
	off_t		rel_offset;
	int		ret;

	blobs = ubc_get_cs_blobs(vp);
	for (blob = blobs;
	     blob != NULL;
	     blob = blob->csb_next) {
		/* compute offset relative to this blob */
		rel_offset = offset - blob->csb_base_offset;
		if (rel_offset >= blob->csb_start_offset &&
		    rel_offset < blob->csb_end_offset) {
			/* this blob does cover our "offset" ! */
			break;
		}
	}

	if (blob == NULL) {
		/* we didn't find a blob covering "offset" */
		ret = EBADEXEC;	/* XXX any better error ? */
	} else {
		/* get the SHA1 hash of that blob */
		bcopy(blob->csb_sha1, cdhash, sizeof (blob->csb_sha1));
		ret = 0;
	}

	return ret;
}
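
/*
 * Example: retrieving the code directory hash for an executable
 * region.  Illustrative sketch only (not part of the original source);
 * the destination buffer must hold SHA1_RESULTLEN (20) bytes, the size
 * of csb_sha1.
 */
#if 0	/* illustrative sketch */
static int
example_get_cdhash(vnode_t vp, off_t text_offset)
{
	unsigned char	cdhash[SHA1_RESULTLEN];

	/* returns 0 on success, EBADEXEC if no blob covers the offset */
	return ubc_cs_getcdhash(vp, text_offset, cdhash);
}
#endif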