/*
- * Copyright (c) 2000-2004 Apple Computer, Inc. All rights reserved.
+ * Copyright (c) 2007-2020 Apple Inc. All Rights Reserved.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
*
- * @APPLE_LICENSE_HEADER_START@
- *
* This file contains Original Code and/or Modifications of Original Code
* as defined in and that are subject to the Apple Public Source License
* Version 2.0 (the 'License'). You may not use this file except in
- * compliance with the License. Please obtain a copy of the License at
- * http://www.opensource.apple.com/apsl/ and read it before using this
- * file.
- *
+ * compliance with the License. The rights granted to you under the License
+ * may not be used to create, or enable the creation or redistribution of,
+ * unlawful or unlicensed copies of an Apple operating system, or to
+ * circumvent, violate, or enable the circumvention or violation of, any
+ * terms of an Apple operating system software license agreement.
+ *
+ * Please obtain a copy of the License at
+ * http://www.opensource.apple.com/apsl/ and read it before using this file.
+ *
* The Original Code and all software distributed under the License are
* distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
* EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
* FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
* Please see the License for the specific language governing rights and
* limitations under the License.
- *
- * @APPLE_LICENSE_HEADER_END@
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
*/
/*
* Copyright (c) 1988 University of Utah.
*
* @(#)vm_mmap.c 8.10 (Berkeley) 2/19/95
*/
+/*
+ * NOTICE: This file was modified by SPARTA, Inc. in 2005 to introduce
+ * support for mandatory and extensible security protections. This notice
+ * is included in support of clause 2.2 (b) of the Apple Public License,
+ * Version 2.0.
+ */
/*
* Mapped file (mmap) interface to VM
#include <sys/conf.h>
#include <sys/stat.h>
#include <sys/ubc.h>
+#include <sys/ubc_internal.h>
#include <sys/sysproto.h>
-#include <bsm/audit_kernel.h>
+#include <sys/syscall.h>
+#include <sys/kdebug.h>
+#include <sys/bsdtask_info.h>
+
+#include <security/audit/audit.h>
#include <bsm/audit_kevents.h>
#include <mach/mach_types.h>
#include <mach/mach_vm.h>
#include <mach/vm_map.h>
#include <mach/host_priv.h>
+#include <mach/sdt.h>
+#include <mach-o/loader.h>
+
+#include <machine/machine_routines.h>
#include <kern/cpu_number.h>
#include <kern/host.h>
+#include <kern/task.h>
+#include <kern/page_decrypt.h>
+
+#include <IOKit/IOReturn.h>
#include <vm/vm_map.h>
#include <vm/vm_kern.h>
#include <vm/vm_pager.h>
+#include <vm/vm_protos.h>
-int
-sbrk(__unused struct proc *p, __unused struct sbrk_args *uap, __unused register_t *retval)
-{
- /* Not yet implemented */
- return (ENOTSUP);
-}
-
-int
-sstk(__unused struct proc *p, __unused struct sstk_args *uap, __unused register_t *retval)
-{
- /* Not yet implemented */
- return (ENOTSUP);
-}
-
-
-struct osmmap_args {
- caddr_t addr;
- int len;
- int prot;
- int share;
- int fd;
- long pos;
-};
+#if CONFIG_MACF
+#include <security/mac_framework.h>
+#endif
+#include <os/overflow.h>
-int
-osmmap(
- struct proc *curp,
- register struct osmmap_args *uap,
- register_t *retval)
+/*
+ * This function implements the same logic as dyld's "dyld_fall_2020_os_versions"
+ * from dyld_priv.h, so that we can consistently deny / allow allocations based
+ * on the fall 2020 SDK version. Compare its output to proc_sdk(current_proc()).
+ */
+static uint32_t
+proc_2020_fall_os_sdk(void)
{
- struct mmap_args newargs;
- user_addr_t addr;
- int ret;
-
- if ((uap->share == MAP_SHARED )|| (uap->share == MAP_PRIVATE )) {
- newargs.addr = CAST_USER_ADDR_T(uap->addr);
- newargs.len = CAST_USER_ADDR_T(uap->len);
- newargs.prot = uap->prot;
- newargs.flags = uap->share;
- newargs.fd = uap->fd;
- newargs.pos = (off_t)uap->pos;
- ret = mmap(curp, &newargs, &addr);
- if (ret == 0)
- *retval = CAST_DOWN(register_t, addr);
- } else
- ret = EINVAL;
- return ret;
+ switch (current_proc()->p_platform) {
+ case PLATFORM_MACOS:
+ return 0x000a1000; // DYLD_MACOSX_VERSION_10_16
+ case PLATFORM_IOS:
+ case PLATFORM_IOSSIMULATOR:
+ case PLATFORM_MACCATALYST:
+ return 0x000e0000; // DYLD_IOS_VERSION_14_0
+ case PLATFORM_BRIDGEOS:
+ return 0x00050000; // DYLD_BRIDGEOS_VERSION_5_0
+ case PLATFORM_TVOS:
+ case PLATFORM_TVOSSIMULATOR:
+ return 0x000e0000; // DYLD_TVOS_VERSION_14_0
+ case PLATFORM_WATCHOS:
+ case PLATFORM_WATCHOSSIMULATOR:
+ return 0x00070000; // DYLD_WATCHOS_VERSION_7_0
+ default:
+ return 0;
+ }
}
-
+/*
+ * XXX Internally, we use VM_PROT_* somewhat interchangeably, but the correct
+ * XXX usage is PROT_* from an interface perspective. Thus the values of
+ * XXX VM_PROT_* and PROT_* need to correspond.
+ */
int
-mmap(struct proc *p, struct mmap_args *uap, user_addr_t *retval)
+mmap(proc_t p, struct mmap_args *uap, user_addr_t *retval)
{
/*
* Map in special device (must be SHARED) or file
*/
struct fileproc *fp;
- register struct vnode *vp;
- int flags;
- int prot;
- int err=0;
- vm_map_t user_map;
- kern_return_t result;
- mach_vm_offset_t user_addr;
- mach_vm_size_t user_size;
- vm_object_offset_t pageoff;
- vm_object_offset_t file_pos;
- int alloc_flags;
- boolean_t docow;
- vm_prot_t maxprot;
- void *handle;
- vm_pager_t pager;
- int mapanon=0;
- int fpref=0;
- int error =0;
+ struct vnode *vp;
+ int flags;
+ int prot;
+ int err = 0;
+ vm_map_t user_map;
+ kern_return_t result;
+ vm_map_offset_t user_addr;
+ vm_map_offset_t sum;
+ vm_map_size_t user_size;
+ vm_object_offset_t pageoff;
+ vm_object_offset_t file_pos;
+ int alloc_flags = 0;
+ vm_tag_t tag = VM_KERN_MEMORY_NONE;
+ vm_map_kernel_flags_t vmk_flags = VM_MAP_KERNEL_FLAGS_NONE;
+ boolean_t docow;
+ vm_prot_t maxprot;
+ void *handle;
+ memory_object_t pager = MEMORY_OBJECT_NULL;
+ memory_object_control_t control;
+ int mapanon = 0;
+ int fpref = 0;
+ int error = 0;
int fd = uap->fd;
+ int num_retries = 0;
- user_addr = (mach_vm_offset_t)uap->addr;
- user_size = (mach_vm_size_t) uap->len;
+ /*
+ * Note that for UNIX03 conformance, there is additional parameter checking for
+ * the mmap() system call in libsyscall prior to entering the kernel. The sanity
+ * checks and argument validation done in this function are therefore not the
+ * only source of the errnos a caller may see.
+ */
+
+ user_map = current_map();
+ user_addr = (vm_map_offset_t)uap->addr;
+ user_size = (vm_map_size_t) uap->len;
AUDIT_ARG(addr, user_addr);
AUDIT_ARG(len, user_size);
AUDIT_ARG(fd, uap->fd);
+ if (vm_map_range_overflows(user_addr, user_size)) {
+ return EINVAL;
+ }
prot = (uap->prot & VM_PROT_ALL);
+#if 3777787
+ /*
+ * Since the hardware currently does not support writing without
+ * read-before-write, or execution-without-read, if the request is
+ * for write or execute access, we must imply read access as well;
+ * otherwise programs expecting this to work will fail to operate.
+ */
+ if (prot & (VM_PROT_EXECUTE | VM_PROT_WRITE)) {
+ prot |= VM_PROT_READ;
+ }
+#endif /* radar 3777787 */
+
flags = uap->flags;
vp = NULLVP;
/*
- * The vm code does not have prototypes & compiler doesn't do the'
- * the right thing when you cast 64bit value and pass it in function
+ * verify no unknown flags are passed in, and if any are,
+ * fail out early to make sure the logic below never has to deal
+ * with invalid flag values
+ */
+ if (flags & ~(MAP_SHARED |
+ MAP_PRIVATE |
+ MAP_COPY |
+ MAP_FIXED |
+ MAP_RENAME |
+ MAP_NORESERVE |
+ MAP_RESERVED0080 | //grandfathered in as accepted and ignored
+ MAP_NOEXTEND |
+ MAP_HASSEMAPHORE |
+ MAP_NOCACHE |
+ MAP_JIT |
+ MAP_FILE |
+ MAP_ANON |
+ MAP_RESILIENT_CODESIGN |
+ MAP_RESILIENT_MEDIA |
+#if XNU_TARGET_OS_OSX
+ MAP_32BIT |
+#endif
+ MAP_TRANSLATED_ALLOW_EXECUTE |
+ MAP_UNIX03)) {
+ if (proc_sdk(current_proc()) >= proc_2020_fall_os_sdk()) {
+ return EINVAL;
+ }
+ }
+
+
+ /*
+ * The vm code does not have prototypes & compiler doesn't do
+ * the right thing when you cast 64bit value and pass it in function
* call. So here it is.
*/
file_pos = (vm_object_offset_t)uap->pos;
/* make sure mapping fits into numeric range etc */
- if ((file_pos + user_size > (vm_object_offset_t)-PAGE_SIZE_64) ||
- ((flags & MAP_ANON) && fd != -1))
- return (EINVAL);
+ if (os_add3_overflow(file_pos, user_size, vm_map_page_size(user_map) - 1, &sum)) {
+ return EINVAL;
+ }
+
+ if (flags & MAP_UNIX03) {
+ vm_map_offset_t offset_alignment_mask;
+
+ /*
+ * Enforce UNIX03 compliance.
+ */
+
+ if (vm_map_is_exotic(current_map())) {
+ offset_alignment_mask = 0xFFF;
+ } else {
+ offset_alignment_mask = vm_map_page_mask(current_map());
+ }
+ if (file_pos & offset_alignment_mask) {
+ /* file offset should be page-aligned */
+ return EINVAL;
+ }
+ if (!(flags & (MAP_PRIVATE | MAP_SHARED))) {
+ /* need either MAP_PRIVATE or MAP_SHARED */
+ return EINVAL;
+ }
+ if (user_size == 0) {
+ /* mapping length should not be 0 */
+ return EINVAL;
+ }
+ }
/*
* Align the file position to a page boundary,
* and save its page offset component.
*/
- pageoff = (file_pos & PAGE_MASK);
+ pageoff = (file_pos & vm_map_page_mask(user_map));
file_pos -= (vm_object_offset_t)pageoff;
/* Adjust size for rounding (on both ends). */
- user_size += pageoff; /* low end... */
- user_size = mach_vm_round_page(user_size); /* hi end */
+ user_size += pageoff; /* low end... */
+ user_size = vm_map_round_page(user_size,
+ vm_map_page_mask(user_map)); /* hi end */
+
+
+ if (flags & MAP_JIT) {
+ if ((flags & MAP_FIXED) ||
+ (flags & MAP_SHARED) ||
+ !(flags & MAP_ANON) ||
+ (flags & MAP_RESILIENT_CODESIGN) ||
+ (flags & MAP_RESILIENT_MEDIA)) {
+ return EINVAL;
+ }
+ }
+ if ((flags & MAP_RESILIENT_CODESIGN) ||
+ (flags & MAP_RESILIENT_MEDIA)) {
+ if ((flags & MAP_ANON) ||
+ (flags & MAP_JIT)) {
+ return EINVAL;
+ }
+ }
+ if (flags & MAP_RESILIENT_CODESIGN) {
+ int reject_prot = ((flags & MAP_PRIVATE) ? VM_PROT_EXECUTE : (VM_PROT_WRITE | VM_PROT_EXECUTE));
+ if (prot & reject_prot) {
+ /*
+ * Quick sanity check. maxprot is calculated below and
+ * we will test it again.
+ */
+ return EPERM;
+ }
+ }
+ if (flags & MAP_SHARED) {
+ /*
+ * MAP_RESILIENT_MEDIA is not valid with MAP_SHARED because
+ * there is no place to inject zero-filled pages without
+ * actually adding them to the file.
+ * Since we didn't reject that combination before, there might
+ * already be callers using it and getting a valid MAP_SHARED
+ * mapping but without the resilience.
+ * For backwards compatibility's sake, let's keep ignoring
+ * MAP_RESILIENT_MEDIA in that case.
+ */
+ flags &= ~MAP_RESILIENT_MEDIA;
+ }
+ if (flags & MAP_RESILIENT_MEDIA) {
+ if ((flags & MAP_ANON) ||
+ (flags & MAP_SHARED)) {
+ return EINVAL;
+ }
+ }
/*
* Check for illegal addresses. Watch out for address wrap... Note
* should be aligned after adjustment by pageoff.
*/
user_addr -= pageoff;
- if (user_addr & PAGE_MASK)
- return (EINVAL);
+ if (user_addr & vm_map_page_mask(user_map)) {
+ return EINVAL;
+ }
}
#ifdef notyet
/* DO not have apis to get this info, need to wait till then*/
* There should really be a pmap call to determine a reasonable
* location.
*/
- else if (addr < mach_vm_round_page(p->p_vmspace->vm_daddr + MAXDSIZ))
- addr = mach_vm_round_page(p->p_vmspace->vm_daddr + MAXDSIZ);
+ else if (addr < vm_map_round_page(p->p_vmspace->vm_daddr + MAXDSIZ,
+ vm_map_page_mask(user_map))) {
+ addr = vm_map_round_page(p->p_vmspace->vm_daddr + MAXDSIZ,
+ vm_map_page_mask(user_map));
+ }
#endif
+ alloc_flags = 0;
if (flags & MAP_ANON) {
+ maxprot = VM_PROT_ALL;
+#if CONFIG_MACF
/*
- * Mapping blank space is trivial.
+ * Entitlement check.
*/
+ error = mac_proc_check_map_anon(p, user_addr, user_size, prot, flags, &maxprot);
+ if (error) {
+ return EINVAL;
+ }
+#endif /* MAC */
+
+ /*
+ * Mapping blank space is trivial. Use positive fds as the alias
+ * value for memory tracking.
+ */
+ if (fd != -1) {
+ /*
+ * Use "fd" to pass (some) Mach VM allocation flags,
+ * (see the VM_FLAGS_* definitions).
+ */
+ alloc_flags = fd & (VM_FLAGS_ALIAS_MASK |
+ VM_FLAGS_SUPERPAGE_MASK |
+ VM_FLAGS_PURGABLE |
+ VM_FLAGS_4GB_CHUNK);
+ if (alloc_flags != fd) {
+ /* reject if there are any extra flags */
+ return EINVAL;
+ }
+ VM_GET_FLAGS_ALIAS(alloc_flags, tag);
+ alloc_flags &= ~VM_FLAGS_ALIAS_MASK;
+ }
+
handle = NULL;
- maxprot = VM_PROT_ALL;
file_pos = 0;
+ pageoff = 0;
mapanon = 1;
} else {
struct vnode_attr va;
- struct vfs_context context;
+ vfs_context_t ctx = vfs_context_current();
+
+ if (flags & MAP_JIT) {
+ return EINVAL;
+ }
+
/*
* Mapping file, get fp for validation. Obtain vnode and make
* sure it is of appropriate type.
*/
err = fp_lookup(p, fd, &fp, 0);
- if (err)
- return(err);
+ if (err) {
+ return err;
+ }
fpref = 1;
- if(fp->f_fglob->fg_type == DTYPE_PSXSHM) {
+ switch (FILEGLOB_DTYPE(fp->fp_glob)) {
+ case DTYPE_PSXSHM:
uap->addr = (user_addr_t)user_addr;
uap->len = (user_size_t)user_size;
uap->prot = prot;
uap->pos = file_pos;
error = pshm_mmap(p, uap, retval, fp, (off_t)pageoff);
goto bad;
- }
-
- if (fp->f_fglob->fg_type != DTYPE_VNODE) {
+ case DTYPE_VNODE:
+ break;
+ default:
error = EINVAL;
goto bad;
}
- vp = (struct vnode *)fp->f_fglob->fg_data;
+ vp = (struct vnode *)fp->fp_glob->fg_data;
error = vnode_getwithref(vp);
- if(error != 0)
+ if (error != 0) {
goto bad;
+ }
if (vp->v_type != VREG && vp->v_type != VCHR) {
(void)vnode_put(vp);
}
AUDIT_ARG(vnpath, vp, ARG_VNODE1);
-
- /* conformance change - mmap needs to update access time for mapped
- * files
+
+ /*
+ * POSIX: mmap needs to update access time for mapped files
*/
- VATTR_INIT(&va);
- nanotime(&va.va_access_time);
- VATTR_SET_ACTIVE(&va, va_access_time);
- context.vc_proc = p;
- context.vc_ucred = kauth_cred_get();
- vnode_setattr(vp, &va, &context);
+ if ((vnode_vfsvisflags(vp) & MNT_NOATIME) == 0) {
+ VATTR_INIT(&va);
+ nanotime(&va.va_access_time);
+ VATTR_SET_ACTIVE(&va, va_access_time);
+ vnode_setattr(vp, &va, ctx);
+ }
/*
* XXX hack to handle use of /dev/zero to map anon memory (ala
* credentials do we use for determination? What if
* proc does a setuid?
*/
- maxprot = VM_PROT_EXECUTE; /* ??? */
- if (fp->f_fglob->fg_flag & FREAD)
+ maxprot = VM_PROT_EXECUTE; /* TODO: Remove this and restrict maxprot? */
+ if (fp->fp_glob->fg_flag & FREAD) {
maxprot |= VM_PROT_READ;
- else if (prot & PROT_READ) {
+ } else if (prot & PROT_READ) {
(void)vnode_put(vp);
error = EACCES;
goto bad;
* MAP_SHARED or via the implicit sharing of character
* device mappings), and we are trying to get write
* permission although we opened it without asking
- * for it, bail out.
+ * for it, bail out.
*/
if ((flags & MAP_SHARED) != 0) {
- if ((fp->f_fglob->fg_flag & FWRITE) != 0) {
- /*
- * check for write access
- *
- * Note that we already made this check when granting FWRITE
- * against the file, so it seems redundant here.
- */
- error = vnode_authorize(vp, NULL, KAUTH_VNODE_CHECKIMMUTABLE, &context);
-
- /* if not granted for any reason, but we wanted it, bad */
- if ((prot & PROT_WRITE) && (error != 0)) {
- vnode_put(vp);
- goto bad;
- }
-
- /* if writable, remember */
- if (error == 0)
- maxprot |= VM_PROT_WRITE;
-
+ if ((fp->fp_glob->fg_flag & FWRITE) != 0 &&
+ /*
+ * Do not allow writable mappings of
+ * swap files (see vm_swapfile_pager.c).
+ */
+ !vnode_isswap(vp)) {
+ /*
+ * check for write access
+ *
+ * Note that we already made this check when granting FWRITE
+ * against the file, so it seems redundant here.
+ */
+ error = vnode_authorize(vp, NULL, KAUTH_VNODE_CHECKIMMUTABLE, ctx);
+
+ /* if not granted for any reason, but we wanted it, bad */
+ if ((prot & PROT_WRITE) && (error != 0)) {
+ vnode_put(vp);
+ goto bad;
+ }
+
+ /* if writable, remember */
+ if (error == 0) {
+ maxprot |= VM_PROT_WRITE;
+ }
} else if ((prot & PROT_WRITE) != 0) {
(void)vnode_put(vp);
error = EACCES;
goto bad;
}
- } else
+ } else {
maxprot |= VM_PROT_WRITE;
+ }
handle = (void *)vp;
+#if CONFIG_MACF
+ error = mac_file_check_mmap(vfs_context_ucred(ctx),
+ fp->fp_glob, prot, flags, file_pos + pageoff,
+ &maxprot);
+ if (error) {
+ (void)vnode_put(vp);
+ goto bad;
+ }
+#endif /* MAC */
+ /*
+ * Consult the file system to determine if this
+ * particular file object can be mapped.
+ *
+ * N.B. If MAP_PRIVATE (i.e. CoW) has been specified,
+ * then we don't check for writeability on the file
+ * object, because it will only ever see reads.
+ */
+ error = VNOP_MMAP_CHECK(vp, (flags & MAP_PRIVATE) ?
+ (prot & ~PROT_WRITE) : prot, ctx);
+ if (error) {
+ (void)vnode_put(vp);
+ goto bad;
+ }
}
+
+ /*
+ * No copy-on-read for mmap() mappings themselves.
+ */
+ vmk_flags.vmkf_no_copy_on_read = 1;
}
- if (user_size == 0) {
- if (!mapanon)
+ if (user_size == 0) {
+ if (!mapanon) {
(void)vnode_put(vp);
+ }
error = 0;
goto bad;
}
* We bend a little - round the start and end addresses
* to the nearest page boundary.
*/
- user_size = mach_vm_round_page(user_size);
+ user_size = vm_map_round_page(user_size,
+ vm_map_page_mask(user_map));
- if (file_pos & PAGE_MASK_64) {
- if (!mapanon)
+ if (file_pos & vm_map_page_mask(user_map)) {
+ if (!mapanon) {
(void)vnode_put(vp);
+ }
error = EINVAL;
goto bad;
}
- user_map = current_map();
-
if ((flags & MAP_FIXED) == 0) {
- alloc_flags = VM_FLAGS_ANYWHERE;
- user_addr = mach_vm_round_page(user_addr);
+ alloc_flags |= VM_FLAGS_ANYWHERE;
+ user_addr = vm_map_round_page(user_addr,
+ vm_map_page_mask(user_map));
} else {
- if (user_addr != mach_vm_trunc_page(user_addr)) {
- if (!mapanon)
- (void)vnode_put(vp);
+ if (user_addr != vm_map_trunc_page(user_addr,
+ vm_map_page_mask(user_map))) {
+ if (!mapanon) {
+ (void)vnode_put(vp);
+ }
error = EINVAL;
goto bad;
}
* has to deallocate the existing mappings and establish the
* new ones atomically.
*/
- alloc_flags = VM_FLAGS_FIXED | VM_FLAGS_OVERWRITE;
+ alloc_flags |= VM_FLAGS_FIXED | VM_FLAGS_OVERWRITE;
}
+ if (flags & MAP_NOCACHE) {
+ alloc_flags |= VM_FLAGS_NO_CACHE;
+ }
+
+ if (flags & MAP_JIT) {
+ vmk_flags.vmkf_map_jit = TRUE;
+ }
+
+
+ if (flags & MAP_RESILIENT_CODESIGN) {
+ alloc_flags |= VM_FLAGS_RESILIENT_CODESIGN;
+ }
+ if (flags & MAP_RESILIENT_MEDIA) {
+ alloc_flags |= VM_FLAGS_RESILIENT_MEDIA;
+ }
+
+#if XNU_TARGET_OS_OSX
+ /* macOS-specific MAP_32BIT flag handling */
+ if (flags & MAP_32BIT) {
+ vmk_flags.vmkf_32bit_map_va = TRUE;
+ }
+#endif
/*
* Lookup/allocate object.
*/
if (handle == NULL) {
- pager = NULL;
+ control = NULL;
#ifdef notyet
/* Hmm .. */
#if defined(VM_PROT_READ_IS_EXEC)
- if (prot & VM_PROT_READ)
+ if (prot & VM_PROT_READ) {
prot |= VM_PROT_EXECUTE;
-
- if (maxprot & VM_PROT_READ)
+ }
+ if (maxprot & VM_PROT_READ) {
maxprot |= VM_PROT_EXECUTE;
+ }
#endif
#endif
- result = mach_vm_map(user_map, &user_addr, user_size, 0,
- alloc_flags, IPC_PORT_NULL, 0,
- FALSE, prot, maxprot,
- (flags & MAP_SHARED) ? VM_INHERIT_SHARE :
- VM_INHERIT_DEFAULT);
- if (result != KERN_SUCCESS)
- goto out;
+
+#if 3777787
+ if (prot & (VM_PROT_EXECUTE | VM_PROT_WRITE)) {
+ prot |= VM_PROT_READ;
+ }
+ if (maxprot & (VM_PROT_EXECUTE | VM_PROT_WRITE)) {
+ maxprot |= VM_PROT_READ;
+ }
+#endif /* radar 3777787 */
+map_anon_retry:
+
+ result = vm_map_enter_mem_object(user_map,
+ &user_addr, user_size,
+ 0, alloc_flags, vmk_flags,
+ tag,
+ IPC_PORT_NULL, 0, FALSE,
+ prot, maxprot,
+ (flags & MAP_SHARED) ?
+ VM_INHERIT_SHARE :
+ VM_INHERIT_DEFAULT);
+
+ /* If a non-binding (non-MAP_FIXED) address was specified for this
+ * anonymous mapping and the mapping operation failed due to
+ * lack of space between the address and the map's maximum,
+ * retry the mapping once with the base reset to the map's page size.
+ */
+ if ((result == KERN_NO_SPACE) && ((flags & MAP_FIXED) == 0) && user_addr && (num_retries++ == 0)) {
+ user_addr = vm_map_page_size(user_map);
+ goto map_anon_retry;
+ }
} else {
- UBCINFOCHECK("mmap", vp);
- pager = (vm_pager_t)ubc_getpager(vp);
-
- if (pager == NULL) {
+ if (vnode_isswap(vp)) {
+ /*
+ * Map swap files with a special pager
+ * that returns obfuscated contents.
+ */
+ control = NULL;
+ pager = swapfile_pager_setup(vp);
+ if (pager != MEMORY_OBJECT_NULL) {
+ control = swapfile_pager_control(pager);
+ }
+ } else {
+ control = ubc_getobject(vp, UBC_FLAGS_NONE);
+ }
+
+ if (control == NULL) {
(void)vnode_put(vp);
error = ENOMEM;
goto bad;
* Set credentials:
* FIXME: if we're writing the file we need a way to
* ensure that someone doesn't replace our R/W creds
- * with ones that only work for read.
+ * with ones that only work for read.
*/
- ubc_setcred(vp, p);
+ ubc_setthreadcred(vp, p, current_thread());
docow = FALSE;
- if ((flags & (MAP_ANON|MAP_SHARED)) == 0) {
+ if ((flags & (MAP_ANON | MAP_SHARED)) == 0) {
docow = TRUE;
}
#ifdef notyet
/* Hmm .. */
#if defined(VM_PROT_READ_IS_EXEC)
- if (prot & VM_PROT_READ)
+ if (prot & VM_PROT_READ) {
prot |= VM_PROT_EXECUTE;
-
- if (maxprot & VM_PROT_READ)
+ }
+ if (maxprot & VM_PROT_READ) {
maxprot |= VM_PROT_EXECUTE;
+ }
#endif
#endif /* notyet */
- result = mach_vm_map(user_map, &user_addr, user_size,
- 0, alloc_flags, (ipc_port_t)pager, file_pos,
- docow, prot, maxprot,
- (flags & MAP_SHARED) ? VM_INHERIT_SHARE :
- VM_INHERIT_DEFAULT);
+#if 3777787
+ if (prot & (VM_PROT_EXECUTE | VM_PROT_WRITE)) {
+ prot |= VM_PROT_READ;
+ }
+ if (maxprot & (VM_PROT_EXECUTE | VM_PROT_WRITE)) {
+ maxprot |= VM_PROT_READ;
+ }
+#endif /* radar 3777787 */
+
+map_file_retry:
+ if (flags & MAP_RESILIENT_CODESIGN) {
+ int reject_prot = ((flags & MAP_PRIVATE) ? VM_PROT_EXECUTE : (VM_PROT_WRITE | VM_PROT_EXECUTE));
+ if (prot & reject_prot) {
+ /*
+ * Would like to use (prot | maxprot) here
+ * but the assignment of VM_PROT_EXECUTE
+ * to maxprot above would always fail the test.
+ *
+ * Skipping the check is ok, however, because we
+ * restrict maxprot to prot just below in this
+ * block.
+ */
+ assert(!mapanon);
+ vnode_put(vp);
+ error = EPERM;
+ goto bad;
+ }
+ /* strictly limit access to "prot" */
+ maxprot &= prot;
+ }
- if (result != KERN_SUCCESS) {
- (void)vnode_put(vp);
- goto out;
+ vm_object_offset_t end_pos = 0;
+ if (os_add_overflow(user_size, file_pos, &end_pos)) {
+ vnode_put(vp);
+ error = EINVAL;
+ goto bad;
}
- (void)ubc_map(vp,(prot & ( PROT_EXEC | PROT_READ | PROT_WRITE | PROT_EXEC)));
+ result = vm_map_enter_mem_object_control(user_map,
+ &user_addr, user_size,
+ 0, alloc_flags, vmk_flags,
+ tag,
+ control, file_pos,
+ docow, prot, maxprot,
+ (flags & MAP_SHARED) ?
+ VM_INHERIT_SHARE :
+ VM_INHERIT_DEFAULT);
+
+ /* If a non-binding (non-MAP_FIXED) address was specified for this
+ * file backed mapping and the mapping operation failed due to
+ * lack of space between the address and the map's maximum,
+ * retry the mapping once with the base reset to the map's page size.
+ */
+ if ((result == KERN_NO_SPACE) && ((flags & MAP_FIXED) == 0) && user_addr && (num_retries++ == 0)) {
+ user_addr = vm_map_page_size(user_map);
+ goto map_file_retry;
+ }
}
- if (!mapanon)
+ if (!mapanon) {
(void)vnode_put(vp);
+ }
-out:
switch (result) {
case KERN_SUCCESS:
*retval = user_addr + pageoff;
break;
}
bad:
- if (fpref)
+ if (pager != MEMORY_OBJECT_NULL) {
+ /*
+ * Release the reference on the pager.
+ * If the mapping was successful, it now holds
+ * an extra reference.
+ */
+ memory_object_deallocate(pager);
+ }
+ if (fpref) {
fp_drop(p, fd, fp, 0);
- return(error);
+ }
+
+ KERNEL_DEBUG_CONSTANT((BSDDBG_CODE(DBG_BSD_SC_EXTENDED_INFO, SYS_mmap) | DBG_FUNC_NONE), fd, (uint32_t)(*retval), (uint32_t)user_size, error, 0);
+#if XNU_TARGET_OS_OSX
+ KERNEL_DEBUG_CONSTANT((BSDDBG_CODE(DBG_BSD_SC_EXTENDED_INFO2, SYS_mmap) | DBG_FUNC_NONE), (uint32_t)(*retval >> 32), (uint32_t)(user_size >> 32),
+ (uint32_t)(file_pos >> 32), (uint32_t)file_pos, 0);
+#endif /* XNU_TARGET_OS_OSX */
+ return error;
+}
+
+int
+msync(__unused proc_t p, struct msync_args *uap, int32_t *retval)
+{
+ __pthread_testcancel(1);
+ return msync_nocancel(p, (struct msync_nocancel_args *)uap, retval);
}
int
-msync(__unused struct proc *p, struct msync_args *uap, __unused register_t *retval)
+msync_nocancel(__unused proc_t p, struct msync_nocancel_args *uap, __unused int32_t *retval)
{
mach_vm_offset_t addr;
mach_vm_size_t size;
int flags;
vm_map_t user_map;
int rv;
- vm_sync_t sync_flags=0;
+ vm_sync_t sync_flags = 0;
+ user_map = current_map();
addr = (mach_vm_offset_t) uap->addr;
- size = (mach_vm_size_t)uap->len;
-
- if (addr & PAGE_MASK_64) {
+ size = (mach_vm_size_t) uap->len;
+#if XNU_TARGET_OS_OSX
+ KERNEL_DEBUG_CONSTANT((BSDDBG_CODE(DBG_BSD_SC_EXTENDED_INFO, SYS_msync) | DBG_FUNC_NONE), (uint32_t)(addr >> 32), (uint32_t)(size >> 32), 0, 0, 0);
+#endif /* XNU_TARGET_OS_OSX */
+ if (mach_vm_range_overflows(addr, size)) {
+ return EINVAL;
+ }
+ if (addr & vm_map_page_mask(user_map)) {
/* UNIX SPEC: user address is not page-aligned, return EINVAL */
return EINVAL;
}
/*
* We cannot support this properly without maintaining
* list all mmaps done. Cannot use vm_map_entry as they could be
- * split or coalesced by indepenedant actions. So instead of
+ * split or coalesced by independent actions. So instead of
* inaccurate results, lets just return error as invalid size
* specified
*/
- return (EINVAL); /* XXX breaks posix apps */
+ return EINVAL; /* XXX breaks posix apps */
}
flags = uap->flags;
/* disallow contradictory flags */
- if ((flags & (MS_SYNC|MS_ASYNC)) == (MS_SYNC|MS_ASYNC) ||
- (flags & (MS_ASYNC|MS_INVALIDATE)) == (MS_ASYNC|MS_INVALIDATE))
- return (EINVAL);
+ if ((flags & (MS_SYNC | MS_ASYNC)) == (MS_SYNC | MS_ASYNC)) {
+ return EINVAL;
+ }
- if (flags & MS_KILLPAGES)
- sync_flags |= VM_SYNC_KILLPAGES;
- if (flags & MS_DEACTIVATE)
- sync_flags |= VM_SYNC_DEACTIVATE;
- if (flags & MS_INVALIDATE)
- sync_flags |= VM_SYNC_INVALIDATE;
+ if (flags & MS_KILLPAGES) {
+ sync_flags |= VM_SYNC_KILLPAGES;
+ }
+ if (flags & MS_DEACTIVATE) {
+ sync_flags |= VM_SYNC_DEACTIVATE;
+ }
+ if (flags & MS_INVALIDATE) {
+ sync_flags |= VM_SYNC_INVALIDATE;
+ }
- if ( !(flags & (MS_KILLPAGES | MS_DEACTIVATE))) {
- if (flags & MS_ASYNC)
- sync_flags |= VM_SYNC_ASYNCHRONOUS;
- else
- sync_flags |= VM_SYNC_SYNCHRONOUS;
+ if (!(flags & (MS_KILLPAGES | MS_DEACTIVATE))) {
+ if (flags & MS_ASYNC) {
+ sync_flags |= VM_SYNC_ASYNCHRONOUS;
+ } else {
+ sync_flags |= VM_SYNC_SYNCHRONOUS;
+ }
}
- sync_flags |= VM_SYNC_CONTIGUOUS; /* complain if holes */
+ sync_flags |= VM_SYNC_CONTIGUOUS; /* complain if holes */
- user_map = current_map();
rv = mach_vm_msync(user_map, addr, size, sync_flags);
switch (rv) {
case KERN_SUCCESS:
break;
- case KERN_INVALID_ADDRESS: /* hole in region being sync'ed */
- return (ENOMEM);
+ case KERN_INVALID_ADDRESS: /* hole in region being sync'ed */
+ return ENOMEM;
case KERN_FAILURE:
- return (EIO);
+ return EIO;
default:
- return (EINVAL);
+ return EINVAL;
}
- return (0);
+ return 0;
}
int
-mremap(void)
-{
- /* Not yet implemented */
- return (ENOTSUP);
-}
-
-int
-munmap(__unused struct proc *p, struct munmap_args *uap, __unused register_t *retval)
+munmap(__unused proc_t p, struct munmap_args *uap, __unused int32_t *retval)
{
- mach_vm_offset_t user_addr;
- mach_vm_size_t user_size;
- kern_return_t result;
+ mach_vm_offset_t user_addr;
+ mach_vm_size_t user_size;
+ kern_return_t result;
+ vm_map_t user_map;
+ user_map = current_map();
user_addr = (mach_vm_offset_t) uap->addr;
user_size = (mach_vm_size_t) uap->len;
AUDIT_ARG(addr, user_addr);
AUDIT_ARG(len, user_size);
- if (user_addr & PAGE_MASK_64) {
+ if (user_addr & vm_map_page_mask(user_map)) {
/* UNIX SPEC: user address is not page-aligned, return EINVAL */
return EINVAL;
}
- if (user_addr + user_size < user_addr)
- return(EINVAL);
+ if (mach_vm_range_overflows(user_addr, user_size)) {
+ return EINVAL;
+ }
if (user_size == 0) {
/* UNIX SPEC: size is 0, return EINVAL */
return EINVAL;
}
- result = mach_vm_deallocate(current_map(), user_addr, user_size);
+ result = mach_vm_deallocate(user_map, user_addr, user_size);
if (result != KERN_SUCCESS) {
- return(EINVAL);
+ return EINVAL;
}
- return(0);
+ return 0;
}
/*
 * mprotect: change the protection on [uap->addr, uap->addr + uap->len) in
 * the caller's map (current_map()).
 *
 * Returns:
 *   0        mach_vm_protect() reported KERN_SUCCESS
 *   EINVAL   the range overflows, the address is not aligned to the map's
 *            page mask, or the VM layer returned an error not listed here
 *   EACCES   KERN_PROTECTION_FAILURE
 *   ENOMEM   KERN_INVALID_ADDRESS
 *   ENOTSUP  VM_PROT_TRUSTED requested without CONFIG_DYNAMIC_CODE_SIGNING
 *   (other)  whatever mac_proc_check_mprotect() returns, under CONFIG_MACF
 */
int
-mprotect(__unused struct proc *p, struct mprotect_args *uap, __unused register_t *retval)
+mprotect(__unused proc_t p, struct mprotect_args *uap, __unused int32_t *retval)
{
- register vm_prot_t prot;
- mach_vm_offset_t user_addr;
- mach_vm_size_t user_size;
- kern_return_t result;
- vm_map_t user_map;
+ vm_prot_t prot;
+ mach_vm_offset_t user_addr;
+ mach_vm_size_t user_size;
+ kern_return_t result;
+ vm_map_t user_map;
+#if CONFIG_MACF
+ int error;
+#endif
AUDIT_ARG(addr, uap->addr);
AUDIT_ARG(len, uap->len);
- AUDIT_ARG(value, uap->prot);
+ AUDIT_ARG(value32, uap->prot);
+ user_map = current_map();
user_addr = (mach_vm_offset_t) uap->addr;
user_size = (mach_vm_size_t) uap->len;
/* Mask off everything except VM_PROT_ALL, VM_PROT_TRUSTED and VM_PROT_STRIP_READ. */
- prot = (vm_prot_t)(uap->prot & VM_PROT_ALL);
+ prot = (vm_prot_t)(uap->prot & (VM_PROT_ALL | VM_PROT_TRUSTED | VM_PROT_STRIP_READ));
- if (user_addr & PAGE_MASK_64) {
+ if (mach_vm_range_overflows(user_addr, user_size)) {
+ return EINVAL;
+ }
+ if (user_addr & vm_map_page_mask(user_map)) {
/* UNIX SPEC: user address is not page-aligned, return EINVAL */
return EINVAL;
}
-
+
#ifdef notyet
/* Hmm .. */
#if defined(VM_PROT_READ_IS_EXEC)
- if (prot & VM_PROT_READ)
+ if (prot & VM_PROT_READ) {
prot |= VM_PROT_EXECUTE;
+ }
#endif
#endif /* notyet */
- user_map = current_map();
/* A request for write or execute access is widened to include read access. */
+#if 3936456
+ if (prot & (VM_PROT_EXECUTE | VM_PROT_WRITE)) {
+ prot |= VM_PROT_READ;
+ }
+#endif /* 3936456 */
+
/* VM_PROT_STRIP_READ (arm64 only): clear both the read bit and the request bit itself. */
+#if defined(__arm64__)
+ if (prot & VM_PROT_STRIP_READ) {
+ prot &= ~(VM_PROT_READ | VM_PROT_STRIP_READ);
+ }
+#endif
+
+#if CONFIG_MACF
+ /*
+ * The MAC check for mprotect is of limited use for 2 reasons:
+ * Without mmap revocation, the caller could have asked for the max
+ * protections initially instead of a reduced set, so a mprotect
+ * check would offer no new security.
+ * It is not possible to extract the vnode from the pager object(s)
+ * of the target memory range.
+ * However, the MAC check may be used to prevent a process from,
+ * e.g., making the stack executable.
+ */
+ error = mac_proc_check_mprotect(p, user_addr,
+ user_size, prot);
+ if (error) {
+ return error;
+ }
+#endif
+
+ if (prot & VM_PROT_TRUSTED) {
+#if CONFIG_DYNAMIC_CODE_SIGNING
+ /* CODE SIGNING ENFORCEMENT - JIT support */
+ /* The special protection value VM_PROT_TRUSTED requests that we treat
+ * this page as if it had a valid code signature.
+ * If this is enabled, there MUST be a MAC policy implementing the
+ * mac_proc_check_mprotect() hook above. Otherwise, Codesigning will be
+ * compromised because the check would always succeed and thusly any
+ * process could sign dynamically. */
+ result = vm_map_sign(
+ user_map,
+ vm_map_trunc_page(user_addr,
+ vm_map_page_mask(user_map)),
+ vm_map_round_page(user_addr + user_size,
+ vm_map_page_mask(user_map)));
+ switch (result) {
+ case KERN_SUCCESS:
+ break;
+ case KERN_INVALID_ADDRESS:
+ /* UNIX SPEC: for an invalid address range, return ENOMEM */
+ return ENOMEM;
+ default:
+ return EINVAL;
+ }
+#else
+ return ENOTSUP;
+#endif
+ }
/* VM_PROT_TRUSTED was consumed above; do not pass it on to mach_vm_protect(). */
+ prot &= ~VM_PROT_TRUSTED;
result = mach_vm_protect(user_map, user_addr, user_size,
- FALSE, prot);
+ FALSE, prot);
switch (result) {
case KERN_SUCCESS:
- return (0);
+ return 0;
case KERN_PROTECTION_FAILURE:
- return (EACCES);
+ return EACCES;
case KERN_INVALID_ADDRESS:
/* UNIX SPEC: for an invalid address range, return ENOMEM */
return ENOMEM;
}
/* Any other kern_return_t is reported as EINVAL. */
- return (EINVAL);
+ return EINVAL;
}
/*
 * minherit: apply the inheritance value uap->inherit to
 * [uap->addr, uap->addr + uap->len) in the caller's map via
 * mach_vm_inherit().
 *
 * Returns 0 on KERN_SUCCESS, EACCES on KERN_PROTECTION_FAILURE, and EINVAL
 * when the range overflows or for any other VM-layer result.
 */
int
-minherit(__unused struct proc *p, struct minherit_args *uap, __unused register_t *retval)
+minherit(__unused proc_t p, struct minherit_args *uap, __unused int32_t *retval)
{
mach_vm_offset_t addr;
mach_vm_size_t size;
- register vm_inherit_t inherit;
- vm_map_t user_map;
- kern_return_t result;
+ vm_inherit_t inherit;
+ vm_map_t user_map;
+ kern_return_t result;
AUDIT_ARG(addr, uap->addr);
AUDIT_ARG(len, uap->len);
- AUDIT_ARG(value, uap->inherit);
+ AUDIT_ARG(value32, uap->inherit);
addr = (mach_vm_offset_t)uap->addr;
size = (mach_vm_size_t)uap->len;
inherit = uap->inherit;
-
+ if (mach_vm_range_overflows(addr, size)) {
+ return EINVAL;
+ }
user_map = current_map();
result = mach_vm_inherit(user_map, addr, size,
- inherit);
+ inherit);
switch (result) {
case KERN_SUCCESS:
- return (0);
+ return 0;
case KERN_PROTECTION_FAILURE:
- return (EACCES);
+ return EACCES;
}
/* Any other kern_return_t is reported as EINVAL. */
- return (EINVAL);
+ return EINVAL;
}
/*
 * madvise: translate the MADV_* value in uap->behav into the matching
 * VM_BEHAVIOR_* value and apply it to [uap->addr, uap->addr + uap->len) in
 * the caller's map via mach_vm_behavior_set().
 *
 * Returns:
 *   0        KERN_SUCCESS
 *   EINVAL   unknown uap->behav, overflowing range, KERN_INVALID_ADDRESS,
 *            any VM-layer result not listed here, or (arm64 only) the
 *            address-0 MADV_FREE / MADV_FREE_REUSABLE case below
 *   ENOMEM   KERN_NO_SPACE
 *   ENOTSUP  MADV_PAGEOUT when MACH_ASSERT is not enabled
 */
int
-madvise(__unused struct proc *p, struct madvise_args *uap, __unused register_t *retval)
+madvise(__unused proc_t p, struct madvise_args *uap, __unused int32_t *retval)
{
vm_map_t user_map;
mach_vm_offset_t start;
mach_vm_size_t size;
vm_behavior_t new_behavior;
- kern_return_t result;
+ kern_return_t result;
/*
* Since this routine is only advisory, we default to conservative
* behavior.
*/
switch (uap->behav) {
- case MADV_RANDOM:
- new_behavior = VM_BEHAVIOR_RANDOM;
- break;
- case MADV_SEQUENTIAL:
- new_behavior = VM_BEHAVIOR_SEQUENTIAL;
- break;
- case MADV_NORMAL:
- new_behavior = VM_BEHAVIOR_DEFAULT;
- break;
- case MADV_WILLNEED:
- new_behavior = VM_BEHAVIOR_WILLNEED;
- break;
- case MADV_DONTNEED:
- new_behavior = VM_BEHAVIOR_DONTNEED;
- break;
- default:
- return(EINVAL);
+ case MADV_RANDOM:
+ new_behavior = VM_BEHAVIOR_RANDOM;
+ break;
+ case MADV_SEQUENTIAL:
+ new_behavior = VM_BEHAVIOR_SEQUENTIAL;
+ break;
+ case MADV_NORMAL:
+ new_behavior = VM_BEHAVIOR_DEFAULT;
+ break;
+ case MADV_WILLNEED:
+ new_behavior = VM_BEHAVIOR_WILLNEED;
+ break;
+ case MADV_DONTNEED:
+ new_behavior = VM_BEHAVIOR_DONTNEED;
+ break;
+ case MADV_FREE:
+ new_behavior = VM_BEHAVIOR_FREE;
+ break;
+ case MADV_ZERO_WIRED_PAGES:
+ new_behavior = VM_BEHAVIOR_ZERO_WIRED_PAGES;
+ break;
+ case MADV_FREE_REUSABLE:
+ new_behavior = VM_BEHAVIOR_REUSABLE;
+ break;
+ case MADV_FREE_REUSE:
+ new_behavior = VM_BEHAVIOR_REUSE;
+ break;
+ case MADV_CAN_REUSE:
+ new_behavior = VM_BEHAVIOR_CAN_REUSE;
+ break;
+ case MADV_PAGEOUT:
+#if MACH_ASSERT
+ new_behavior = VM_BEHAVIOR_PAGEOUT;
+ break;
+#else /* MACH_ASSERT */
+ return ENOTSUP;
+#endif /* MACH_ASSERT */
+ default:
+ return EINVAL;
}
start = (mach_vm_offset_t) uap->addr;
size = (mach_vm_size_t) uap->len;
-
+ if (mach_vm_range_overflows(start, size)) {
+ return EINVAL;
+ }
/*
 * arm64 only: refuse MADV_FREE / MADV_FREE_REUSABLE on a non-empty range
 * that starts at address 0, logging the attempt and firing a DTrace probe.
 */
+#if __arm64__
+ if (start == 0 &&
+ size != 0 &&
+ (uap->behav == MADV_FREE ||
+ uap->behav == MADV_FREE_REUSABLE)) {
+ printf("** FOURK_COMPAT: %d[%s] "
+ "failing madvise(0x%llx,0x%llx,%s)\n",
+ p->p_pid, p->p_comm, start, size,
+ ((uap->behav == MADV_FREE_REUSABLE)
+ ? "MADV_FREE_REUSABLE"
+ : "MADV_FREE"));
+ DTRACE_VM3(fourk_compat_madvise,
+ uint64_t, start,
+ uint64_t, size,
+ int, uap->behav);
+ return EINVAL;
+ }
+#endif /* __arm64__ */
+
user_map = current_map();
result = mach_vm_behavior_set(user_map, start, size, new_behavior);
switch (result) {
- case KERN_SUCCESS:
- return (0);
- case KERN_INVALID_ADDRESS:
- return (ENOMEM);
+ case KERN_SUCCESS:
+ return 0;
+ case KERN_INVALID_ADDRESS:
+ return EINVAL;
+ case KERN_NO_SPACE:
+ return ENOMEM;
}
/* Any other kern_return_t is reported as EINVAL. */
- return (EINVAL);
+ return EINVAL;
}
/*
 * mincore: write one status byte per page of [uap->addr, uap->addr + uap->len)
 * into the user buffer at uap->vec. Each byte is a combination of the
 * MINCORE_* flags derived from the page's VM_PAGE_QUERY_* disposition.
 *
 * The range is expanded to the caller map's page boundaries and processed in
 * chunks of at most MAX_PAGE_RANGE_QUERY bytes; each chunk is queried with
 * vm_map_page_range_info_internal() and copied out separately.
 *
 * Returns:
 *   0       success, or the rounded range is empty
 *   EINVAL  the rounded end lies below the start address
 *   ENOMEM  one of the temporary kernel buffers could not be allocated
 *   EFAULT  copyout() to uap->vec failed
 */
int
-mincore(__unused struct proc *p, struct mincore_args *uap, __unused register_t *retval)
+mincore(__unused proc_t p, struct mincore_args *uap, __unused int32_t *retval)
{
- mach_vm_offset_t addr, first_addr, end;
- vm_map_t map;
- user_addr_t vec;
- int error;
- int vecindex, lastvecindex;
- int mincoreinfo=0;
- int pqueryinfo;
- kern_return_t ret;
- int numref;
-
- char c;
+ mach_vm_offset_t addr = 0, first_addr = 0, end = 0, cur_end = 0;
+ vm_map_t map = VM_MAP_NULL;
+ user_addr_t vec = 0;
+ int error = 0;
+ int64_t lastvecindex = 0;
+ int mincoreinfo = 0;
+ int pqueryinfo = 0;
+ uint64_t pqueryinfo_vec_size = 0;
+ vm_page_info_basic_t info = NULL;
+ mach_msg_type_number_t count = 0;
+ char *kernel_vec = NULL;
+ uint64_t req_vec_size_pages = 0, cur_vec_size_pages = 0, vecindex = 0;
+ kern_return_t kr = KERN_SUCCESS;
+ int effective_page_shift, effective_page_size;
map = current_map();
+ /*
+ * On systems with 4k kernel space and 16k user space, we will
+ * use the kernel page size to report back the residency information.
+ * This is for backwards compatibility since we already have
+ * processes that depend on this behavior.
+ */
+ if (vm_map_page_shift(map) < PAGE_SHIFT) {
+ effective_page_shift = vm_map_page_shift(map);
+ effective_page_size = vm_map_page_size(map);
+ } else {
+ effective_page_shift = PAGE_SHIFT;
+ effective_page_size = PAGE_SIZE;
+ }
+
/*
* Make sure that the addresses presented are valid for user
* mode.
*/
- first_addr = addr = mach_vm_trunc_page(uap->addr);
- end = addr + mach_vm_round_page(uap->len);
+ first_addr = addr = vm_map_trunc_page(uap->addr,
+ vm_map_page_mask(map));
+ end = vm_map_round_page(uap->addr + uap->len,
+ vm_map_page_mask(map));
- if (end < addr)
- return (EINVAL);
+ if (end < addr) {
+ return EINVAL;
+ }
+
+ if (end == addr) {
+ return 0;
+ }
/*
- * Address of byte vector
+ * We are going to loop through the whole 'req_vec_size' pages
+ * range in chunks of 'cur_vec_size'.
*/
- vec = uap->vec;
- map = current_map();
+ req_vec_size_pages = (end - addr) >> effective_page_shift;
+ cur_vec_size_pages = MIN(req_vec_size_pages, (MAX_PAGE_RANGE_QUERY >> effective_page_shift));
/* One status byte per page of the first (largest) chunk. */
+ size_t kernel_vec_size = cur_vec_size_pages;
+
+ kernel_vec = kheap_alloc(KHEAP_TEMP, kernel_vec_size, Z_WAITOK | Z_ZERO);
+
+ if (kernel_vec == NULL) {
+ return ENOMEM;
+ }
/*
- * Do this on a map entry basis so that if the pages are not
- * in the current processes address space, we can easily look
- * up the pages elsewhere.
+ * Address of byte vector
*/
- lastvecindex = -1;
- for( ; addr < end; addr += PAGE_SIZE ) {
- pqueryinfo = 0;
- ret = vm_map_page_query(map, addr, &pqueryinfo, &numref);
- if (ret != KERN_SUCCESS)
- pqueryinfo = 0;
- mincoreinfo = 0;
- if (pqueryinfo & VM_PAGE_QUERY_PAGE_PRESENT)
- mincoreinfo |= MINCORE_INCORE;
- if (pqueryinfo & VM_PAGE_QUERY_PAGE_REF)
- mincoreinfo |= MINCORE_REFERENCED;
- if (pqueryinfo & VM_PAGE_QUERY_PAGE_DIRTY)
- mincoreinfo |= MINCORE_MODIFIED;
-
-
- /*
- * calculate index into user supplied byte vector
- */
- vecindex = (addr - first_addr)>> PAGE_SHIFT;
+ vec = uap->vec;
+
+ pqueryinfo_vec_size = cur_vec_size_pages * sizeof(struct vm_page_info_basic);
+
+ info = kheap_alloc(KHEAP_TEMP, pqueryinfo_vec_size, Z_WAITOK);
+
+ if (info == NULL) {
+ kheap_free(KHEAP_TEMP, kernel_vec, kernel_vec_size);
+ return ENOMEM;
+ }
+
+ while (addr < end) {
+ cur_end = addr + (cur_vec_size_pages * effective_page_size);
+
+ count = VM_PAGE_INFO_BASIC_COUNT;
+ kr = vm_map_page_range_info_internal(map,
+ addr,
+ cur_end,
+ effective_page_shift,
+ VM_PAGE_INFO_BASIC,
+ (vm_page_info_t) info,
+ &count);
+
/*
 * NOTE(review): kr is only examined by this assert; if assert() compiles
 * out on some build, a failed query would go unnoticed - confirm intended.
 */
+ assert(kr == KERN_SUCCESS);
/*
- * If we have skipped map entries, we need to make sure that
- * the byte vector is zeroed for those skipped entries.
+ * Do this on a map entry basis so that if the pages are not
+ * in the current process's address space, we can easily look
+ * up the pages elsewhere.
*/
- while((lastvecindex + 1) < vecindex) {
- c = 0;
- error = copyout(&c, vec + lastvecindex, 1);
- if (error) {
- return (EFAULT);
/* lastvecindex + 1 is the index of the next info[] entry within this chunk. */
+ lastvecindex = -1;
+
+ for (; addr < cur_end; addr += effective_page_size) {
+ pqueryinfo = info[lastvecindex + 1].disposition;
+
+ mincoreinfo = 0;
+
+ if (pqueryinfo & VM_PAGE_QUERY_PAGE_PRESENT) {
+ mincoreinfo |= MINCORE_INCORE;
+ }
+ if (pqueryinfo & VM_PAGE_QUERY_PAGE_REF) {
+ mincoreinfo |= MINCORE_REFERENCED;
+ }
+ if (pqueryinfo & VM_PAGE_QUERY_PAGE_DIRTY) {
+ mincoreinfo |= MINCORE_MODIFIED;
+ }
+ if (pqueryinfo & VM_PAGE_QUERY_PAGE_PAGED_OUT) {
+ mincoreinfo |= MINCORE_PAGED_OUT;
+ }
+ if (pqueryinfo & VM_PAGE_QUERY_PAGE_COPIED) {
+ mincoreinfo |= MINCORE_COPIED;
}
- ++lastvecindex;
+ if ((pqueryinfo & VM_PAGE_QUERY_PAGE_EXTERNAL) == 0) {
+ mincoreinfo |= MINCORE_ANONYMOUS;
+ }
+ /*
+ * calculate index into user supplied byte vector
+ */
+ vecindex = (addr - first_addr) >> effective_page_shift;
+ kernel_vec[vecindex] = (char)mincoreinfo;
+ lastvecindex = vecindex;
}
- /*
- * Pass the page information to the user
- */
- c = (char)mincoreinfo;
- error = copyout(&c, vec + vecindex, 1);
+
+ assert(vecindex == (cur_vec_size_pages - 1));
+
+ error = copyout(kernel_vec, vec, cur_vec_size_pages * sizeof(char) /* a char per page */);
+
if (error) {
- return (EFAULT);
+ break;
}
- lastvecindex = vecindex;
+
+ /*
+ * For the next chunk, we'll need:
+ * - bump the location in the user buffer for our next disposition.
+ * - new length
+ * - starting address
+ */
+ vec += cur_vec_size_pages * sizeof(char);
+ req_vec_size_pages = (end - addr) >> effective_page_shift;
+ cur_vec_size_pages = MIN(req_vec_size_pages, (MAX_PAGE_RANGE_QUERY >> effective_page_shift));
+
/* Rebase first_addr so vecindex restarts at 0 for the next chunk. */
+ first_addr = addr;
}
/* Both buffers are released with the sizes computed when they were allocated. */
+ kheap_free(KHEAP_TEMP, info, pqueryinfo_vec_size);
+ kheap_free(KHEAP_TEMP, kernel_vec, kernel_vec_size);
- /*
- * Zero the last entries in the byte vector.
- */
- vecindex = (end - first_addr) >> PAGE_SHIFT;
- while((lastvecindex + 1) < vecindex) {
- c = 0;
- error = copyout(&c, vec + lastvecindex, 1);
- if (error) {
- return (EFAULT);
- }
- ++lastvecindex;
/* Any copyout() failure from the loop above is reported as EFAULT. */
+ if (error) {
+ return EFAULT;
}
-
- return (0);
+
+ return 0;
}
/*
 * mlock: wire the pages covering [uap->addr, uap->addr + uap->len) in the
 * caller's map by calling vm_map_wire_kernel() with VM_PROT_NONE and the
 * VM_KERN_MEMORY_MLOCK tag.
 *
 * Returns:
 *   0       success, or uap->len is 0
 *   EINVAL  the range overflows
 *   EAGAIN  KERN_RESOURCE_SHORTAGE
 *   EACCES  KERN_PROTECTION_FAILURE
 *   ENOMEM  any other failure from vm_map_wire_kernel()
 */
int
-mlock(__unused struct proc *p, struct mlock_args *uap, __unused register_t *retvalval)
+mlock(__unused proc_t p, struct mlock_args *uap, __unused int32_t *retvalval)
{
vm_map_t user_map;
vm_map_offset_t addr;
vm_map_size_t size, pageoff;
- kern_return_t result;
+ kern_return_t result;
AUDIT_ARG(addr, uap->addr);
AUDIT_ARG(len, uap->len);
addr = (vm_map_offset_t) uap->addr;
size = (vm_map_size_t)uap->len;
- /* disable wrap around */
- if (addr + size < addr)
- return (EINVAL);
-
- if (size == 0)
- return (0);
+ if (vm_map_range_overflows(addr, size)) {
+ return EINVAL;
+ }
- pageoff = (addr & PAGE_MASK);
- addr -= pageoff;
- size = vm_map_round_page(size+pageoff);
-
-#ifdef notyet
-/* Hmm.. What am I going to do with this? */
- if (atop(size) + cnt.v_wire_count > vm_page_max_wired)
- return (EAGAIN);
-#ifdef pmap_wired_count
- if (size + ptoa(pmap_wired_count(vm_map_pmap(&p->p_vmspace->vm_map))) >
- p->p_rlimit[RLIMIT_MEMLOCK].rlim_cur)
- return (ENOMEM);
-#else
- error = suser(kauth_cred_get(), &p->p_acflag);
- if (error)
- return (error);
-#endif
-#endif /* notyet */
+ if (size == 0) {
+ return 0;
+ }
user_map = current_map();
/*
 * Widen the range to whole pages of the target map: align addr down and
 * add the dropped offset to size before rounding size up.
 */
+ pageoff = (addr & vm_map_page_mask(user_map));
+ addr -= pageoff;
+ size = vm_map_round_page(size + pageoff, vm_map_page_mask(user_map));
/* have to call vm_map_wire directly to pass "I don't know" protections */
- result = vm_map_wire(user_map, addr, addr+size, VM_PROT_NONE, TRUE);
- return (result == KERN_SUCCESS ? 0 : ENOMEM);
+ result = vm_map_wire_kernel(user_map, addr, addr + size, VM_PROT_NONE, VM_KERN_MEMORY_MLOCK, TRUE);
+
+ if (result == KERN_RESOURCE_SHORTAGE) {
+ return EAGAIN;
+ } else if (result == KERN_PROTECTION_FAILURE) {
+ return EACCES;
+ } else if (result != KERN_SUCCESS) {
+ return ENOMEM;
+ }
+
+ return 0; /* KERN_SUCCESS */
}
/*
 * munlock: counterpart of mlock for [uap->addr, uap->addr + uap->len) in
 * the caller's map, implemented as a mach_vm_wire_kernel() call with
 * VM_PROT_NONE and the VM_KERN_MEMORY_MLOCK tag.
 *
 * Returns 0 on KERN_SUCCESS, EINVAL when the range overflows, and ENOMEM
 * for any other result.
 */
int
-munlock(__unused struct proc *p, struct munlock_args *uap, __unused register_t *retval)
+munlock(__unused proc_t p, struct munlock_args *uap, __unused int32_t *retval)
{
mach_vm_offset_t addr;
mach_vm_size_t size;
vm_map_t user_map;
- kern_return_t result;
+ kern_return_t result;
AUDIT_ARG(addr, uap->addr);
- AUDIT_ARG(addr, uap->len);
+ AUDIT_ARG(len, uap->len);
addr = (mach_vm_offset_t) uap->addr;
size = (mach_vm_size_t)uap->len;
-
-
-#ifdef notyet
-/* Hmm.. What am I going to do with this? */
-#ifndef pmap_wired_count
- error = suser(kauth_cred_get(), &p->p_acflag);
- if (error)
- return (error);
-#endif
-#endif /* notyet */
-
user_map = current_map();
-
+ if (mach_vm_range_overflows(addr, size)) {
+ return EINVAL;
+ }
/* JMM - need to remove all wirings by spec - this just removes one */
- result = mach_vm_wire(host_priv_self(), user_map, addr, size, VM_PROT_NONE);
- return (result == KERN_SUCCESS ? 0 : ENOMEM);
+ result = mach_vm_wire_kernel(host_priv_self(), user_map, addr, size, VM_PROT_NONE, VM_KERN_MEMORY_MLOCK);
+ return result == KERN_SUCCESS ? 0 : ENOMEM;
}
/* mlockall: not implemented; ignores its arguments and always returns ENOSYS. */
int
-mlockall(__unused struct proc *p, __unused struct mlockall_args *uap, __unused register_t *retval)
+mlockall(__unused proc_t p, __unused struct mlockall_args *uap, __unused int32_t *retval)
{
- return (ENOSYS);
+ return ENOSYS;
}
/* munlockall: not implemented; ignores its arguments and always returns ENOSYS. */
int
-munlockall(__unused struct proc *p, __unused struct munlockall_args *uap, __unused register_t *retval)
+munlockall(__unused proc_t p, __unused struct munlockall_args *uap, __unused int32_t *retval)
{
- return(ENOSYS);
+ return ENOSYS;
}
-
-/* BEGIN DEFUNCT */
+#if CONFIG_CODE_DECRYPTION
/*
 * mremap_encrypted: remap [uap->addr, uap->addr + uap->len) of the caller's
 * map through a decrypter chosen by uap->cryptid, using
 * vm_map_apple_protected().
 *
 * Steps: validate the range, pick the decrypter name from cryptid, find the
 * vnode backing uap->addr and its path, create the decrypter with
 * text_crypter_create(), then remap the range.
 *
 * Returns:
 *   0        success, or cryptid is CRYPTID_NO_ENCRYPTION (nothing to do)
 *   EINVAL   overflowing or unaligned range, unknown cryptid, address not
 *            backed by a file, or vnode_getwithvid() failed
 *   ENOTSUP  text_crypter_create is NULL
 *   EPERM    text_crypter_create() returned kIOReturnNotPrivileged, or
 *            vm_map_apple_protected() failed
 *   ENOMEM   any other text_crypter_create() failure
 *   (other)  the error returned by vn_getpath()
 */
int
-obreak(__unused struct proc *p, __unused struct obreak_args *uap, __unused register_t *retval)
+mremap_encrypted(__unused struct proc *p, struct mremap_encrypted_args *uap, __unused int32_t *retval)
{
- /* Not implemented, obsolete */
- return (ENOMEM);
-}
-
-int both;
+ mach_vm_offset_t user_addr;
+ mach_vm_size_t user_size;
+ kern_return_t result;
+ vm_map_t user_map;
+ uint32_t cryptid;
+ cpu_type_t cputype;
+ cpu_subtype_t cpusubtype;
+ pager_crypt_info_t crypt_info;
+ const char * cryptname = 0;
+ char *vpath;
+ int len, ret;
+ struct proc_regioninfo_internal pinfo;
+ vnode_t vp;
+ uintptr_t vnodeaddr;
+ uint32_t vid;
-int
-ovadvise(__unused struct proc *p, __unused struct ovadvise_args *uap, __unused register_t *retval)
-{
-
-#ifdef lint
- both = 0;
-#endif
- return( 0 );
-}
-/* END DEFUNCT */
-
-/* USV: No! need to obsolete map_fd()! mmap() already supports 64 bits */
-kern_return_t
-map_fd(struct map_fd_args *args)
-{
- int fd = args->fd;
- vm_offset_t offset = args->offset;
- vm_offset_t *va = args->va;
- boolean_t findspace = args->findspace;
- vm_size_t size = args->size;
- kern_return_t ret;
-
- AUDIT_MACH_SYSCALL_ENTER(AUE_MAPFD);
- AUDIT_ARG(addr, CAST_DOWN(user_addr_t, va));
- AUDIT_ARG(fd, fd);
-
- ret = map_fd_funneled( fd, (vm_object_offset_t)offset, va, findspace, size);
-
- AUDIT_MACH_SYSCALL_EXIT(ret);
- return ret;
-}
+ AUDIT_ARG(addr, uap->addr);
+ AUDIT_ARG(len, uap->len);
-kern_return_t
-map_fd_funneled(
- int fd,
- vm_object_offset_t offset,
- vm_offset_t *va,
- boolean_t findspace,
- vm_size_t size)
-{
- kern_return_t result;
- struct fileproc *fp;
- struct vnode *vp;
- void * pager;
- vm_offset_t map_addr=0;
- vm_size_t map_size;
- int err=0;
- vm_map_t my_map;
- struct proc *p =(struct proc *)current_proc();
- struct vnode_attr vattr;
- struct vfs_context context;
+ user_map = current_map();
+ user_addr = (mach_vm_offset_t) uap->addr;
+ user_size = (mach_vm_size_t) uap->len;
- /*
- * Find the inode; verify that it's a regular file.
- */
+ cryptid = uap->cryptid;
+ cputype = uap->cputype;
+ cpusubtype = uap->cpusubtype;
- err = fp_lookup(p, fd, &fp, 0);
- if (err)
- return(err);
-
- if (fp->f_fglob->fg_type != DTYPE_VNODE){
- err = KERN_INVALID_ARGUMENT;
- goto bad;
+ if (mach_vm_range_overflows(user_addr, user_size)) {
+ return EINVAL;
}
-
- if (!(fp->f_fglob->fg_flag & FREAD)) {
- err = KERN_PROTECTION_FAILURE;
- goto bad;
+ if (user_addr & vm_map_page_mask(user_map)) {
+ /* UNIX SPEC: user address is not page-aligned, return EINVAL */
+ return EINVAL;
}
- vp = (struct vnode *)fp->f_fglob->fg_data;
- err = vnode_getwithref(vp);
- if(err != 0)
- goto bad;
-
- if (vp->v_type != VREG) {
- (void)vnode_put(vp);
- err = KERN_INVALID_ARGUMENT;
- goto bad;
/* Select the decrypter name from cryptid; unknown values are rejected. */
+ switch (cryptid) {
+ case CRYPTID_NO_ENCRYPTION:
+ /* not encrypted, just an empty load command */
+ return 0;
+ case CRYPTID_APP_ENCRYPTION:
+ case CRYPTID_MODEL_ENCRYPTION:
+ cryptname = "com.apple.unfree";
+ break;
+ case 0x10:
+ /* some random cryptid that you could manually put into
+ * your binary if you want NULL */
+ cryptname = "com.apple.null";
+ break;
+ default:
+ return EINVAL;
}
- AUDIT_ARG(vnpath, vp, ARG_VNODE1);
-
- /* conformance change - mmap needs to update access time for mapped
- * files
- */
- VATTR_INIT(&vattr);
- nanotime(&vattr.va_access_time);
- VATTR_SET_ACTIVE(&vattr, va_access_time);
- context.vc_proc = p;
- context.vc_ucred = kauth_cred_get();
- vnode_setattr(vp, &vattr, &context);
-
- if (offset & PAGE_MASK_64) {
- printf("map_fd: file offset not page aligned(%d : %s)\n",p->p_pid, p->p_comm);
- (void)vnode_put(vp);
- err = KERN_INVALID_ARGUMENT;
- goto bad;
/* A decrypter cannot be created when text_crypter_create is NULL. */
+ if (NULL == text_crypter_create) {
+ return ENOTSUP;
}
- map_size = round_page(size);
- /*
- * Allow user to map in a zero length file.
- */
- if (size == 0) {
- (void)vnode_put(vp);
- err = KERN_SUCCESS;
- goto bad;
- }
- /*
- * Map in the file.
- */
- UBCINFOCHECK("map_fd_funneled", vp);
- pager = (void *) ubc_getpager(vp);
- if (pager == NULL) {
- (void)vnode_put(vp);
- err = KERN_FAILURE;
- goto bad;
+ ret = fill_procregioninfo_onlymappedvnodes( proc_task(p), user_addr, &pinfo, &vnodeaddr, &vid);
+ if (ret == 0 || !vnodeaddr) {
+ /* No really, this returns 0 if the memory address is not backed by a file */
+ return EINVAL;
}
+ vp = (vnode_t)vnodeaddr;
/*
 * The vnode is held (vnode_getwithvid / vnode_put) only long enough to
 * fetch its path; vpath stays allocated until after text_crypter_create().
 */
+ if ((vnode_getwithvid(vp, vid)) == 0) {
+ vpath = zalloc(ZV_NAMEI);
- my_map = current_map();
+ len = MAXPATHLEN;
+ ret = vn_getpath(vp, vpath, &len);
+ if (ret) {
+ zfree(ZV_NAMEI, vpath);
+ vnode_put(vp);
+ return ret;
+ }
- result = vm_map_64(
- my_map,
- &map_addr, map_size, (vm_offset_t)0,
- VM_FLAGS_ANYWHERE, pager, offset, TRUE,
- VM_PROT_DEFAULT, VM_PROT_ALL,
- VM_INHERIT_DEFAULT);
- if (result != KERN_SUCCESS) {
- (void)vnode_put(vp);
- err = result;
- goto bad;
+ vnode_put(vp);
+ } else {
+ return EINVAL;
}
+#if 0
+ kprintf("%s vpath %s cryptid 0x%08x cputype 0x%08x cpusubtype 0x%08x range 0x%016llx size 0x%016llx\n",
+ __FUNCTION__, vpath, cryptid, cputype, cpusubtype, (uint64_t)user_addr, (uint64_t)user_size);
+#endif
- if (!findspace) {
- vm_offset_t dst_addr;
- vm_map_copy_t tmp;
-
- if (copyin(CAST_USER_ADDR_T(va), &dst_addr, sizeof (dst_addr)) ||
- trunc_page_32(dst_addr) != dst_addr) {
- (void) vm_map_remove(
- my_map,
- map_addr, map_addr + map_size,
- VM_MAP_NO_FLAGS);
- (void)vnode_put(vp);
- err = KERN_INVALID_ADDRESS;
- goto bad;
- }
-
- result = vm_map_copyin(my_map, (vm_map_address_t)map_addr,
- (vm_map_size_t)map_size, TRUE, &tmp);
- if (result != KERN_SUCCESS) {
-
- (void) vm_map_remove(my_map, vm_map_trunc_page(map_addr),
- vm_map_round_page(map_addr + map_size),
- VM_MAP_NO_FLAGS);
- (void)vnode_put(vp);
- err = result;
- goto bad;
+ /* set up decrypter first */
+ crypt_file_data_t crypt_data = {
+ .filename = vpath,
+ .cputype = cputype,
+ .cpusubtype = cpusubtype
+ };
+ result = text_crypter_create(&crypt_info, cryptname, (void*)&crypt_data);
+#if VM_MAP_DEBUG_APPLE_PROTECT
+ if (vm_map_debug_apple_protect) {
+ printf("APPLE_PROTECT: %d[%s] map %p [0x%llx:0x%llx] %s(%s) -> 0x%x\n",
+ p->p_pid, p->p_comm,
+ user_map,
+ (uint64_t) user_addr,
+ (uint64_t) (user_addr + user_size),
+ __FUNCTION__, vpath, result);
+ }
+#endif /* VM_MAP_DEBUG_APPLE_PROTECT */
/* The path is no longer needed once the decrypter call has returned. */
+ zfree(ZV_NAMEI, vpath);
+
+ if (result) {
+ printf("%s: unable to create decrypter %s, kr=%d\n",
+ __FUNCTION__, cryptname, result);
+ if (result == kIOReturnNotPrivileged) {
+ /* text encryption returned decryption failure */
+ return EPERM;
+ } else {
+ return ENOMEM;
}
+ }
- result = vm_map_copy_overwrite(my_map,
- (vm_map_address_t)dst_addr, tmp, FALSE);
- if (result != KERN_SUCCESS) {
- vm_map_copy_discard(tmp);
- (void)vnode_put(vp);
- err = result;
- goto bad;
- }
- } else {
- if (copyout(&map_addr, CAST_USER_ADDR_T(va), sizeof (map_addr))) {
- (void) vm_map_remove(my_map, vm_map_trunc_page(map_addr),
- vm_map_round_page(map_addr + map_size),
- VM_MAP_NO_FLAGS);
- (void)vnode_put(vp);
- err = KERN_INVALID_ADDRESS;
- goto bad;
- }
+ /* now remap using the decrypter */
+ vm_object_offset_t crypto_backing_offset;
+ crypto_backing_offset = -1; /* i.e. use map entry's offset */
+ result = vm_map_apple_protected(user_map,
+ user_addr,
+ user_addr + user_size,
+ crypto_backing_offset,
+ &crypt_info,
+ cryptid);
+ if (result) {
+ printf("%s: mapping failed with %d\n", __FUNCTION__, result);
}
- ubc_setcred(vp, current_proc());
- (void)ubc_map(vp, (PROT_READ | PROT_WRITE | PROT_EXEC));
- (void)vnode_put(vp);
- err = 0;
-bad:
- fp_drop(p, fd, fp, 0);
- return (err);
/* Any remap failure is reported to the caller as EPERM. */
+ if (result) {
+ return EPERM;
+ }
+ return 0;
}
-
+#endif /* CONFIG_CODE_DECRYPTION */