X-Git-Url: https://git.saurik.com/apple/xnu.git/blobdiff_plain/765c9de3b4af7c2078d16a03812ae2c7c2b24938..4ba76501152d51ccb5647018f3192c6096367d48:/osfmk/vm/vm_map.c

diff --git a/osfmk/vm/vm_map.c b/osfmk/vm/vm_map.c
index f7c440eb6..305c8d677 100644
--- a/osfmk/vm/vm_map.c
+++ b/osfmk/vm/vm_map.c
@@ -1,49 +1,55 @@
 /*
- * Copyright (c) 2000 Apple Computer, Inc. All rights reserved.
- *
- * @APPLE_LICENSE_HEADER_START@
- * 
- * The contents of this file constitute Original Code as defined in and
- * are subject to the Apple Public Source License Version 1.1 (the
- * "License").  You may not use this file except in compliance with the
- * License.  Please obtain a copy of the License at
- * http://www.apple.com/publicsource and read it before using this file.
- * 
- * This Original Code and all software distributed under the License are
- * distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, EITHER
+ * Copyright (c) 2000-2019 Apple Inc. All rights reserved.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
+ *
+ * This file contains Original Code and/or Modifications of Original Code
+ * as defined in and that are subject to the Apple Public Source License
+ * Version 2.0 (the 'License'). You may not use this file except in
+ * compliance with the License. The rights granted to you under the License
+ * may not be used to create, or enable the creation or redistribution of,
+ * unlawful or unlicensed copies of an Apple operating system, or to
+ * circumvent, violate, or enable the circumvention or violation of, any
+ * terms of an Apple operating system software license agreement.
+ *
+ * Please obtain a copy of the License at
+ * http://www.opensource.apple.com/apsl/ and read it before using this file.
+ *
+ * The Original Code and all software distributed under the License are
+ * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT.  Please see the
- * License for the specific language governing rights and limitations
- * under the License.
- * 
- * @APPLE_LICENSE_HEADER_END@
+ * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
+ * Please see the License for the specific language governing rights and
+ * limitations under the License.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
  */
 /*
  * @OSF_COPYRIGHT@
  */
-/* 
+/*
  * Mach Operating System
  * Copyright (c) 1991,1990,1989,1988,1987 Carnegie Mellon University
  * All Rights Reserved.
- * 
+ *
  * Permission to use, copy, modify and distribute this software and its
  * documentation is hereby granted, provided that both the copyright
  * notice and this permission notice appear in all copies of the
  * software, derivative works or modified versions, and any portions
  * thereof, and that both notices appear in supporting documentation.
- * 
+ *
  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND FOR
  * ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
- * 
+ *
  * Carnegie Mellon requests users of this software to return to
- * 
+ *
  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
  *  School of Computer Science
  *  Carnegie Mellon University
  *  Pittsburgh PA 15213-3890
- * 
+ *
  * any improvements or extensions that they make and grant Carnegie Mellon
  * the rights to redistribute these changes.
  */
@@ -57,133 +63,282 @@
  *	Virtual memory mapping module.
  */
 
-#include <cpus.h>
 #include <task_swapper.h>
 #include <mach_assert.h>
 
+#include <vm/vm_options.h>
+
+#include <libkern/OSAtomic.h>
+
 #include <mach/kern_return.h>
 #include <mach/port.h>
 #include <mach/vm_attributes.h>
 #include <mach/vm_param.h>
 #include <mach/vm_behavior.h>
+#include <mach/vm_statistics.h>
+#include <mach/memory_object.h>
+#include <mach/mach_vm.h>
+#include <machine/cpu_capabilities.h>
+#include <mach/sdt.h>
+
 #include <kern/assert.h>
+#include <kern/backtrace.h>
 #include <kern/counters.h>
+#include <kern/exc_guard.h>
+#include <kern/kalloc.h>
 #include <kern/zalloc.h>
+
+#include <vm/cpm.h>
+#include <vm/vm_compressor.h>
+#include <vm/vm_compressor_pager.h>
 #include <vm/vm_init.h>
 #include <vm/vm_fault.h>
 #include <vm/vm_map.h>
 #include <vm/vm_object.h>
 #include <vm/vm_page.h>
+#include <vm/vm_pageout.h>
+#include <vm/pmap.h>
 #include <vm/vm_kern.h>
 #include <ipc/ipc_port.h>
 #include <kern/sched_prim.h>
 #include <kern/misc_protos.h>
+
 #include <mach/vm_map_server.h>
 #include <mach/mach_host_server.h>
-#include <ddb/tr.h>
-#include <kern/xpr.h>
-
+#include <vm/vm_protos.h>
+#include <vm/vm_purgeable_internal.h>
+
+#include <vm/vm_protos.h>
+#include <vm/vm_shared_region.h>
+#include <vm/vm_map_store.h>
+
+#include <san/kasan.h>
+
+#include <sys/codesign.h>
+#include <libkern/section_keywords.h>
+#if DEVELOPMENT || DEBUG
+extern int proc_selfcsflags(void);
+#if CONFIG_EMBEDDED
+extern int panic_on_unsigned_execute;
+#endif /* CONFIG_EMBEDDED */
+#endif /* DEVELOPMENT || DEBUG */
+
+#if __arm64__
+extern const int fourk_binary_compatibility_unsafe;
+extern const int fourk_binary_compatibility_allow_wx;
+#endif /* __arm64__ */
+extern int proc_selfpid(void);
+extern char *proc_name_address(void *p);
+
+#if VM_MAP_DEBUG_APPLE_PROTECT
+int vm_map_debug_apple_protect = 0;
+#endif /* VM_MAP_DEBUG_APPLE_PROTECT */
+#if VM_MAP_DEBUG_FOURK
+int vm_map_debug_fourk = 0;
+#endif /* VM_MAP_DEBUG_FOURK */
+
+SECURITY_READ_ONLY_LATE(int) vm_map_executable_immutable = 1;
+int vm_map_executable_immutable_verbose = 0;
+
+os_refgrp_decl(static, map_refgrp, "vm_map", NULL);
+
+extern u_int32_t random(void);  /* from <libkern/libkern.h> */
 /* Internal prototypes
  */
-extern boolean_t vm_map_range_check(
-				vm_map_t	map,
-				vm_offset_t	start,
-				vm_offset_t	end,
-				vm_map_entry_t	*entry);
-
-extern vm_map_entry_t	_vm_map_entry_create(
-				struct vm_map_header	*map_header);
-
-extern void		_vm_map_entry_dispose(
-				struct vm_map_header	*map_header,
-				vm_map_entry_t		entry);
-
-extern void		vm_map_pmap_enter(
-				vm_map_t		map,
-				vm_offset_t 		addr,
-				vm_offset_t		end_addr,
-				vm_object_t 		object,
-				vm_object_offset_t	offset,
-				vm_prot_t		protection);
-
-extern void		_vm_map_clip_end(
-				struct vm_map_header	*map_header,
-				vm_map_entry_t		entry,
-				vm_offset_t		end);
-
-extern void		vm_map_entry_delete(
-				vm_map_t	map,
-				vm_map_entry_t	entry);
-
-extern kern_return_t	vm_map_delete(
-				vm_map_t	map,
-				vm_offset_t	start,
-				vm_offset_t	end,
-				int		flags);
-
-extern void		vm_map_copy_steal_pages(
-				vm_map_copy_t	copy);
-
-extern kern_return_t	vm_map_copy_overwrite_unaligned(
-				vm_map_t	dst_map,
-				vm_map_entry_t	entry,
-				vm_map_copy_t	copy,
-				vm_offset_t	start);
-
-extern kern_return_t	vm_map_copy_overwrite_aligned(
-				vm_map_t	dst_map,
-				vm_map_entry_t	tmp_entry,
-				vm_map_copy_t	copy,
-				vm_offset_t	start,
-				pmap_t		pmap);
-
-extern kern_return_t	vm_map_copyin_kernel_buffer(
-				vm_map_t	src_map,
-				vm_offset_t	src_addr,
-				vm_size_t	len,
-				boolean_t	src_destroy,
-				vm_map_copy_t	*copy_result);  /* OUT */
-
-extern kern_return_t	vm_map_copyout_kernel_buffer(
-				vm_map_t	map,
-				vm_offset_t	*addr,	/* IN/OUT */
-				vm_map_copy_t	copy,
-				boolean_t	overwrite);
-
-extern void		vm_map_fork_share(
-				vm_map_t	old_map,
-				vm_map_entry_t	old_entry,
-				vm_map_t	new_map);
-
-extern boolean_t	vm_map_fork_copy(
-				vm_map_t	old_map,
-				vm_map_entry_t	*old_entry_p,
-				vm_map_t	new_map);
-
-extern kern_return_t	vm_remap_range_allocate(
-				vm_map_t	map,
-				vm_offset_t	*address,	/* IN/OUT */
-				vm_size_t	size,
-				vm_offset_t	mask,
-				boolean_t	anywhere,
-				vm_map_entry_t	*map_entry);	/* OUT */
-
-extern void		_vm_map_clip_start(
-				struct vm_map_header	*map_header,
-				vm_map_entry_t		entry,
-				vm_offset_t		start);
-
-void			vm_region_top_walk(
-        			vm_map_entry_t		   entry,
-				vm_region_top_info_t       top);
-
-void 			vm_region_walk(
-        			vm_map_entry_t		   entry,
-				vm_region_extended_info_t  extended,
-				vm_object_offset_t	   offset,
-				vm_offset_t		   range,
-				vm_map_t		   map,
-				vm_offset_t                va);
+
+static void vm_map_simplify_range(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);   /* forward */
+
+static boolean_t        vm_map_range_check(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	vm_map_entry_t  *entry);
+
+static vm_map_entry_t   _vm_map_entry_create(
+	struct vm_map_header    *map_header, boolean_t map_locked);
+
+static void             _vm_map_entry_dispose(
+	struct vm_map_header    *map_header,
+	vm_map_entry_t          entry);
+
+static void             vm_map_pmap_enter(
+	vm_map_t                map,
+	vm_map_offset_t         addr,
+	vm_map_offset_t         end_addr,
+	vm_object_t             object,
+	vm_object_offset_t      offset,
+	vm_prot_t               protection);
+
+static void             _vm_map_clip_end(
+	struct vm_map_header    *map_header,
+	vm_map_entry_t          entry,
+	vm_map_offset_t         end);
+
+static void             _vm_map_clip_start(
+	struct vm_map_header    *map_header,
+	vm_map_entry_t          entry,
+	vm_map_offset_t         start);
+
+static void             vm_map_entry_delete(
+	vm_map_t        map,
+	vm_map_entry_t  entry);
+
+static kern_return_t    vm_map_delete(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	int             flags,
+	vm_map_t        zap_map);
+
+static void             vm_map_copy_insert(
+	vm_map_t        map,
+	vm_map_entry_t  after_where,
+	vm_map_copy_t   copy);
+
+static kern_return_t    vm_map_copy_overwrite_unaligned(
+	vm_map_t        dst_map,
+	vm_map_entry_t  entry,
+	vm_map_copy_t   copy,
+	vm_map_address_t start,
+	boolean_t       discard_on_success);
+
+static kern_return_t    vm_map_copy_overwrite_aligned(
+	vm_map_t        dst_map,
+	vm_map_entry_t  tmp_entry,
+	vm_map_copy_t   copy,
+	vm_map_offset_t start,
+	pmap_t          pmap);
+
+static kern_return_t    vm_map_copyin_kernel_buffer(
+	vm_map_t        src_map,
+	vm_map_address_t src_addr,
+	vm_map_size_t   len,
+	boolean_t       src_destroy,
+	vm_map_copy_t   *copy_result);  /* OUT */
+
+static kern_return_t    vm_map_copyout_kernel_buffer(
+	vm_map_t        map,
+	vm_map_address_t *addr, /* IN/OUT */
+	vm_map_copy_t   copy,
+	vm_map_size_t   copy_size,
+	boolean_t       overwrite,
+	boolean_t       consume_on_success);
+
+static void             vm_map_fork_share(
+	vm_map_t        old_map,
+	vm_map_entry_t  old_entry,
+	vm_map_t        new_map);
+
+static boolean_t        vm_map_fork_copy(
+	vm_map_t        old_map,
+	vm_map_entry_t  *old_entry_p,
+	vm_map_t        new_map,
+	int             vm_map_copyin_flags);
+
+static kern_return_t    vm_map_wire_nested(
+	vm_map_t                   map,
+	vm_map_offset_t            start,
+	vm_map_offset_t            end,
+	vm_prot_t                  caller_prot,
+	vm_tag_t                   tag,
+	boolean_t                  user_wire,
+	pmap_t                     map_pmap,
+	vm_map_offset_t            pmap_addr,
+	ppnum_t                    *physpage_p);
+
+static kern_return_t    vm_map_unwire_nested(
+	vm_map_t                   map,
+	vm_map_offset_t            start,
+	vm_map_offset_t            end,
+	boolean_t                  user_wire,
+	pmap_t                     map_pmap,
+	vm_map_offset_t            pmap_addr);
+
+static kern_return_t    vm_map_overwrite_submap_recurse(
+	vm_map_t                   dst_map,
+	vm_map_offset_t            dst_addr,
+	vm_map_size_t              dst_size);
+
+static kern_return_t    vm_map_copy_overwrite_nested(
+	vm_map_t                   dst_map,
+	vm_map_offset_t            dst_addr,
+	vm_map_copy_t              copy,
+	boolean_t                  interruptible,
+	pmap_t                     pmap,
+	boolean_t                  discard_on_success);
+
+static kern_return_t    vm_map_remap_extract(
+	vm_map_t                map,
+	vm_map_offset_t         addr,
+	vm_map_size_t           size,
+	boolean_t               copy,
+	struct vm_map_header    *map_header,
+	vm_prot_t               *cur_protection,
+	vm_prot_t               *max_protection,
+	vm_inherit_t            inheritance,
+	boolean_t               pageable,
+	boolean_t               same_map,
+	vm_map_kernel_flags_t   vmk_flags);
+
+static kern_return_t    vm_map_remap_range_allocate(
+	vm_map_t                map,
+	vm_map_address_t        *address,
+	vm_map_size_t           size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	vm_map_entry_t          *map_entry);
+
+static void             vm_map_region_look_for_page(
+	vm_map_t                   map,
+	vm_map_offset_t            va,
+	vm_object_t                object,
+	vm_object_offset_t         offset,
+	int                        max_refcnt,
+	int                        depth,
+	vm_region_extended_info_t  extended,
+	mach_msg_type_number_t count);
+
+static int              vm_map_region_count_obj_refs(
+	vm_map_entry_t             entry,
+	vm_object_t                object);
+
+
+static kern_return_t    vm_map_willneed(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);
+
+static kern_return_t    vm_map_reuse_pages(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);
+
+static kern_return_t    vm_map_reusable_pages(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);
+
+static kern_return_t    vm_map_can_reuse(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);
+
+#if MACH_ASSERT
+static kern_return_t    vm_map_pageout(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);
+#endif /* MACH_ASSERT */
+
+static void             vm_map_corpse_footprint_destroy(
+	vm_map_t        map);
+
+pid_t find_largest_process_vm_map_entries(void);
 
 /*
  * Macros to copy a vm_map_entry. We must be careful to correctly
@@ -194,17 +349,165 @@ void 			vm_region_walk(
  * wire count; it's used for map splitting and zone changing in
  * vm_map_copyout.
  */
-#define vm_map_entry_copy(NEW,OLD) \
-MACRO_BEGIN                                     \
-                *(NEW) = *(OLD);                \
-                (NEW)->is_shared = FALSE;	\
-                (NEW)->needs_wakeup = FALSE;    \
-                (NEW)->in_transition = FALSE;   \
-                (NEW)->wired_count = 0;         \
-                (NEW)->user_wired_count = 0;    \
+
+#if CONFIG_EMBEDDED
+
+/*
+ * The "used_for_jit" flag was copied from OLD to NEW in vm_map_entry_copy().
+ * But for security reasons on embedded platforms, we don't want the
+ * new mapping to be "used for jit", so we always reset the flag here.
+ * Same for "pmap_cs_associated".
+ */
+#define VM_MAP_ENTRY_COPY_CODE_SIGNING(NEW, OLD)         \
+MACRO_BEGIN                                             \
+	(NEW)->used_for_jit = FALSE;                    \
+	(NEW)->pmap_cs_associated = FALSE;                              \
+MACRO_END
+
+#else /* CONFIG_EMBEDDED */
+
+/*
+ * The "used_for_jit" flag was copied from OLD to NEW in vm_map_entry_copy().
+ * On macOS, the new mapping can be "used for jit".
+ */
+#define VM_MAP_ENTRY_COPY_CODE_SIGNING(NEW, OLD)                         \
+MACRO_BEGIN                                                             \
+	assert((NEW)->used_for_jit == (OLD)->used_for_jit);             \
+	assert((NEW)->pmap_cs_associated == FALSE);                             \
+MACRO_END
+
+#endif /* CONFIG_EMBEDDED */
+
+#define vm_map_entry_copy(NEW, OLD)      \
+MACRO_BEGIN                             \
+boolean_t _vmec_reserved = (NEW)->from_reserved_zone;   \
+	*(NEW) = *(OLD);                \
+	(NEW)->is_shared = FALSE;       \
+	(NEW)->needs_wakeup = FALSE;    \
+	(NEW)->in_transition = FALSE;   \
+	(NEW)->wired_count = 0;         \
+	(NEW)->user_wired_count = 0;    \
+	(NEW)->permanent = FALSE;       \
+	VM_MAP_ENTRY_COPY_CODE_SIGNING((NEW),(OLD));    \
+	(NEW)->from_reserved_zone = _vmec_reserved;     \
+	if ((NEW)->iokit_acct) {                        \
+	     assertf(!(NEW)->use_pmap, "old %p new %p\n", (OLD), (NEW)); \
+	     (NEW)->iokit_acct = FALSE;                 \
+	     (NEW)->use_pmap = TRUE;                    \
+	}                                               \
+	(NEW)->vme_resilient_codesign = FALSE; \
+	(NEW)->vme_resilient_media = FALSE;     \
+	(NEW)->vme_atomic = FALSE;      \
+	(NEW)->vme_no_copy_on_read = FALSE;     \
 MACRO_END
 
-#define vm_map_entry_copy_full(NEW,OLD)        (*(NEW) = *(OLD))
+#define vm_map_entry_copy_full(NEW, OLD)                 \
+MACRO_BEGIN                                             \
+boolean_t _vmecf_reserved = (NEW)->from_reserved_zone;  \
+(*(NEW) = *(OLD));                                      \
+(NEW)->from_reserved_zone = _vmecf_reserved;                    \
+MACRO_END
+
+/*
+ * Normal lock_read_to_write() returns FALSE/0 on failure, whereas
+ * vm_map_lock_read_to_write() evaluates to zero on success and non-zero on failure.
+ */
+__attribute__((always_inline))
+int
+vm_map_lock_read_to_write(vm_map_t map)
+{
+	if (!lck_rw_lock_shared_to_exclusive(&map->lock)) {
+		return 1;       /* upgrade failed: report non-zero */
+	}
+	DTRACE_VM(vm_map_lock_upgrade); /* probe fires on successful upgrades only */
+	return 0;
+}
+
+__attribute__((always_inline))
+boolean_t
+vm_map_try_lock(vm_map_t map)
+{
+	if (!lck_rw_try_lock_exclusive(&map->lock)) {
+		return FALSE;   /* exclusive lock not acquired */
+	}
+	DTRACE_VM(vm_map_lock_w);       /* probe fires only once the lock is held */
+	return TRUE;
+}
+
+__attribute__((always_inline))
+boolean_t
+vm_map_try_lock_read(vm_map_t map)
+{
+	if (!lck_rw_try_lock_shared(&map->lock)) {
+		return FALSE;   /* shared lock not acquired */
+	}
+	DTRACE_VM(vm_map_lock_r);       /* probe fires only once the lock is held */
+	return TRUE;
+}
+
+/*
+ *	Decide if we want to allow processes to execute from their data or stack areas.
+ *	override_nx() returns true if we do.  Data/stack execution can be enabled independently
+ *	for 32 and 64 bit processes.  Set the VM_ABI_32 or VM_ABI_64 flags in allow_data_exec
+ *	or allow_stack_exec to enable data execution for that type of data area for that particular
+ *	ABI (or both by or'ing the flags together).  These are initialized in the architecture
+ *	specific pmap files since the default behavior varies according to architecture.  The
+ *	main reason it varies is because of the need to provide binary compatibility with old
+ *	applications that were written before these restrictions came into being.  In the old
+ *	days, an app could execute anything it could read, but this has slowly been tightened
+ *	up over time.  The default behavior is:
+ *
+ *	32-bit PPC apps		may execute from both stack and data areas
+ *	32-bit Intel apps	may execute from data areas but not stack
+ *	64-bit PPC/Intel apps	may not execute from either data or stack
+ *
+ *	An application on any architecture may override these defaults by explicitly
+ *	adding PROT_EXEC permission to the page in question with the mprotect(2)
+ *	system call.  This code here just determines what happens when an app tries to
+ *      execute from a page that lacks execute permission.
+ *
+ *	Note that allow_data_exec or allow_stack_exec may also be modified by sysctl to change the
+ *	default behavior for both 32 and 64 bit apps on a system-wide basis. Furthermore,
+ *	a Mach-O header flag bit (MH_NO_HEAP_EXECUTION) can be used to forcibly disallow
+ *	execution from data areas for a particular binary even if the arch normally permits it. As
+ *	a final wrinkle, a posix_spawn attribute flag can be used to negate this opt-in header bit
+ *	to support some complicated use cases, notably browsers with out-of-process plugins that
+ *	are not all NX-safe.
+ */
+
+extern int allow_data_exec, allow_stack_exec;
+
+int
+override_nx(vm_map_t map, uint32_t user_tag) /* map unused on arm */
+{
+	int abi_bit;
+
+	/* Maps backed by the kernel pmap never get an NX override. */
+	if (map->pmap == kernel_pmap) {
+		return FALSE;
+	}
+
+	/*
+	 * Pick the ABI flag matching this map: 64-bit or 32-bit.
+	 */
+	abi_bit = vm_map_is_64bit(map) ? VM_ABI_64 : VM_ABI_32;
+
+	/*
+	 * Stack regions are governed by allow_stack_exec; the masked value
+	 * itself is returned here, not a normalized boolean.
+	 */
+	if (user_tag == VM_MEMORY_STACK) {
+		return allow_stack_exec & abi_bit;
+	}
+
+	/*
+	 * Any other tag is treated as data: the ABI must be enabled in
+	 * allow_data_exec and the map must not have data execution disallowed.
+	 */
+	return (allow_data_exec & abi_bit) &&
+	       (map->map_disallow_data_exec == FALSE);
+}
+
 
 /*
  *	Virtual memory maps provide for the mapping, protection,
@@ -223,7 +526,7 @@ MACRO_END
  *	the asymmetric (delayed) strategy is used for shared temporary
  *	objects instead of the symmetric (shadow) strategy.  All maps
  *	are now "top level" maps (either task map, kernel map or submap
- *	of the kernel map).  
+ *	of the kernel map).
  *
  *	Since portions of maps are specified by start/end addreses,
  *	which may not align with existing map entries, all
@@ -249,10 +552,11 @@ MACRO_END
  *	vm_object_copy_strategically() in vm_object.c.
  */
 
-zone_t		vm_map_zone;		/* zone for vm_map structures */
-zone_t		vm_map_entry_zone;	/* zone for vm_map_entry structures */
-zone_t		vm_map_kentry_zone;	/* zone for kernel entry structures */
-zone_t		vm_map_copy_zone;	/* zone for vm_map_copy structures */
+static zone_t   vm_map_zone;                            /* zone for vm_map structures */
+zone_t                  vm_map_entry_zone;                      /* zone for vm_map_entry structures */
+static zone_t   vm_map_entry_reserved_zone;     /* zone with reserve for non-blocking allocations */
+static zone_t   vm_map_copy_zone;                       /* zone for vm_map_copy structures */
+zone_t                  vm_map_holes_zone;                      /* zone for vm map holes (vm_map_links) structures */
 
 
 /*
@@ -261,7 +565,311 @@ zone_t		vm_map_copy_zone;	/* zone for vm_map_copy structures */
  *	vm_map_submap creates the submap.
  */
 
-vm_object_t	vm_submap_object;
+vm_object_t     vm_submap_object;
+
+static void             *map_data;
+static vm_size_t        map_data_size;
+static void             *kentry_data;
+static vm_size_t        kentry_data_size;
+static void             *map_holes_data;
+static vm_size_t        map_holes_data_size;
+
+#if CONFIG_EMBEDDED
+#define         NO_COALESCE_LIMIT  0
+#else
+#define         NO_COALESCE_LIMIT  ((1024 * 128) - 1)
+#endif
+
+/* Skip acquiring locks if we're in the midst of a kernel core dump */
+unsigned int not_in_kdp = 1;
+
+unsigned int vm_map_set_cache_attr_count = 0;
+
+kern_return_t
+vm_map_set_cache_attr(
+	vm_map_t        map,
+	vm_map_offset_t va)
+{
+	vm_map_entry_t  entry;
+	vm_object_t     backing_object;
+	kern_return_t   result = KERN_INVALID_ARGUMENT;
+
+	/* The map stays read-locked across the lookup and the object update. */
+	vm_map_lock_read(map);
+
+	/*
+	 * "va" must fall in a regular (non-submap) entry:
+	 * otherwise that memory is not properly mapped
+	 */
+	if (vm_map_lookup_entry(map, va, &entry) && !entry->is_sub_map) {
+		backing_object = VME_OBJECT(entry);
+
+		/*
+		 * there should be a VM object here at this point;
+		 * if there is none, fail with KERN_INVALID_ARGUMENT
+		 */
+		if (backing_object != VM_OBJECT_NULL) {
+			vm_object_lock(backing_object);
+			backing_object->set_cache_attr = TRUE;
+			vm_object_unlock(backing_object);
+
+			/* plain increment: count of successful calls */
+			vm_map_set_cache_attr_count++;
+			result = KERN_SUCCESS;
+		}
+	}
+
+	vm_map_unlock_read(map);
+
+	return result;
+}
+
+
+#if CONFIG_CODE_DECRYPTION
+/*
+ * vm_map_apple_protected:
+ * This remaps the requested part of the object with an object backed by
+ * the decrypting pager.
+ * crypt_info contains entry points and session data for the crypt module.
+ * The crypt_info block will be copied by vm_map_apple_protected. The data structures
+ * referenced in crypt_info must remain valid until crypt_info->crypt_end() is called.
+ *
+ * [start, end) is the range to cover; it is widened to page boundaries, and each
+ * map entry found there must be a non-submap, object-backed, executable mapping.
+ * crypto_backing_offset of (vm_object_offset_t)-1 means "use the first entry's offset".
+ * Returns KERN_SUCCESS, KERN_INVALID_ARGUMENT (range not suitably mapped),
+ * KERN_INVALID_ADDRESS (an entry begins or ends between a requested bound and
+ * its page-aligned counterpart) or KERN_FAILURE (no pager could be set up).
+ */
+kern_return_t
+vm_map_apple_protected(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_object_offset_t      crypto_backing_offset,
+	struct pager_crypt_info *crypt_info)
+{
+	boolean_t       map_locked;
+	kern_return_t   kr;
+	vm_map_entry_t  map_entry;
+	struct vm_map_entry tmp_entry;
+	memory_object_t unprotected_mem_obj;
+	vm_object_t     protected_object;
+	vm_map_offset_t map_addr;
+	vm_map_offset_t start_aligned, end_aligned;
+	vm_object_offset_t      crypto_start, crypto_end;
+	int             vm_flags;
+	vm_map_kernel_flags_t vmk_flags;
+
+	vm_flags = 0;
+	vmk_flags = VM_MAP_KERNEL_FLAGS_NONE;
+
+	map_locked = FALSE;
+	unprotected_mem_obj = MEMORY_OBJECT_NULL;
+
+	start_aligned = vm_map_trunc_page(start, PAGE_MASK_64);
+	end_aligned = vm_map_round_page(end, PAGE_MASK_64);
+	start_aligned = vm_map_trunc_page(start_aligned, VM_MAP_PAGE_MASK(map));
+	end_aligned = vm_map_round_page(end_aligned, VM_MAP_PAGE_MASK(map));
+
+#if __arm64__
+	/*
+	 * "start" and "end" might be 4K-aligned but not 16K-aligned,
+	 * so we might have to loop and establish up to 3 mappings:
+	 *
+	 * + the first 16K-page, which might overlap with the previous
+	 *   4K-aligned mapping,
+	 * + the center,
+	 * + the last 16K-page, which might overlap with the next
+	 *   4K-aligned mapping.
+	 * Each of these mappings might be backed by a vnode pager (if
+	 * properly page-aligned) or a "fourk_pager", itself backed by a
+	 * vnode pager (if 4K-aligned but not page-aligned).
+	 */
+#endif /* __arm64__ */
+
+	for (map_addr = start_aligned;
+	    map_addr < end;
+	    map_addr = tmp_entry.vme_end) {
+		vm_map_lock(map);
+		map_locked = TRUE;
+
+		/* lookup the protected VM object */
+		if (!vm_map_lookup_entry(map, map_addr, &map_entry) ||
+		    map_entry->is_sub_map ||
+		    VME_OBJECT(map_entry) == VM_OBJECT_NULL ||
+		    !(map_entry->protection & VM_PROT_EXECUTE)) {
+			/* that memory is not properly mapped */
+			kr = KERN_INVALID_ARGUMENT;
+			goto done;
+		}
+
+		/* get the protected object to be decrypted (non-NULL, checked above) */
+		protected_object = VME_OBJECT(map_entry);
+		/* ensure protected object stays alive while map is unlocked */
+		vm_object_reference(protected_object);
+
+		/* limit the map entry to the area we want to cover */
+		vm_map_clip_start(map, map_entry, start_aligned);
+		vm_map_clip_end(map, map_entry, end_aligned);
+
+		tmp_entry = *map_entry;
+		map_entry = VM_MAP_ENTRY_NULL; /* not valid after unlocking map */
+		vm_map_unlock(map);
+		map_locked = FALSE;
+
+		/*
+		 * This map entry might be only partially encrypted (if not fully
+		 * "page-aligned").  An entry reaching below "start" or above "end"
+		 * must begin/end exactly on the aligned bound, or the call fails.
+		 */
+		crypto_start = 0;
+		crypto_end = tmp_entry.vme_end - tmp_entry.vme_start;
+		if (tmp_entry.vme_start < start) {
+			if (tmp_entry.vme_start != start_aligned) {
+				kr = KERN_INVALID_ADDRESS;
+				vm_object_deallocate(protected_object);
+				goto done;
+			}
+			crypto_start += (start - tmp_entry.vme_start);
+		}
+		if (tmp_entry.vme_end > end) {
+			if (tmp_entry.vme_end != end_aligned) {
+				kr = KERN_INVALID_ADDRESS;
+				vm_object_deallocate(protected_object);
+				goto done;
+			}
+			crypto_end -= (tmp_entry.vme_end - end);
+		}
+
+		/*
+		 * This "extra backing offset" is needed to get the decryption
+		 * routine to use the right key.  It adjusts for the possibly
+		 * relative offset of an interposed "4K" pager...
+		 */
+		if (crypto_backing_offset == (vm_object_offset_t) -1) {
+			crypto_backing_offset = VME_OFFSET(&tmp_entry);
+		}
+
+		/*
+		 * Lookup (and create if necessary) the protected memory object
+		 * matching that VM object.
+		 * If successful, this also grabs a reference on the memory object,
+		 * to guarantee that it doesn't go away before we get a chance to map it.
+		 */
+		unprotected_mem_obj = apple_protect_pager_setup(
+			protected_object,
+			VME_OFFSET(&tmp_entry),
+			crypto_backing_offset,
+			crypt_info,
+			crypto_start,
+			crypto_end);
+
+		/* release extra ref on protected object */
+		vm_object_deallocate(protected_object);
+
+		if (unprotected_mem_obj == NULL) {
+			kr = KERN_FAILURE;
+			goto done;
+		}
+
+		vm_flags = VM_FLAGS_FIXED | VM_FLAGS_OVERWRITE;
+		/* can overwrite an immutable mapping */
+		vmk_flags.vmkf_overwrite_immutable = TRUE;
+#if __arm64__
+		if (tmp_entry.used_for_jit &&
+		    (VM_MAP_PAGE_SHIFT(map) != FOURK_PAGE_SHIFT ||
+		    PAGE_SHIFT != FOURK_PAGE_SHIFT) &&
+		    fourk_binary_compatibility_unsafe &&
+		    fourk_binary_compatibility_allow_wx) {
+			printf("** FOURK_COMPAT [%d]: "
+			    "allowing write+execute at 0x%llx\n",
+			    proc_selfpid(), tmp_entry.vme_start);
+			vmk_flags.vmkf_map_jit = TRUE;
+		}
+#endif /* __arm64__ */
+
+		/* map this memory object in place of the current one */
+		map_addr = tmp_entry.vme_start;
+		kr = vm_map_enter_mem_object(map,
+		    &map_addr,
+		    (tmp_entry.vme_end - tmp_entry.vme_start),
+		    (mach_vm_offset_t) 0,
+		    vm_flags,
+		    vmk_flags,
+		    VM_KERN_MEMORY_NONE,
+		    (ipc_port_t)(uintptr_t) unprotected_mem_obj,
+		    0,
+		    TRUE,
+		    tmp_entry.protection,
+		    tmp_entry.max_protection,
+		    tmp_entry.inheritance);
+		/* NOTE(review): a failure here is only asserted on; kr is reset to KERN_SUCCESS after the loop */
+		assertf(kr == KERN_SUCCESS, "kr = 0x%x\n", kr);
+		assertf(map_addr == tmp_entry.vme_start,
+		    "map_addr=0x%llx vme_start=0x%llx tmp_entry=%p\n",
+		    (uint64_t)map_addr,
+		    (uint64_t) tmp_entry.vme_start,
+		    &tmp_entry);
+
+#if VM_MAP_DEBUG_APPLE_PROTECT
+		if (vm_map_debug_apple_protect) {
+			printf("APPLE_PROTECT: map %p [0x%llx:0x%llx] pager %p:"
+			    " backing:[object:%p,offset:0x%llx,"
+			    "crypto_backing_offset:0x%llx,"
+			    "crypto_start:0x%llx,crypto_end:0x%llx]\n",
+			    map,
+			    (uint64_t) map_addr,
+			    (uint64_t) (map_addr + (tmp_entry.vme_end -
+			    tmp_entry.vme_start)),
+			    unprotected_mem_obj,
+			    protected_object,
+			    VME_OFFSET(&tmp_entry),
+			    crypto_backing_offset,
+			    crypto_start,
+			    crypto_end);
+		}
+#endif /* VM_MAP_DEBUG_APPLE_PROTECT */
+
+		/*
+		 * Release the reference obtained by apple_protect_pager_setup().
+		 * The mapping (if it succeeded) is now holding a reference on
+		 * the memory object.
+		 */
+		memory_object_deallocate(unprotected_mem_obj);
+		unprotected_mem_obj = MEMORY_OBJECT_NULL;
+
+		/* continue with next map entry */
+		crypto_backing_offset += (tmp_entry.vme_end - tmp_entry.vme_start);
+		crypto_backing_offset -= crypto_start;
+	}
+	kr = KERN_SUCCESS;
+
+done:
+	if (map_locked) {
+		vm_map_unlock(map);
+	}
+	return kr;
+}
+#endif  /* CONFIG_CODE_DECRYPTION */
+
+
+lck_grp_t               vm_map_lck_grp;
+lck_grp_attr_t  vm_map_lck_grp_attr;
+lck_attr_t              vm_map_lck_attr;
+lck_attr_t              vm_map_lck_rw_attr;
+
+#if CONFIG_EMBEDDED
+int malloc_no_cow = 1;
+#define VM_PROTECT_WX_FAIL 0
+#else /* CONFIG_EMBEDDED */
+int malloc_no_cow = 0;
+#define VM_PROTECT_WX_FAIL 1
+#endif /* CONFIG_EMBEDDED */
+uint64_t vm_memory_malloc_no_cow_mask = 0ULL;
+#if DEBUG
+int vm_check_map_sanity = 0;
+#endif
 
 /*
  *	vm_map_init:
@@ -276,7 +884,7 @@ vm_object_t	vm_submap_object;
  *
  *	vm_map_zone:		used to allocate maps.
  *	vm_map_entry_zone:	used to allocate map entries.
- *	vm_map_kentry_zone:	used to allocate map entries for the kernel.
+ *	vm_map_entry_reserved_zone:	fallback zone for kernel map entries
  *
  *	The kernel allocates map entries from a special zone that is initially
  *	"crammed" with memory.  It would be difficult (perhaps impossible) for
@@ -284,72 +892,229 @@ vm_object_t	vm_submap_object;
  *	empty since the very act of allocating memory implies the creation
  *	of a new entry.
  */
-
-vm_offset_t	map_data;
-vm_size_t	map_data_size;
-vm_offset_t	kentry_data;
-vm_size_t	kentry_data_size;
-int		kentry_count = 2048;		/* to init kentry_data_size */
-
-#define         NO_COALESCE_LIMIT  (1024 * 128)
-
-/*
- *	Threshold for aggressive (eager) page map entering for vm copyout
- *	operations.  Any copyout larger will NOT be aggressively entered.
- */
-vm_size_t vm_map_aggressive_enter_max;		/* set by bootstrap */
-
 void
 vm_map_init(
 	void)
 {
-	vm_map_zone = zinit((vm_size_t) sizeof(struct vm_map), 40*1024,
-					PAGE_SIZE, "maps");
+	vm_size_t entry_zone_alloc_size;
+	const char *mez_name = "VM map entries";
+
+	vm_map_zone = zinit((vm_map_size_t) sizeof(struct _vm_map), 40 * 1024,
+	    PAGE_SIZE, "maps");
+	zone_change(vm_map_zone, Z_NOENCRYPT, TRUE);
+#if     defined(__LP64__)
+	entry_zone_alloc_size = PAGE_SIZE * 5;
+#else
+	entry_zone_alloc_size = PAGE_SIZE * 6;
+#endif
+	vm_map_entry_zone = zinit((vm_map_size_t) sizeof(struct vm_map_entry),
+	    1024 * 1024, entry_zone_alloc_size,
+	    mez_name);
+	zone_change(vm_map_entry_zone, Z_NOENCRYPT, TRUE);
+	zone_change(vm_map_entry_zone, Z_NOCALLOUT, TRUE);
+	zone_change(vm_map_entry_zone, Z_GZALLOC_EXEMPT, TRUE);
+
+	vm_map_entry_reserved_zone = zinit((vm_map_size_t) sizeof(struct vm_map_entry),
+	    kentry_data_size * 64, kentry_data_size,
+	    "Reserved VM map entries");
+	zone_change(vm_map_entry_reserved_zone, Z_NOENCRYPT, TRUE);
+	/* Don't quarantine because we always need elements available */
+	zone_change(vm_map_entry_reserved_zone, Z_KASAN_QUARANTINE, FALSE);
+
+	vm_map_copy_zone = zinit((vm_map_size_t) sizeof(struct vm_map_copy),
+	    16 * 1024, PAGE_SIZE, "VM map copies");
+	zone_change(vm_map_copy_zone, Z_NOENCRYPT, TRUE);
+
+	vm_map_holes_zone = zinit((vm_map_size_t) sizeof(struct vm_map_links),
+	    16 * 1024, PAGE_SIZE, "VM map holes");
+	zone_change(vm_map_holes_zone, Z_NOENCRYPT, TRUE);
 
-	vm_map_entry_zone = zinit((vm_size_t) sizeof(struct vm_map_entry),
-					1024*1024, PAGE_SIZE*5,
-					"non-kernel map entries");
+	/*
+	 *	Cram the map and kentry zones with initial data.
+	 *	Set reserved_zone non-collectible to aid zone_gc().
+	 */
+	zone_change(vm_map_zone, Z_COLLECT, FALSE);
+	zone_change(vm_map_zone, Z_FOREIGN, TRUE);
+	zone_change(vm_map_zone, Z_GZALLOC_EXEMPT, TRUE);
+
+	zone_change(vm_map_entry_reserved_zone, Z_COLLECT, FALSE);
+	zone_change(vm_map_entry_reserved_zone, Z_EXPAND, FALSE);
+	zone_change(vm_map_entry_reserved_zone, Z_FOREIGN, TRUE);
+	zone_change(vm_map_entry_reserved_zone, Z_NOCALLOUT, TRUE);
+	zone_change(vm_map_entry_reserved_zone, Z_CALLERACCT, FALSE); /* don't charge caller */
+	zone_change(vm_map_copy_zone, Z_CALLERACCT, FALSE); /* don't charge caller */
+	zone_change(vm_map_entry_reserved_zone, Z_GZALLOC_EXEMPT, TRUE);
+
+	zone_change(vm_map_holes_zone, Z_COLLECT, TRUE);
+	zone_change(vm_map_holes_zone, Z_EXPAND, TRUE);
+	zone_change(vm_map_holes_zone, Z_FOREIGN, TRUE);
+	zone_change(vm_map_holes_zone, Z_NOCALLOUT, TRUE);
+	zone_change(vm_map_holes_zone, Z_CALLERACCT, TRUE);
+	zone_change(vm_map_holes_zone, Z_GZALLOC_EXEMPT, TRUE);
 
-	vm_map_kentry_zone = zinit((vm_size_t) sizeof(struct vm_map_entry),
-					kentry_data_size, kentry_data_size,
-					"kernel map entries");
+	/*
+	 * Add the stolen memory to zones, adjust zone size and stolen counts.
+	 * zcram only up to the maximum number of pages for each zone chunk.
+	 */
+	zcram(vm_map_zone, (vm_offset_t)map_data, map_data_size);
 
-	vm_map_copy_zone = zinit((vm_size_t) sizeof(struct vm_map_copy),
-					16*1024, PAGE_SIZE, "map copies");
+	const vm_size_t stride = ZONE_CHUNK_MAXPAGES * PAGE_SIZE;
+	for (vm_offset_t off = 0; off < kentry_data_size; off += stride) {
+		zcram(vm_map_entry_reserved_zone,
+		    (vm_offset_t)kentry_data + off,
+		    MIN(kentry_data_size - off, stride));
+	}
+	for (vm_offset_t off = 0; off < map_holes_data_size; off += stride) {
+		zcram(vm_map_holes_zone,
+		    (vm_offset_t)map_holes_data + off,
+		    MIN(map_holes_data_size - off, stride));
+	}
 
 	/*
-	 *	Cram the map and kentry zones with initial data.
-	 *	Set kentry_zone non-collectible to aid zone_gc().
+	 * Since these are covered by zones, remove them from stolen page accounting.
 	 */
-	zone_change(vm_map_zone, Z_COLLECT, FALSE);
-	zone_change(vm_map_kentry_zone, Z_COLLECT, FALSE);
-	zone_change(vm_map_kentry_zone, Z_EXPAND, FALSE);
-	zcram(vm_map_zone, map_data, map_data_size);
-	zcram(vm_map_kentry_zone, kentry_data, kentry_data_size);
+	VM_PAGE_MOVE_STOLEN(atop_64(map_data_size) + atop_64(kentry_data_size) + atop_64(map_holes_data_size));
+
+	lck_grp_attr_setdefault(&vm_map_lck_grp_attr);
+	lck_grp_init(&vm_map_lck_grp, "vm_map", &vm_map_lck_grp_attr);
+	lck_attr_setdefault(&vm_map_lck_attr);
+
+	lck_attr_setdefault(&vm_map_lck_rw_attr);
+	lck_attr_cleardebug(&vm_map_lck_rw_attr);
+
+#if VM_MAP_DEBUG_APPLE_PROTECT
+	PE_parse_boot_argn("vm_map_debug_apple_protect",
+	    &vm_map_debug_apple_protect,
+	    sizeof(vm_map_debug_apple_protect));
+#endif /* VM_MAP_DEBUG_APPLE_PROTECT */
+#if VM_MAP_DEBUG_FOURK
+	PE_parse_boot_argn("vm_map_debug_fourk",
+	    &vm_map_debug_fourk,
+	    sizeof(vm_map_debug_fourk));
+#endif /* VM_MAP_DEBUG_FOURK */
+	PE_parse_boot_argn("vm_map_executable_immutable",
+	    &vm_map_executable_immutable,
+	    sizeof(vm_map_executable_immutable));
+	PE_parse_boot_argn("vm_map_executable_immutable_verbose",
+	    &vm_map_executable_immutable_verbose,
+	    sizeof(vm_map_executable_immutable_verbose));
+
+	PE_parse_boot_argn("malloc_no_cow",
+	    &malloc_no_cow,
+	    sizeof(malloc_no_cow));
+	if (malloc_no_cow) {
+		vm_memory_malloc_no_cow_mask = 0ULL;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_SMALL;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_MEDIUM;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_LARGE;
+//		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_HUGE;
+//		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_REALLOC;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_TINY;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_LARGE_REUSABLE;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_LARGE_REUSED;
+		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_MALLOC_NANO;
+//		vm_memory_malloc_no_cow_mask |= 1ULL << VM_MEMORY_TCMALLOC;
+		PE_parse_boot_argn("vm_memory_malloc_no_cow_mask",
+		    &vm_memory_malloc_no_cow_mask,
+		    sizeof(vm_memory_malloc_no_cow_mask));
+	}
+
+#if DEBUG
+	PE_parse_boot_argn("vm_check_map_sanity", &vm_check_map_sanity, sizeof(vm_check_map_sanity));
+	if (vm_check_map_sanity) {
+		kprintf("VM sanity checking enabled\n");
+	} else {
+		kprintf("VM sanity checking disabled. Set bootarg vm_check_map_sanity=1 to enable\n");
+	}
+#endif /* DEBUG */
 }
 
 void
 vm_map_steal_memory(
 	void)
 {
-	map_data_size = round_page(10 * sizeof(struct vm_map));
+	uint32_t kentry_initial_pages;
+
+	map_data_size = round_page(10 * sizeof(struct _vm_map));
 	map_data = pmap_steal_memory(map_data_size);
 
-#if 0
 	/*
-	 * Limiting worst case: vm_map_kentry_zone needs to map each "available"
-	 * physical page (i.e. that beyond the kernel image and page tables)
-	 * individually; we guess at most one entry per eight pages in the
-	 * real world. This works out to roughly .1 of 1% of physical memory,
-	 * or roughly 1900 entries (64K) for a 64M machine with 4K pages.
+	 * kentry_initial_pages corresponds to the number of kernel map entries
+	 * required during bootstrap until the asynchronous replenishment
+	 * scheme is activated and/or entries are available from the general
+	 * map entry pool.
 	 */
+#if     defined(__LP64__)
+	kentry_initial_pages = 10;
+#else
+	kentry_initial_pages = 6;
 #endif
-	kentry_count = pmap_free_pages() / 8;
 
+#if CONFIG_GZALLOC
+	/* If using the guard allocator, reserve more memory for the kernel
+	 * reserved map entry pool.
+	 */
+	if (gzalloc_enabled()) {
+		kentry_initial_pages *= 1024;
+	}
+#endif
 
-	kentry_data_size =
-		round_page(kentry_count * sizeof(struct vm_map_entry));
+	kentry_data_size = kentry_initial_pages * PAGE_SIZE;
 	kentry_data = pmap_steal_memory(kentry_data_size);
+
+	map_holes_data_size = kentry_data_size;
+	map_holes_data = pmap_steal_memory(map_holes_data_size);
+}
+
+boolean_t vm_map_supports_hole_optimization = FALSE;
+
+void
+vm_kernel_reserved_entry_init(void)
+{
+	zone_prio_refill_configure(vm_map_entry_reserved_zone, (6 * PAGE_SIZE) / sizeof(struct vm_map_entry));
+
+	/*
+	 * Once we have our replenish thread set up, we can start using the vm_map_holes zone.
+	 */
+	zone_prio_refill_configure(vm_map_holes_zone, (6 * PAGE_SIZE) / sizeof(struct vm_map_links));
+	vm_map_supports_hole_optimization = TRUE;
+}
+
+void
+vm_map_disable_hole_optimization(vm_map_t map)
+{
+	vm_map_entry_t  head_entry, hole_entry, next_hole_entry;
+
+	if (map->holelistenabled) {
+		head_entry = hole_entry = CAST_TO_VM_MAP_ENTRY(map->holes_list);
+
+		while (hole_entry != NULL) {
+			next_hole_entry = hole_entry->vme_next;
+
+			hole_entry->vme_next = NULL;
+			hole_entry->vme_prev = NULL;
+			zfree(vm_map_holes_zone, hole_entry);
+
+			if (next_hole_entry == head_entry) {
+				hole_entry = NULL;
+			} else {
+				hole_entry = next_hole_entry;
+			}
+		}
+
+		map->holes_list = NULL;
+		map->holelistenabled = FALSE;
+
+		map->first_free = vm_map_first_entry(map);
+		SAVE_HINT_HOLE_WRITE(map, NULL);
+	}
+}
+
+boolean_t
+vm_kernel_map_is_kernel(vm_map_t map)
+{
+	return map->pmap == kernel_pmap;
 }
 
 /*
@@ -359,42 +1124,112 @@ vm_map_steal_memory(
  *	the given physical map structure, and having
  *	the given lower and upper address bounds.
  */
+
 vm_map_t
 vm_map_create(
-	pmap_t		pmap,
-	vm_offset_t	min,
-	vm_offset_t	max,
-	boolean_t	pageable)
+	pmap_t          pmap,
+	vm_map_offset_t min,
+	vm_map_offset_t max,
+	boolean_t       pageable)
+{
+	int options;
+
+	options = 0;
+	if (pageable) {
+		options |= VM_MAP_CREATE_PAGEABLE;
+	}
+	return vm_map_create_options(pmap, min, max, options);
+}
+
+vm_map_t
+vm_map_create_options(
+	pmap_t          pmap,
+	vm_map_offset_t min,
+	vm_map_offset_t max,
+	int             options)
 {
-	register vm_map_t	result;
+	vm_map_t        result;
+	struct vm_map_links     *hole_entry = NULL;
+
+	if (options & ~(VM_MAP_CREATE_ALL_OPTIONS)) {
+		/* unknown option */
+		return VM_MAP_NULL;
+	}
 
 	result = (vm_map_t) zalloc(vm_map_zone);
-	if (result == VM_MAP_NULL)
+	if (result == VM_MAP_NULL) {
 		panic("vm_map_create");
+	}
 
 	vm_map_first_entry(result) = vm_map_to_entry(result);
 	vm_map_last_entry(result)  = vm_map_to_entry(result);
 	result->hdr.nentries = 0;
-	result->hdr.entries_pageable = pageable;
+	if (options & VM_MAP_CREATE_PAGEABLE) {
+		result->hdr.entries_pageable = TRUE;
+	} else {
+		result->hdr.entries_pageable = FALSE;
+	}
+
+	vm_map_store_init( &(result->hdr));
+
+	result->hdr.page_shift = PAGE_SHIFT;
 
 	result->size = 0;
-	result->ref_count = 1;
-#if	TASK_SWAPPER
+	result->user_wire_limit = MACH_VM_MAX_ADDRESS;  /* default limit is unlimited */
+	result->user_wire_size  = 0;
+#if !CONFIG_EMBEDDED
+	result->vmmap_high_start = 0;
+#endif
+	os_ref_init_count(&result->map_refcnt, &map_refgrp, 1);
+#if     TASK_SWAPPER
 	result->res_count = 1;
 	result->sw_state = MAP_SW_IN;
-#endif	/* TASK_SWAPPER */
+#endif  /* TASK_SWAPPER */
 	result->pmap = pmap;
 	result->min_offset = min;
 	result->max_offset = max;
 	result->wiring_required = FALSE;
 	result->no_zero_fill = FALSE;
+	result->mapped_in_other_pmaps = FALSE;
 	result->wait_for_space = FALSE;
+	result->switch_protect = FALSE;
+	result->disable_vmentry_reuse = FALSE;
+	result->map_disallow_data_exec = FALSE;
+	result->is_nested_map = FALSE;
+	result->map_disallow_new_exec = FALSE;
+	result->highest_entry_end = 0;
 	result->first_free = vm_map_to_entry(result);
 	result->hint = vm_map_to_entry(result);
+	result->jit_entry_exists = FALSE;
+
+	/* "has_corpse_footprint" and "holelistenabled" are mutually exclusive */
+	if (options & VM_MAP_CREATE_CORPSE_FOOTPRINT) {
+		result->has_corpse_footprint = TRUE;
+		result->holelistenabled = FALSE;
+		result->vmmap_corpse_footprint = NULL;
+	} else {
+		result->has_corpse_footprint = FALSE;
+		if (vm_map_supports_hole_optimization) {
+			hole_entry = zalloc(vm_map_holes_zone);
+
+			hole_entry->start = min;
+#if defined(__arm__) || defined(__arm64__)
+			hole_entry->end = result->max_offset;
+#else
+			hole_entry->end = (max > (vm_map_offset_t)MACH_VM_MAX_ADDRESS) ? max : (vm_map_offset_t)MACH_VM_MAX_ADDRESS;
+#endif
+			result->holes_list = result->hole_hint = hole_entry;
+			hole_entry->prev = hole_entry->next = CAST_TO_VM_MAP_ENTRY(hole_entry);
+			result->holelistenabled = TRUE;
+		} else {
+			result->holelistenabled = FALSE;
+		}
+	}
+
 	vm_map_lock_init(result);
-	mutex_init(&result->s_lock, ETAP_VM_RESULT);
+	lck_mtx_init_ext(&result->s_lock, &result->s_lock_ext, &vm_map_lck_grp, &vm_map_lck_attr);
 
-	return(result);
+	return result;
 }
 
 /*
@@ -403,220 +1238,112 @@ vm_map_create(
  *	Allocates a VM map entry for insertion in the
  *	given map (or map copy).  No fields are filled.
  */
-#define	vm_map_entry_create(map) \
-	    _vm_map_entry_create(&(map)->hdr)
+#define vm_map_entry_create(map, map_locked)    _vm_map_entry_create(&(map)->hdr, map_locked)
 
-#define	vm_map_copy_entry_create(copy) \
-	    _vm_map_entry_create(&(copy)->cpy_hdr)
+#define vm_map_copy_entry_create(copy, map_locked)                                      \
+	_vm_map_entry_create(&(copy)->cpy_hdr, map_locked)
+unsigned reserved_zalloc_count, nonreserved_zalloc_count;
 
-vm_map_entry_t
+static vm_map_entry_t
 _vm_map_entry_create(
-	register struct vm_map_header	*map_header)
+	struct vm_map_header    *map_header, boolean_t __unused map_locked)
 {
-	register zone_t	zone;
-	register vm_map_entry_t	entry;
+	zone_t  zone;
+	vm_map_entry_t  entry;
+
+	zone = vm_map_entry_zone;
+
+	assert(map_header->entries_pageable ? !map_locked : TRUE);
+
+	if (map_header->entries_pageable) {
+		entry = (vm_map_entry_t) zalloc(zone);
+	} else {
+		entry = (vm_map_entry_t) zalloc_canblock(zone, FALSE);
 
-	if (map_header->entries_pageable)
-	    zone = vm_map_entry_zone;
-	else
-	    zone = vm_map_kentry_zone;
+		if (entry == VM_MAP_ENTRY_NULL) {
+			zone = vm_map_entry_reserved_zone;
+			entry = (vm_map_entry_t) zalloc(zone);
+			OSAddAtomic(1, &reserved_zalloc_count);
+		} else {
+			OSAddAtomic(1, &nonreserved_zalloc_count);
+		}
+	}
 
-	entry = (vm_map_entry_t) zalloc(zone);
-	if (entry == VM_MAP_ENTRY_NULL)
+	if (entry == VM_MAP_ENTRY_NULL) {
 		panic("vm_map_entry_create");
+	}
+	entry->from_reserved_zone = (zone == vm_map_entry_reserved_zone);
 
-	return(entry);
+	vm_map_store_update((vm_map_t) NULL, entry, VM_MAP_ENTRY_CREATE);
+#if     MAP_ENTRY_CREATION_DEBUG
+	entry->vme_creation_maphdr = map_header;
+	backtrace(&entry->vme_creation_bt[0],
+	    (sizeof(entry->vme_creation_bt) / sizeof(uintptr_t)), NULL);
+#endif
+	return entry;
 }
 
 /*
  *	vm_map_entry_dispose:	[ internal use only ]
  *
  *	Inverse of vm_map_entry_create.
+ *
+ *      The write map lock is held, so nothing
+ *	special is needed to ensure correctness
+ *      of the stores.
  */
-#define	vm_map_entry_dispose(map, entry)			\
-MACRO_BEGIN							\
-	if((entry) == (map)->first_free)			\
-		(map)->first_free = vm_map_to_entry(map);	\
-	if((entry) == (map)->hint)				\
-		(map)->hint = vm_map_to_entry(map);		\
-	_vm_map_entry_dispose(&(map)->hdr, (entry));		\
-MACRO_END
+#define vm_map_entry_dispose(map, entry)                        \
+	_vm_map_entry_dispose(&(map)->hdr, (entry))
 
-#define	vm_map_copy_entry_dispose(map, entry) \
+#define vm_map_copy_entry_dispose(copy, entry) \
 	_vm_map_entry_dispose(&(copy)->cpy_hdr, (entry))
 
-void
+static void
 _vm_map_entry_dispose(
-	register struct vm_map_header	*map_header,
-	register vm_map_entry_t		entry)
+	struct vm_map_header    *map_header,
+	vm_map_entry_t          entry)
 {
-	register zone_t		zone;
+	zone_t          zone;
 
-	if (map_header->entries_pageable)
-	    zone = vm_map_entry_zone;
-	else
-	    zone = vm_map_kentry_zone;
+	if (map_header->entries_pageable || !(entry->from_reserved_zone)) {
+		zone = vm_map_entry_zone;
+	} else {
+		zone = vm_map_entry_reserved_zone;
+	}
+
+	if (!map_header->entries_pageable) {
+		if (zone == vm_map_entry_zone) {
+			OSAddAtomic(-1, &nonreserved_zalloc_count);
+		} else {
+			OSAddAtomic(-1, &reserved_zalloc_count);
+		}
+	}
 
-	zfree(zone, (vm_offset_t) entry);
+	zfree(zone, entry);
 }
 
-boolean_t first_free_is_valid(vm_map_t map);	/* forward */
-boolean_t first_free_check = FALSE;
+#if MACH_ASSERT
+static boolean_t first_free_check = FALSE;
 boolean_t
 first_free_is_valid(
-	vm_map_t	map)
+	vm_map_t        map)
 {
-	vm_map_entry_t	entry, next;
-
-	if (!first_free_check)
+	if (!first_free_check) {
 		return TRUE;
-		
-	entry = vm_map_to_entry(map);
-	next = entry->vme_next;
-	while (trunc_page(next->vme_start) == trunc_page(entry->vme_end) ||
-	       (trunc_page(next->vme_start) == trunc_page(entry->vme_start) &&
-		next != vm_map_to_entry(map))) {
-		entry = next;
-		next = entry->vme_next;
-		if (entry == vm_map_to_entry(map))
-			break;
-	}
-	if (map->first_free != entry) {
-		printf("Bad first_free for map 0x%x: 0x%x should be 0x%x\n",
-		       map, map->first_free, entry);
-		return FALSE;
 	}
-	return TRUE;
-}
-
-/*
- *	UPDATE_FIRST_FREE:
- *
- *	Updates the map->first_free pointer to the
- *	entry immediately before the first hole in the map.
- * 	The map should be locked.
- */
-#define UPDATE_FIRST_FREE(map, new_first_free) 				\
-MACRO_BEGIN 								\
-	vm_map_t	UFF_map; 					\
-	vm_map_entry_t	UFF_first_free; 				\
-	vm_map_entry_t	UFF_next_entry; 				\
-	UFF_map = (map); 						\
-	UFF_first_free = (new_first_free);				\
-	UFF_next_entry = UFF_first_free->vme_next; 			\
-	while (trunc_page(UFF_next_entry->vme_start) == 		\
-	       trunc_page(UFF_first_free->vme_end) || 			\
-	       (trunc_page(UFF_next_entry->vme_start) == 		\
-		trunc_page(UFF_first_free->vme_start) &&		\
-		UFF_next_entry != vm_map_to_entry(UFF_map))) { 		\
-		UFF_first_free = UFF_next_entry; 			\
-		UFF_next_entry = UFF_first_free->vme_next; 		\
-		if (UFF_first_free == vm_map_to_entry(UFF_map)) 	\
-			break; 						\
-	} 								\
-	UFF_map->first_free = UFF_first_free; 				\
-	assert(first_free_is_valid(UFF_map));				\
-MACRO_END
-
-/*
- *	vm_map_entry_{un,}link:
- *
- *	Insert/remove entries from maps (or map copies).
- */
-#define vm_map_entry_link(map, after_where, entry)			\
-MACRO_BEGIN 								\
-	vm_map_t VMEL_map; 						\
-	vm_map_entry_t VMEL_entry; 					\
-	VMEL_map = (map);						\
-	VMEL_entry = (entry); 						\
-	_vm_map_entry_link(&VMEL_map->hdr, after_where, VMEL_entry); 	\
-	UPDATE_FIRST_FREE(VMEL_map, VMEL_map->first_free); 		\
-MACRO_END
-
-
-#define vm_map_copy_entry_link(copy, after_where, entry)		\
-	_vm_map_entry_link(&(copy)->cpy_hdr, after_where, (entry))
-
-#define _vm_map_entry_link(hdr, after_where, entry)			\
-	MACRO_BEGIN							\
-	(hdr)->nentries++;						\
-	(entry)->vme_prev = (after_where);				\
-	(entry)->vme_next = (after_where)->vme_next;			\
-	(entry)->vme_prev->vme_next = (entry)->vme_next->vme_prev = (entry); \
-	MACRO_END
-
-#define vm_map_entry_unlink(map, entry)					\
-MACRO_BEGIN 								\
-	vm_map_t VMEU_map; 						\
-	vm_map_entry_t VMEU_entry; 					\
-	vm_map_entry_t VMEU_first_free;					\
-	VMEU_map = (map); 						\
-	VMEU_entry = (entry); 						\
-	if (VMEU_entry->vme_start <= VMEU_map->first_free->vme_start)	\
-		VMEU_first_free = VMEU_entry->vme_prev;			\
-	else								\
-		VMEU_first_free = VMEU_map->first_free;			\
-	_vm_map_entry_unlink(&VMEU_map->hdr, VMEU_entry); 		\
-	UPDATE_FIRST_FREE(VMEU_map, VMEU_first_free);			\
-MACRO_END
-
-#define vm_map_copy_entry_unlink(copy, entry)				\
-	_vm_map_entry_unlink(&(copy)->cpy_hdr, (entry))
-
-#define _vm_map_entry_unlink(hdr, entry)				\
-	MACRO_BEGIN							\
-	(hdr)->nentries--;						\
-	(entry)->vme_next->vme_prev = (entry)->vme_prev; 		\
-	(entry)->vme_prev->vme_next = (entry)->vme_next; 		\
-	MACRO_END
-
-/*
- *	kernel_vm_map_reference:
- *
- *	kernel internal export version for iokit and bsd components
- *	in lieu of component interface semantics.
- *
- */
-void
-kernel_vm_map_reference(
-	register vm_map_t	map)
-{
-	if (map == VM_MAP_NULL)
-		return;
 
-	mutex_lock(&map->s_lock);
-#if	TASK_SWAPPER
-	assert(map->res_count > 0);
-	assert(map->ref_count >= map->res_count);
-	map->res_count++;
-#endif
-	map->ref_count++;
-	mutex_unlock(&map->s_lock);
+	return first_free_is_valid_store( map );
 }
+#endif /* MACH_ASSERT */
 
-#if	MACH_ASSERT && TASK_SWAPPER
-/*
- *	vm_map_reference:
- *
- *	Adds valid reference and residence counts to the given map.
- * 	The map must be in memory (i.e. non-zero residence count).
- *
- */
-void
-vm_map_reference(
-	register vm_map_t	map)
-{
-	if (map == VM_MAP_NULL)
-		return;
 
-	mutex_lock(&map->s_lock);
-	assert(map->res_count > 0);
-	assert(map->ref_count >= map->res_count);
-	map->ref_count++;
-	map->res_count++;
-	mutex_unlock(&map->s_lock);
-}
+#define vm_map_copy_entry_link(copy, after_where, entry)                \
+	_vm_map_store_entry_link(&(copy)->cpy_hdr, after_where, (entry))
+
+#define vm_map_copy_entry_unlink(copy, entry)                           \
+	_vm_map_store_entry_unlink(&(copy)->cpy_hdr, (entry))
 
+#if     MACH_ASSERT && TASK_SWAPPER
 /*
  *	vm_map_res_reference:
  *
@@ -626,20 +1353,22 @@ vm_map_reference(
  *	vm_map_swapin.
  *
  */
-void vm_map_res_reference(register vm_map_t map)
+void
+vm_map_res_reference(vm_map_t map)
 {
 	/* assert map is locked */
 	assert(map->res_count >= 0);
-	assert(map->ref_count >= map->res_count);
+	assert(os_ref_get_count(&map->map_refcnt) >= map->res_count);
 	if (map->res_count == 0) {
-		mutex_unlock(&map->s_lock);
+		lck_mtx_unlock(&map->s_lock);
 		vm_map_lock(map);
 		vm_map_swapin(map);
-		mutex_lock(&map->s_lock);
+		lck_mtx_lock(&map->s_lock);
 		++map->res_count;
 		vm_map_unlock(map);
-	} else
+	} else {
 		++map->res_count;
+	}
 }
 
 /*
@@ -650,15 +1379,16 @@ void vm_map_res_reference(register vm_map_t map)
  *	The map may not be in memory (i.e. zero residence count).
  *
  */
-void vm_map_reference_swap(register vm_map_t map)
+void
+vm_map_reference_swap(vm_map_t map)
 {
 	assert(map != VM_MAP_NULL);
-	mutex_lock(&map->s_lock);
+	lck_mtx_lock(&map->s_lock);
 	assert(map->res_count >= 0);
-	assert(map->ref_count >= map->res_count);
-	map->ref_count++;
+	assert(os_ref_get_count(&map->map_refcnt) >= map->res_count);
+	os_ref_retain_locked(&map->map_refcnt);
 	vm_map_res_reference(map);
-	mutex_unlock(&map->s_lock);
+	lck_mtx_unlock(&map->s_lock);
 }
 
 /*
@@ -671,87 +1401,128 @@ void vm_map_reference_swap(register vm_map_t map)
  *	The map is locked, so this function is callable from vm_map_deallocate.
  *
  */
-void vm_map_res_deallocate(register vm_map_t map)
+void
+vm_map_res_deallocate(vm_map_t map)
 {
 	assert(map->res_count > 0);
 	if (--map->res_count == 0) {
-		mutex_unlock(&map->s_lock);
+		lck_mtx_unlock(&map->s_lock);
 		vm_map_lock(map);
 		vm_map_swapout(map);
 		vm_map_unlock(map);
-		mutex_lock(&map->s_lock);
+		lck_mtx_lock(&map->s_lock);
 	}
-	assert(map->ref_count >= map->res_count);
+	assert(os_ref_get_count(&map->map_refcnt) >= map->res_count);
 }
-#endif	/* MACH_ASSERT && TASK_SWAPPER */
+#endif  /* MACH_ASSERT && TASK_SWAPPER */
 
 /*
- *	vm_map_deallocate:
+ *	vm_map_destroy:
  *
- *	Removes a reference from the specified map,
- *	destroying it if no references remain.
- *	The map should not be locked.
+ *	Actually destroy a map.
  */
 void
-vm_map_deallocate(
-	register vm_map_t	map)
+vm_map_destroy(
+	vm_map_t        map,
+	int             flags)
 {
-	unsigned int		ref;
+	vm_map_lock(map);
 
-	if (map == VM_MAP_NULL)
-		return;
+	/* final cleanup: no need to unnest shared region */
+	flags |= VM_MAP_REMOVE_NO_UNNESTING;
+	/* final cleanup: ok to remove immutable mappings */
+	flags |= VM_MAP_REMOVE_IMMUTABLE;
+	/* final cleanup: allow gaps in range */
+	flags |= VM_MAP_REMOVE_GAPS_OK;
+
+	/* clean up regular map entries */
+	(void) vm_map_delete(map, map->min_offset, map->max_offset,
+	    flags, VM_MAP_NULL);
+	/* clean up leftover special mappings (commpage, etc...) */
+#if     !defined(__arm__) && !defined(__arm64__)
+	(void) vm_map_delete(map, 0x0, 0xFFFFFFFFFFFFF000ULL,
+	    flags, VM_MAP_NULL);
+#endif /* !__arm__ && !__arm64__ */
+
+	vm_map_disable_hole_optimization(map);
+	vm_map_corpse_footprint_destroy(map);
 
-	mutex_lock(&map->s_lock);
-	ref = --map->ref_count;
-	if (ref > 0) {
-		vm_map_res_deallocate(map);
-		mutex_unlock(&map->s_lock);
-		return;
+	vm_map_unlock(map);
+
+	assert(map->hdr.nentries == 0);
+
+	if (map->pmap) {
+		pmap_destroy(map->pmap);
 	}
-	assert(map->ref_count == 0);
-	mutex_unlock(&map->s_lock);
 
-#if	TASK_SWAPPER
-	/*
-	 * The map residence count isn't decremented here because
-	 * the vm_map_delete below will traverse the entire map, 
-	 * deleting entries, and the residence counts on objects
-	 * and sharing maps will go away then.
-	 */
-#endif
+	if (vm_map_lck_attr.lck_attr_val & LCK_ATTR_DEBUG) {
+		/*
+		 * If lock debugging is enabled the mutexes get tagged as LCK_MTX_TAG_INDIRECT.
+		 * And this is regardless of whether the lck_mtx_ext_t is embedded in the
+		 * structure or kalloc'ed via lck_mtx_init.
+		 * An example is s_lock_ext within struct _vm_map.
+		 *
+		 * A lck_mtx_destroy on such a mutex will attempt a kfree and panic. We
+		 * can add another tag to detect embedded vs alloc'ed indirect external
+		 * mutexes but that'll be additional checks in the lock path and require
+		 * updating dependencies for the old vs new tag.
+		 *
+		 * Since the kfree() is for LCK_MTX_TAG_INDIRECT mutexes and that tag is applied
+		 * just when lock debugging is ON, we choose to forego explicitly destroying
+		 * the vm_map mutex and rw lock and, as a consequence, will overflow the reference
+		 * count on vm_map_lck_grp, which has no serious side-effect.
+		 */
+	} else {
+		lck_rw_destroy(&(map)->lock, &vm_map_lck_grp);
+		lck_mtx_destroy(&(map)->s_lock, &vm_map_lck_grp);
+	}
 
-	vm_map_destroy(map);
+	zfree(vm_map_zone, map);
 }
 
 /*
- *	vm_map_destroy:
- *
- *	Actually destroy a map.
+ * Returns pid of the task with the largest number of VM map entries.
+ * Used in the zone-map-exhaustion jetsam path.
  */
-void
-vm_map_destroy(
-	register vm_map_t	map)
+pid_t
+find_largest_process_vm_map_entries(void)
 {
-	vm_map_lock(map);
-	(void) vm_map_delete(map, map->min_offset,
-			     map->max_offset, VM_MAP_NO_FLAGS);
-	vm_map_unlock(map);
+	pid_t victim_pid = -1;
+	int max_vm_map_entries = 0;
+	task_t task = TASK_NULL;
+	queue_head_t *task_list = &tasks;
+
+	lck_mtx_lock(&tasks_threads_lock);
+	queue_iterate(task_list, task, task_t, tasks) {
+		if (task == kernel_task || !task->active) {
+			continue;
+		}
 
-	pmap_destroy(map->pmap);
+		vm_map_t task_map = task->map;
+		if (task_map != VM_MAP_NULL) {
+			int task_vm_map_entries = task_map->hdr.nentries;
+			if (task_vm_map_entries > max_vm_map_entries) {
+				max_vm_map_entries = task_vm_map_entries;
+				victim_pid = pid_from_task(task);
+			}
+		}
+	}
+	lck_mtx_unlock(&tasks_threads_lock);
 
-	zfree(vm_map_zone, (vm_offset_t) map);
+	printf("zone_map_exhaustion: victim pid %d, vm region count: %d\n", victim_pid, max_vm_map_entries);
+	return victim_pid;
 }
 
-#if	TASK_SWAPPER
+#if     TASK_SWAPPER
 /*
  * vm_map_swapin/vm_map_swapout
  *
- * Swap a map in and out, either referencing or releasing its resources.  
+ * Swap a map in and out, either referencing or releasing its resources.
  * These functions are internal use only; however, they must be exported
  * because they may be called from macros, which are exported.
  *
- * In the case of swapout, there could be races on the residence count, 
- * so if the residence count is up, we return, assuming that a 
+ * In the case of swapout, there could be races on the residence count,
+ * so if the residence count is up, we return, assuming that a
  * vm_map_deallocate() call in the near future will bring us back.
  *
  * Locking:
@@ -767,7 +1538,7 @@ vm_map_destroy(
  *	2) A vm_map_reference() call at this time is illegal, and will
  *	cause a panic.  vm_map_reference() is only allowed on resident
  *	maps, since it refuses to block.
- *	3) A vm_map_swapin() call during a swapin will block, and 
+ *	3) A vm_map_swapin() call during a swapin will block, and
  *	proceeed when the first swapin is done, turning into a nop.
  *	This is the reason the res_count is not incremented until
  *	after the swapin is complete.
@@ -775,9 +1546,9 @@ vm_map_destroy(
  *	the map lock is taken, during which a swapin may get the lock
  *	before a swapout about to happen.  If this happens, the swapin
  *	will detect the state and increment the reference count, causing
- *	the swapout to be a nop, thereby delaying it until a later 
- *	vm_map_deallocate.  If the swapout gets the lock first, then 
- *	the swapin will simply block until the swapout is done, and 
+ *	the swapout to be a nop, thereby delaying it until a later
+ *	vm_map_deallocate.  If the swapout gets the lock first, then
+ *	the swapin will simply block until the swapout is done, and
  *	then proceed.
  *
  * Because vm_map_swapin() is potentially an expensive operation, it
@@ -792,23 +1563,26 @@ vm_map_destroy(
 
 int vm_map_swap_enable = 1;
 
-void vm_map_swapin (vm_map_t map)
+void
+vm_map_swapin(vm_map_t map)
 {
-	register vm_map_entry_t entry;
-	
-	if (!vm_map_swap_enable)	/* debug */
+	vm_map_entry_t entry;
+
+	if (!vm_map_swap_enable) {      /* debug */
 		return;
+	}
 
 	/*
 	 * Map is locked
 	 * First deal with various races.
 	 */
-	if (map->sw_state == MAP_SW_IN)
-		/* 
+	if (map->sw_state == MAP_SW_IN) {
+		/*
 		 * we raced with swapout and won.  Returning will incr.
 		 * the res_count, turning the swapout into a nop.
 		 */
 		return;
+	}
 
 	/*
 	 * The residence count must be zero.  If we raced with another
@@ -826,7 +1600,7 @@ void vm_map_swapin (vm_map_t map)
 	assert(map->sw_state == MAP_SW_OUT);
 
 	/*
-	 * We now operate upon each map entry.  If the entry is a sub- 
+	 * We now operate upon each map entry.  If the entry is a sub-
 	 * or share-map, we call vm_map_res_reference upon it.
 	 * If the entry is an object, we call vm_object_res_reference
 	 * (this may iterate through the shadow chain).
@@ -837,14 +1611,14 @@ void vm_map_swapin (vm_map_t map)
 	entry = vm_map_first_entry(map);
 
 	while (entry != vm_map_to_entry(map)) {
-		if (entry->object.vm_object != VM_OBJECT_NULL) {
+		if (VME_OBJECT(entry) != VM_OBJECT_NULL) {
 			if (entry->is_sub_map) {
-				vm_map_t lmap = entry->object.sub_map;
-				mutex_lock(&lmap->s_lock);
+				vm_map_t lmap = VME_SUBMAP(entry);
+				lck_mtx_lock(&lmap->s_lock);
 				vm_map_res_reference(lmap);
-				mutex_unlock(&lmap->s_lock);
+				lck_mtx_unlock(&lmap->s_lock);
 			} else {
-				vm_object_t object = entry->object.vm_object;
+				vm_object_t object = VME_OBJECT(entry);
 				vm_object_lock(object);
 				/*
 				 * This call may iterate through the
@@ -860,22 +1634,23 @@ void vm_map_swapin (vm_map_t map)
 	map->sw_state = MAP_SW_IN;
 }
 
-void vm_map_swapout(vm_map_t map)
+void
+vm_map_swapout(vm_map_t map)
 {
-	register vm_map_entry_t entry;
-	
+	vm_map_entry_t entry;
+
 	/*
 	 * Map is locked
 	 * First deal with various races.
 	 * If we raced with a swapin and lost, the residence count
 	 * will have been incremented to 1, and we simply return.
 	 */
-	mutex_lock(&map->s_lock);
+	lck_mtx_lock(&map->s_lock);
 	if (map->res_count != 0) {
-		mutex_unlock(&map->s_lock);
+		lck_mtx_unlock(&map->s_lock);
 		return;
 	}
-	mutex_unlock(&map->s_lock);
+	lck_mtx_unlock(&map->s_lock);
 
 	/*
 	 * There are no intermediate states of a map going out or
@@ -883,11 +1658,12 @@ void vm_map_swapout(vm_map_t map)
 	 */
 	assert(map->sw_state == MAP_SW_IN);
 
-	if (!vm_map_swap_enable)
+	if (!vm_map_swap_enable) {
 		return;
+	}
 
 	/*
-	 * We now operate upon each map entry.  If the entry is a sub- 
+	 * We now operate upon each map entry.  If the entry is a sub-
 	 * or share-map, we call vm_map_res_deallocate upon it.
 	 * If the entry is an object, we call vm_object_res_deallocate
 	 * (this may iterate through the shadow chain).
@@ -898,19 +1674,19 @@ void vm_map_swapout(vm_map_t map)
 	entry = vm_map_first_entry(map);
 
 	while (entry != vm_map_to_entry(map)) {
-		if (entry->object.vm_object != VM_OBJECT_NULL) {
+		if (VME_OBJECT(entry) != VM_OBJECT_NULL) {
 			if (entry->is_sub_map) {
-				vm_map_t lmap = entry->object.sub_map;
-				mutex_lock(&lmap->s_lock);
+				vm_map_t lmap = VME_SUBMAP(entry);
+				lck_mtx_lock(&lmap->s_lock);
 				vm_map_res_deallocate(lmap);
-				mutex_unlock(&lmap->s_lock);
+				lck_mtx_unlock(&lmap->s_lock);
 			} else {
-				vm_object_t object = entry->object.vm_object;
+				vm_object_t object = VME_OBJECT(entry);
 				vm_object_lock(object);
 				/*
-				 * This call may take a long time, 
-				 * since it could actively push 
-				 * out pages (if we implement it 
+				 * This call may take a long time,
+				 * since it could actively push
+				 * out pages (if we implement it
 				 * that way).
 				 */
 				vm_object_res_deallocate(object);
@@ -923,100 +1699,25 @@ void vm_map_swapout(vm_map_t map)
 	map->sw_state = MAP_SW_OUT;
 }
 
-#endif	/* TASK_SWAPPER */
-
-
-/*
- *	SAVE_HINT:
- *
- *	Saves the specified entry as the hint for
- *	future lookups.  Performs necessary interlocks.
- */
-#define	SAVE_HINT(map,value) \
-		mutex_lock(&(map)->s_lock); \
-		(map)->hint = (value); \
-		mutex_unlock(&(map)->s_lock);
+#endif  /* TASK_SWAPPER */
 
 /*
  *	vm_map_lookup_entry:	[ internal use only ]
  *
- *	Finds the map entry containing (or
- *	immediately preceding) the specified address
- *	in the given map; the entry is returned
+ *	Calls into the vm map store layer to find the map
+ *	entry containing (or immediately preceding) the
+ *	specified address in the given map; the entry is returned
  *	in the "entry" parameter.  The boolean
  *	result indicates whether the address is
  *	actually contained in the map.
  */
 boolean_t
 vm_map_lookup_entry(
-	register vm_map_t	map,
-	register vm_offset_t	address,
-	vm_map_entry_t		*entry)		/* OUT */
+	vm_map_t                map,
+	vm_map_offset_t address,
+	vm_map_entry_t          *entry)         /* OUT */
 {
-	register vm_map_entry_t		cur;
-	register vm_map_entry_t		last;
-
-	/*
-	 *	Start looking either from the head of the
-	 *	list, or from the hint.
-	 */
-
-	mutex_lock(&map->s_lock);
-	cur = map->hint;
-	mutex_unlock(&map->s_lock);
-
-	if (cur == vm_map_to_entry(map))
-		cur = cur->vme_next;
-
-	if (address >= cur->vme_start) {
-	    	/*
-		 *	Go from hint to end of list.
-		 *
-		 *	But first, make a quick check to see if
-		 *	we are already looking at the entry we
-		 *	want (which is usually the case).
-		 *	Note also that we don't need to save the hint
-		 *	here... it is the same hint (unless we are
-		 *	at the header, in which case the hint didn't
-		 *	buy us anything anyway).
-		 */
-		last = vm_map_to_entry(map);
-		if ((cur != last) && (cur->vme_end > address)) {
-			*entry = cur;
-			return(TRUE);
-		}
-	}
-	else {
-	    	/*
-		 *	Go from start to hint, *inclusively*
-		 */
-		last = cur->vme_next;
-		cur = vm_map_first_entry(map);
-	}
-
-	/*
-	 *	Search linearly
-	 */
-
-	while (cur != last) {
-		if (cur->vme_end > address) {
-			if (address >= cur->vme_start) {
-			    	/*
-				 *	Save this lookup for future
-				 *	hints, and return
-				 */
-
-				*entry = cur;
-				SAVE_HINT(map, cur);
-				return(TRUE);
-			}
-			break;
-		}
-		cur = cur->vme_next;
-	}
-	*entry = cur->vme_prev;
-	SAVE_HINT(map, *entry);
-	return(FALSE);
+	return vm_map_store_lookup_entry( map, address, entry );
 }
 
 /*
@@ -1034,17 +1735,31 @@ vm_map_lookup_entry(
  */
 kern_return_t
 vm_map_find_space(
-	register vm_map_t	map,
-	vm_offset_t		*address,	/* OUT */
-	vm_size_t		size,
-	vm_offset_t		mask,
-	vm_map_entry_t		*o_entry)	/* OUT */
+	vm_map_t        map,
+	vm_map_offset_t         *address,       /* OUT */
+	vm_map_size_t           size,
+	vm_map_offset_t         mask,
+	int                     flags __unused,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	vm_map_entry_t          *o_entry)       /* OUT */
 {
-	register vm_map_entry_t	entry, new_entry;
-	register vm_offset_t	start;
-	register vm_offset_t	end;
+	vm_map_entry_t                  entry, new_entry;
+	vm_map_offset_t start;
+	vm_map_offset_t end;
+	vm_map_entry_t                  hole_entry;
 
-	new_entry = vm_map_entry_create(map);
+	if (size == 0) {
+		*address = 0;
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	if (vmk_flags.vmkf_guard_after) {
+		/* account for the back guard page in the size */
+		size += VM_MAP_PAGE_SIZE(map);
+	}
+
+	new_entry = vm_map_entry_create(map, FALSE);
 
 	/*
 	 *	Look for the first possible address; if there's already
@@ -1053,11 +1768,32 @@ vm_map_find_space(
 
 	vm_map_lock(map);
 
-	assert(first_free_is_valid(map));
-	if ((entry = map->first_free) == vm_map_to_entry(map))
-		start = map->min_offset;
-	else
-		start = entry->vme_end;
+	if (map->disable_vmentry_reuse == TRUE) {
+		VM_MAP_HIGHEST_ENTRY(map, entry, start);
+	} else {
+		if (map->holelistenabled) {
+			hole_entry = CAST_TO_VM_MAP_ENTRY(map->holes_list);
+
+			if (hole_entry == NULL) {
+				/*
+				 * No more space in the map?
+				 */
+				vm_map_entry_dispose(map, new_entry);
+				vm_map_unlock(map);
+				return KERN_NO_SPACE;
+			}
+
+			entry = hole_entry;
+			start = entry->vme_start;
+		} else {
+			assert(first_free_is_valid(map));
+			if ((entry = map->first_free) == vm_map_to_entry(map)) {
+				start = map->min_offset;
+			} else {
+				start = entry->vme_end;
+			}
+		}
+	}
 
 	/*
 	 *	In any case, the "entry" always precedes
@@ -1065,7 +1801,7 @@ vm_map_find_space(
 	 */
 
 	while (TRUE) {
-		register vm_map_entry_t	next;
+		vm_map_entry_t  next;
 
 		/*
 		 *	Find the end of the proposed new region.
@@ -1073,43 +1809,78 @@ vm_map_find_space(
 		 *	wrap around the address.
 		 */
 
+		if (vmk_flags.vmkf_guard_before) {
+			/* reserve space for the front guard page */
+			start += VM_MAP_PAGE_SIZE(map);
+		}
 		end = ((start + mask) & ~mask);
+
 		if (end < start) {
 			vm_map_entry_dispose(map, new_entry);
 			vm_map_unlock(map);
-			return(KERN_NO_SPACE);
+			return KERN_NO_SPACE;
 		}
 		start = end;
+		assert(VM_MAP_PAGE_ALIGNED(start, VM_MAP_PAGE_MASK(map)));
 		end += size;
+		assert(VM_MAP_PAGE_ALIGNED(end, VM_MAP_PAGE_MASK(map)));
 
 		if ((end > map->max_offset) || (end < start)) {
 			vm_map_entry_dispose(map, new_entry);
 			vm_map_unlock(map);
-			return(KERN_NO_SPACE);
+			return KERN_NO_SPACE;
 		}
 
-		/*
-		 *	If there are no more entries, we must win.
-		 */
-
 		next = entry->vme_next;
-		if (next == vm_map_to_entry(map))
-			break;
 
-		/*
-		 *	If there is another entry, it must be
-		 *	after the end of the potential new region.
-		 */
+		if (map->holelistenabled) {
+			if (entry->vme_end >= end) {
+				break;
+			}
+		} else {
+			/*
+			 *	If there are no more entries, we must win.
+			 *
+			 *	OR
+			 *
+			 *	If there is another entry, it must be
+			 *	after the end of the potential new region.
+			 */
 
-		if (next->vme_start >= end)
-			break;
+			if (next == vm_map_to_entry(map)) {
+				break;
+			}
+
+			if (next->vme_start >= end) {
+				break;
+			}
+		}
 
 		/*
 		 *	Didn't fit -- move to the next entry.
 		 */
 
 		entry = next;
-		start = entry->vme_end;
+
+		if (map->holelistenabled) {
+			if (entry == CAST_TO_VM_MAP_ENTRY(map->holes_list)) {
+				/*
+				 * Wrapped around
+				 */
+				vm_map_entry_dispose(map, new_entry);
+				vm_map_unlock(map);
+				return KERN_NO_SPACE;
+			}
+			start = entry->vme_start;
+		} else {
+			start = entry->vme_end;
+		}
+	}
+
+	if (map->holelistenabled) {
+		if (vm_map_lookup_entry(map, entry->vme_start, &entry)) {
+			panic("Found an existing entry (%p) instead of potential hole at address: 0x%llx.\n", entry, (unsigned long long)entry->vme_start);
+		}
 	}
 
 	/*
@@ -1122,18 +1893,27 @@ vm_map_find_space(
 	 *		the map should be locked.
 	 */
 
+	if (vmk_flags.vmkf_guard_before) {
+		/* go back for the front guard page */
+		start -= VM_MAP_PAGE_SIZE(map);
+	}
 	*address = start;
 
+	assert(start < end);
 	new_entry->vme_start = start;
 	new_entry->vme_end = end;
 	assert(page_aligned(new_entry->vme_start));
 	assert(page_aligned(new_entry->vme_end));
+	assert(VM_MAP_PAGE_ALIGNED(new_entry->vme_start,
+	    VM_MAP_PAGE_MASK(map)));
+	assert(VM_MAP_PAGE_ALIGNED(new_entry->vme_end,
+	    VM_MAP_PAGE_MASK(map)));
 
 	new_entry->is_shared = FALSE;
 	new_entry->is_sub_map = FALSE;
-	new_entry->use_pmap = FALSE;
-	new_entry->object.vm_object = VM_OBJECT_NULL;
-	new_entry->offset = (vm_object_offset_t) 0;
+	new_entry->use_pmap = TRUE;
+	VME_OBJECT_SET(new_entry, VM_OBJECT_NULL);
+	VME_OFFSET_SET(new_entry, (vm_object_offset_t) 0);
 
 	new_entry->needs_copy = FALSE;
 
@@ -1146,29 +1926,51 @@ vm_map_find_space(
 
 	new_entry->in_transition = FALSE;
 	new_entry->needs_wakeup = FALSE;
+	new_entry->no_cache = FALSE;
+	new_entry->permanent = FALSE;
+	new_entry->superpage_size = FALSE;
+	if (VM_MAP_PAGE_SHIFT(map) != PAGE_SHIFT) {
+		new_entry->map_aligned = TRUE;
+	} else {
+		new_entry->map_aligned = FALSE;
+	}
+
+	new_entry->used_for_jit = FALSE;
+	new_entry->pmap_cs_associated = FALSE;
+	new_entry->zero_wired_pages = FALSE;
+	new_entry->iokit_acct = FALSE;
+	new_entry->vme_resilient_codesign = FALSE;
+	new_entry->vme_resilient_media = FALSE;
+	if (vmk_flags.vmkf_atomic_entry) {
+		new_entry->vme_atomic = TRUE;
+	} else {
+		new_entry->vme_atomic = FALSE;
+	}
+
+	VME_ALIAS_SET(new_entry, tag);
 
 	/*
 	 *	Insert the new entry into the list
 	 */
 
-	vm_map_entry_link(map, entry, new_entry);
+	vm_map_store_entry_link(map, entry, new_entry, VM_MAP_KERNEL_FLAGS_NONE);
 
 	map->size += size;
 
 	/*
 	 *	Update the lookup hint
 	 */
-	SAVE_HINT(map, new_entry);
+	SAVE_HINT_MAP_WRITE(map, new_entry);
 
 	*o_entry = new_entry;
-	return(KERN_SUCCESS);
+	return KERN_SUCCESS;
 }
 
 int vm_map_pmap_enter_print = FALSE;
 int vm_map_pmap_enter_enable = FALSE;
 
 /*
- *	Routine:	vm_map_pmap_enter
+ *	Routine:	vm_map_pmap_enter [internal only]
  *
  *	Description:
  *		Force pages from the specified object to be entered into
@@ -1176,69 +1978,178 @@ int vm_map_pmap_enter_enable = FALSE;
  *		As soon as a page not found in the object the scan ends.
  *
  *	Returns:
- *		Nothing.  
+ *		Nothing.
  *
  *	In/out conditions:
  *		The source map should not be locked on entry.
  */
-void
+__unused static void
 vm_map_pmap_enter(
-	vm_map_t		map,
-	register vm_offset_t 	addr,
-	register vm_offset_t	end_addr,
-	register vm_object_t 	object,
-	vm_object_offset_t	offset,
-	vm_prot_t		protection)
+	vm_map_t                map,
+	vm_map_offset_t         addr,
+	vm_map_offset_t         end_addr,
+	vm_object_t             object,
+	vm_object_offset_t      offset,
+	vm_prot_t               protection)
 {
+	int                     type_of_fault;
+	kern_return_t           kr;
+	struct vm_object_fault_info fault_info = {};
+
+	if (map->pmap == 0) {
+		return;
+	}
 
 	while (addr < end_addr) {
-		register vm_page_t	m;
+		vm_page_t       m;
+
+
+		/*
+		 * TODO:
+		 * From vm_map_enter(), we come into this function without the map
+		 * lock held or the object lock held.
+		 * We haven't taken a reference on the object either.
+		 * We should do a proper lookup on the map to make sure
+		 * that things are sane before we go locking objects that
+		 * could have been deallocated from under us.
+		 */
 
 		vm_object_lock(object);
-		vm_object_paging_begin(object);
 
 		m = vm_page_lookup(object, offset);
-		if (m == VM_PAGE_NULL || m->busy ||
-		    (m->unusual && ( m->error || m->restart || m->absent ||
-				    protection & m->page_lock))) {
 
-			vm_object_paging_end(object);
+		if (m == VM_PAGE_NULL || m->vmp_busy || m->vmp_fictitious ||
+		    (m->vmp_unusual && (m->vmp_error || m->vmp_restart || m->vmp_absent))) {
 			vm_object_unlock(object);
 			return;
 		}
 
-		assert(!m->fictitious);	/* XXX is this possible ??? */
-
 		if (vm_map_pmap_enter_print) {
 			printf("vm_map_pmap_enter:");
-			printf("map: %x, addr: %x, object: %x, offset: %x\n",
-				map, addr, object, offset);
+			printf("map: %p, addr: %llx, object: %p, offset: %llx\n",
+			    map, (unsigned long long)addr, object, (unsigned long long)offset);
 		}
-		m->busy = TRUE;
+		type_of_fault = DBG_CACHE_HIT_FAULT;
+		kr = vm_fault_enter(m, map->pmap,
+		    addr, protection, protection,
+		    VM_PAGE_WIRED(m),
+		    FALSE,                 /* change_wiring */
+		    VM_KERN_MEMORY_NONE,                 /* tag - not wiring */
+		    &fault_info,
+		    NULL,                  /* need_retry */
+		    &type_of_fault);
+
+		vm_object_unlock(object);
+
+		offset += PAGE_SIZE_64;
+		addr += PAGE_SIZE;
+	}
+}
+
+boolean_t vm_map_pmap_is_empty(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end);
+boolean_t
+vm_map_pmap_is_empty(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end)
+{
+#ifdef MACHINE_PMAP_IS_EMPTY
+	return pmap_is_empty(map->pmap, start, end);
+#else   /* MACHINE_PMAP_IS_EMPTY */
+	vm_map_offset_t offset;
+	ppnum_t         phys_page;
 
-		if (m->no_isync == TRUE) {
-		        pmap_sync_caches_phys(m->phys_addr);
+	if (map->pmap == NULL) {
+		return TRUE;
+	}
 
-			m->no_isync = FALSE;
+	for (offset = start;
+	    offset < end;
+	    offset += PAGE_SIZE) {
+		phys_page = pmap_find_phys(map->pmap, offset);
+		if (phys_page) {
+			kprintf("vm_map_pmap_is_empty(%p,0x%llx,0x%llx): "
+			    "page %d at 0x%llx\n",
+			    map, (long long)start, (long long)end,
+			    phys_page, (long long)offset);
+			return FALSE;
 		}
-		vm_object_unlock(object);
+	}
+	return TRUE;
+#endif  /* MACHINE_PMAP_IS_EMPTY */
+}
 
-		PMAP_ENTER(map->pmap, addr, m,
-			   protection, FALSE);
+#define MAX_TRIES_TO_GET_RANDOM_ADDRESS 1000
+kern_return_t
+vm_map_random_address_for_size(
+	vm_map_t        map,
+	vm_map_offset_t *address,
+	vm_map_size_t   size)
+{
+	kern_return_t   kr = KERN_SUCCESS;
+	int             tries = 0;
+	vm_map_offset_t random_addr = 0;
+	vm_map_offset_t hole_end;
 
-		vm_object_lock(object);
+	vm_map_entry_t  next_entry = VM_MAP_ENTRY_NULL;
+	vm_map_entry_t  prev_entry = VM_MAP_ENTRY_NULL;
+	vm_map_size_t   vm_hole_size = 0;
+	vm_map_size_t   addr_space_size;
 
-		PAGE_WAKEUP_DONE(m);
-		vm_page_lock_queues();
-		if (!m->active && !m->inactive)
-		    vm_page_activate(m);
-		vm_page_unlock_queues();
-		vm_object_paging_end(object);
-		vm_object_unlock(object);
+	addr_space_size = vm_map_max(map) - vm_map_min(map);
 
-		offset += PAGE_SIZE_64;
-		addr += PAGE_SIZE;
+	assert(page_aligned(size));
+
+	while (tries < MAX_TRIES_TO_GET_RANDOM_ADDRESS) {
+		random_addr = ((vm_map_offset_t)random()) << PAGE_SHIFT;
+		random_addr = vm_map_trunc_page(
+			vm_map_min(map) + (random_addr % addr_space_size),
+			VM_MAP_PAGE_MASK(map));
+
+		if (vm_map_lookup_entry(map, random_addr, &prev_entry) == FALSE) {
+			if (prev_entry == vm_map_to_entry(map)) {
+				next_entry = vm_map_first_entry(map);
+			} else {
+				next_entry = prev_entry->vme_next;
+			}
+			if (next_entry == vm_map_to_entry(map)) {
+				hole_end = vm_map_max(map);
+			} else {
+				hole_end = next_entry->vme_start;
+			}
+			vm_hole_size = hole_end - random_addr;
+			if (vm_hole_size >= size) {
+				*address = random_addr;
+				break;
+			}
+		}
+		tries++;
+	}
+
+	if (tries == MAX_TRIES_TO_GET_RANDOM_ADDRESS) {
+		kr = KERN_NO_SPACE;
+	}
+	return kr;
+}
+
+static boolean_t
+vm_memory_malloc_no_cow(
+	int alias)
+{
+	uint64_t alias_mask;
+
+	if (alias > 63) {
+		return FALSE;
+	}
+
+	alias_mask = 1ULL << alias;
+	if (alias_mask & vm_memory_malloc_no_cow_mask) {
+		return TRUE;
 	}
+	return FALSE;
 }
 
 /*
@@ -1251,49 +2162,335 @@ vm_map_pmap_enter(
  *
  *		Arguments are as defined in the vm_map call.
  */
+int _map_enter_debug = 0;
+static unsigned int vm_map_enter_restore_successes = 0;
+static unsigned int vm_map_enter_restore_failures = 0;
 kern_return_t
 vm_map_enter(
-	register vm_map_t	map,
-	vm_offset_t		*address,	/* IN/OUT */
-	vm_size_t		size,
-	vm_offset_t		mask,
-	int			flags,
-	vm_object_t		object,
-	vm_object_offset_t	offset,
-	boolean_t		needs_copy,
-	vm_prot_t		cur_protection,
-	vm_prot_t		max_protection,
-	vm_inherit_t		inheritance)
-{
-	vm_map_entry_t		entry;
-	register vm_offset_t	start;
-	register vm_offset_t	end;
-	kern_return_t		result = KERN_SUCCESS;
-
-	boolean_t		anywhere = VM_FLAGS_ANYWHERE & flags;
-	char			alias;
-
-	VM_GET_FLAGS_ALIAS(flags, alias);
-
-#define	RETURN(value)	{ result = value; goto BailOut; }
-
-	assert(page_aligned(*address));
+	vm_map_t                map,
+	vm_map_offset_t         *address,       /* IN/OUT */
+	vm_map_size_t           size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                alias,
+	vm_object_t             object,
+	vm_object_offset_t      offset,
+	boolean_t               needs_copy,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_inherit_t            inheritance)
+{
+	vm_map_entry_t          entry, new_entry;
+	vm_map_offset_t         start, tmp_start, tmp_offset;
+	vm_map_offset_t         end, tmp_end;
+	vm_map_offset_t         tmp2_start, tmp2_end;
+	vm_map_offset_t         desired_empty_end;
+	vm_map_offset_t         step;
+	kern_return_t           result = KERN_SUCCESS;
+	vm_map_t                zap_old_map = VM_MAP_NULL;
+	vm_map_t                zap_new_map = VM_MAP_NULL;
+	boolean_t               map_locked = FALSE;
+	boolean_t               pmap_empty = TRUE;
+	boolean_t               new_mapping_established = FALSE;
+	boolean_t               keep_map_locked = vmk_flags.vmkf_keep_map_locked;
+	boolean_t               anywhere = ((flags & VM_FLAGS_ANYWHERE) != 0);
+	boolean_t               purgable = ((flags & VM_FLAGS_PURGABLE) != 0);
+	boolean_t               overwrite = ((flags & VM_FLAGS_OVERWRITE) != 0);
+	boolean_t               no_cache = ((flags & VM_FLAGS_NO_CACHE) != 0);
+	boolean_t               is_submap = vmk_flags.vmkf_submap;
+	boolean_t               permanent = vmk_flags.vmkf_permanent;
+	boolean_t               no_copy_on_read = vmk_flags.vmkf_no_copy_on_read;
+	boolean_t               entry_for_jit = vmk_flags.vmkf_map_jit;
+	boolean_t               iokit_acct = vmk_flags.vmkf_iokit_acct;
+	boolean_t               resilient_codesign = ((flags & VM_FLAGS_RESILIENT_CODESIGN) != 0);
+	boolean_t               resilient_media = ((flags & VM_FLAGS_RESILIENT_MEDIA) != 0);
+	boolean_t               random_address = ((flags & VM_FLAGS_RANDOM_ADDR) != 0);
+	unsigned int            superpage_size = ((flags & VM_FLAGS_SUPERPAGE_MASK) >> VM_FLAGS_SUPERPAGE_SHIFT);
+	vm_tag_t                user_alias;
+	vm_map_offset_t         effective_min_offset, effective_max_offset;
+	kern_return_t           kr;
+	boolean_t               clear_map_aligned = FALSE;
+	vm_map_entry_t          hole_entry;
+	vm_map_size_t           chunk_size = 0;
+
+	assertf(vmk_flags.__vmkf_unused == 0, "vmk_flags unused=0x%x\n", vmk_flags.__vmkf_unused);
+
+	if (flags & VM_FLAGS_4GB_CHUNK) {
+#if defined(__LP64__)
+		chunk_size = (4ULL * 1024 * 1024 * 1024); /* max. 4GB chunks for the new allocation */
+#else /* __LP64__ */
+		chunk_size = ANON_CHUNK_SIZE;
+#endif /* __LP64__ */
+	} else {
+		chunk_size = ANON_CHUNK_SIZE;
+	}
+
+	if (superpage_size) {
+		switch (superpage_size) {
+			/*
+			 * Note that the current implementation only supports
+			 * a single size for superpages, SUPERPAGE_SIZE, per
+			 * architecture. As soon as more sizes are supposed
+			 * to be supported, SUPERPAGE_SIZE has to be replaced
+			 * with a lookup of the size depending on superpage_size.
+			 */
+#ifdef __x86_64__
+		case SUPERPAGE_SIZE_ANY:
+			/* handle it like 2 MB and round up to page size */
+			size = (size + 2 * 1024 * 1024 - 1) & ~(2 * 1024 * 1024 - 1);
+		case SUPERPAGE_SIZE_2MB:
+			break;
+#endif
+		default:
+			return KERN_INVALID_ARGUMENT;
+		}
+		mask = SUPERPAGE_SIZE - 1;
+		if (size & (SUPERPAGE_SIZE - 1)) {
+			return KERN_INVALID_ARGUMENT;
+		}
+		inheritance = VM_INHERIT_NONE;  /* fork() children won't inherit superpages */
+	}
+
+
+	if ((cur_protection & VM_PROT_WRITE) &&
+	    (cur_protection & VM_PROT_EXECUTE) &&
+#if !CONFIG_EMBEDDED
+	    map != kernel_map &&
+	    (cs_process_global_enforcement() ||
+	    (vmk_flags.vmkf_cs_enforcement_override
+	    ? vmk_flags.vmkf_cs_enforcement
+	    : cs_process_enforcement(NULL))) &&
+#endif /* !CONFIG_EMBEDDED */
+	    !entry_for_jit) {
+		DTRACE_VM3(cs_wx,
+		    uint64_t, 0,
+		    uint64_t, 0,
+		    vm_prot_t, cur_protection);
+		printf("CODE SIGNING: %d[%s] %s: curprot cannot be write+execute. "
+#if VM_PROTECT_WX_FAIL
+		    "failing\n",
+#else /* VM_PROTECT_WX_FAIL */
+		    "turning off execute\n",
+#endif /* VM_PROTECT_WX_FAIL */
+		    proc_selfpid(),
+		    (current_task()->bsd_info
+		    ? proc_name_address(current_task()->bsd_info)
+		    : "?"),
+		    __FUNCTION__);
+		cur_protection &= ~VM_PROT_EXECUTE;
+#if VM_PROTECT_WX_FAIL
+		return KERN_PROTECTION_FAILURE;
+#endif /* VM_PROTECT_WX_FAIL */
+	}
+
+	/*
+	 * If the task has requested executable lockdown,
+	 * deny any new executable mapping.
+	 */
+	if (map->map_disallow_new_exec == TRUE) {
+		if (cur_protection & VM_PROT_EXECUTE) {
+			return KERN_PROTECTION_FAILURE;
+		}
+	}
+
+	if (resilient_codesign) {
+		assert(!is_submap);
+		if ((cur_protection & (VM_PROT_WRITE | VM_PROT_EXECUTE)) ||
+		    (max_protection & (VM_PROT_WRITE | VM_PROT_EXECUTE))) {
+			return KERN_PROTECTION_FAILURE;
+		}
+	}
+
+	if (resilient_media) {
+		assert(!is_submap);
+//		assert(!needs_copy);
+		if (object != VM_OBJECT_NULL &&
+		    !object->internal) {
+			/*
+			 * This mapping is directly backed by an external
+			 * memory manager (e.g. a vnode pager for a file):
+			 * we would not have any safe place to inject
+			 * a zero-filled page if an actual page is not
+			 * available, without possibly impacting the actual
+			 * contents of the mapped object (e.g. the file),
+			 * so we can't provide any media resiliency here.
+			 */
+			return KERN_INVALID_ARGUMENT;
+		}
+	}
+
+	if (is_submap) {
+		if (purgable) {
+			/* submaps can not be purgeable */
+			return KERN_INVALID_ARGUMENT;
+		}
+		if (object == VM_OBJECT_NULL) {
+			/* submaps can not be created lazily */
+			return KERN_INVALID_ARGUMENT;
+		}
+	}
+	if (vmk_flags.vmkf_already) {
+		/*
+		 * VM_FLAGS_ALREADY says that it's OK if the same mapping
+		 * is already present.  For it to be meaningful, the requested
+		 * mapping has to be at a fixed address (!VM_FLAGS_ANYWHERE) and
+		 * we shouldn't try and remove what was mapped there first
+		 * (!VM_FLAGS_OVERWRITE).
+		 */
+		if ((flags & VM_FLAGS_ANYWHERE) ||
+		    (flags & VM_FLAGS_OVERWRITE)) {
+			return KERN_INVALID_ARGUMENT;
+		}
+	}
+
+	effective_min_offset = map->min_offset;
+
+	if (vmk_flags.vmkf_beyond_max) {
+		/*
+		 * Allow an insertion beyond the map's max offset.
+		 */
+#if     !defined(__arm__) && !defined(__arm64__)
+		if (vm_map_is_64bit(map)) {
+			effective_max_offset = 0xFFFFFFFFFFFFF000ULL;
+		} else
+#endif  /* __arm__ */
+		effective_max_offset = 0x00000000FFFFF000ULL;
+	} else {
+#if     !defined(CONFIG_EMBEDDED)
+		if (__improbable(vmk_flags.vmkf_32bit_map_va)) {
+			effective_max_offset = MIN(map->max_offset, 0x00000000FFFFF000ULL);
+		} else {
+			effective_max_offset = map->max_offset;
+		}
+#else
+		effective_max_offset = map->max_offset;
+#endif
+	}
+
+	if (size == 0 ||
+	    (offset & PAGE_MASK_64) != 0) {
+		*address = 0;
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	if (map->pmap == kernel_pmap) {
+		user_alias = VM_KERN_MEMORY_NONE;
+	} else {
+		user_alias = alias;
+	}
+
+	if (user_alias == VM_MEMORY_MALLOC_MEDIUM) {
+		chunk_size = MALLOC_MEDIUM_CHUNK_SIZE;
+	}
+
+#define RETURN(value)   { result = value; goto BailOut; }
+
+	assert(page_aligned(*address));
 	assert(page_aligned(size));
- StartAgain: ;
+
+	if (!VM_MAP_PAGE_ALIGNED(size, VM_MAP_PAGE_MASK(map))) {
+		/*
+		 * In most cases, the caller rounds the size up to the
+		 * map's page size.
+		 * If we get a size that is explicitly not map-aligned here,
+		 * we'll have to respect the caller's wish and mark the
+		 * mapping as "not map-aligned" to avoid tripping the
+		 * map alignment checks later.
+		 */
+		clear_map_aligned = TRUE;
+	}
+	if (!anywhere &&
+	    !VM_MAP_PAGE_ALIGNED(*address, VM_MAP_PAGE_MASK(map))) {
+		/*
+		 * We've been asked to map at a fixed address and that
+		 * address is not aligned to the map's specific alignment.
+		 * The caller should know what it's doing (i.e. most likely
+		 * mapping some fragmented copy map, transferring memory from
+		 * a VM map with a different alignment), so clear map_aligned
+		 * for this new VM map entry and proceed.
+		 */
+		clear_map_aligned = TRUE;
+	}
+
+	/*
+	 * Only zero-fill objects are allowed to be purgable.
+	 * LP64todo - limit purgable objects to 32-bits for now
+	 */
+	if (purgable &&
+	    (offset != 0 ||
+	    (object != VM_OBJECT_NULL &&
+	    (object->vo_size != size ||
+	    object->purgable == VM_PURGABLE_DENY))
+	    || size > ANON_MAX_SIZE)) { /* LP64todo: remove when dp capable */
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	if (!anywhere && overwrite) {
+		/*
+		 * Create a temporary VM map to hold the old mappings in the
+		 * affected area while we create the new one.
+		 * This avoids releasing the VM map lock in
+		 * vm_map_entry_delete() and allows atomicity
+		 * when we want to replace some mappings with a new one.
+		 * It also allows us to restore the old VM mappings if the
+		 * new mapping fails.
+		 */
+		zap_old_map = vm_map_create(PMAP_NULL,
+		    *address,
+		    *address + size,
+		    map->hdr.entries_pageable);
+		vm_map_set_page_shift(zap_old_map, VM_MAP_PAGE_SHIFT(map));
+		vm_map_disable_hole_optimization(zap_old_map);
+	}
+
+StartAgain:;
 
 	start = *address;
 
 	if (anywhere) {
 		vm_map_lock(map);
+		map_locked = TRUE;
+
+		if (entry_for_jit) {
+#if CONFIG_EMBEDDED
+			if (map->jit_entry_exists) {
+				result = KERN_INVALID_ARGUMENT;
+				goto BailOut;
+			}
+			random_address = TRUE;
+#endif /* CONFIG_EMBEDDED */
+		}
+
+		if (random_address) {
+			/*
+			 * Get a random start address.
+			 */
+			result = vm_map_random_address_for_size(map, address, size);
+			if (result != KERN_SUCCESS) {
+				goto BailOut;
+			}
+			start = *address;
+		}
+#if !CONFIG_EMBEDDED
+		else if ((start == 0 || start == vm_map_min(map)) &&
+		    !map->disable_vmentry_reuse &&
+		    map->vmmap_high_start != 0) {
+			start = map->vmmap_high_start;
+		}
+#endif
+
 
 		/*
 		 *	Calculate the first possible address.
 		 */
 
-		if (start < map->min_offset)
-			start = map->min_offset;
-		if (start > map->max_offset)
+		if (start < effective_min_offset) {
+			start = effective_min_offset;
+		}
+		if (start > effective_max_offset) {
 			RETURN(KERN_NO_SPACE);
+		}
 
 		/*
 		 *	Look for the first possible address;
@@ -1301,15 +2498,84 @@ vm_map_enter(
 		 *	address, we have to start after it.
 		 */
 
-		assert(first_free_is_valid(map));
-		if (start == map->min_offset) {
-			if ((entry = map->first_free) != vm_map_to_entry(map))
-				start = entry->vme_end;
+		if (map->disable_vmentry_reuse == TRUE) {
+			VM_MAP_HIGHEST_ENTRY(map, entry, start);
 		} else {
-			vm_map_entry_t	tmp_entry;
-			if (vm_map_lookup_entry(map, start, &tmp_entry))
-				start = tmp_entry->vme_end;
-			entry = tmp_entry;
+			if (map->holelistenabled) {
+				hole_entry = CAST_TO_VM_MAP_ENTRY(map->holes_list);
+
+				if (hole_entry == NULL) {
+					/*
+					 * No more space in the map?
+					 */
+					result = KERN_NO_SPACE;
+					goto BailOut;
+				} else {
+					boolean_t found_hole = FALSE;
+
+					do {
+						if (hole_entry->vme_start >= start) {
+							start = hole_entry->vme_start;
+							found_hole = TRUE;
+							break;
+						}
+
+						if (hole_entry->vme_end > start) {
+							found_hole = TRUE;
+							break;
+						}
+						hole_entry = hole_entry->vme_next;
+					} while (hole_entry != CAST_TO_VM_MAP_ENTRY(map->holes_list));
+
+					if (found_hole == FALSE) {
+						result = KERN_NO_SPACE;
+						goto BailOut;
+					}
+
+					entry = hole_entry;
+
+					if (start == 0) {
+						start += PAGE_SIZE_64;
+					}
+				}
+			} else {
+				assert(first_free_is_valid(map));
+
+				entry = map->first_free;
+
+				if (entry == vm_map_to_entry(map)) {
+					entry = NULL;
+				} else {
+					if (entry->vme_next == vm_map_to_entry(map)) {
+						/*
+						 * Hole at the end of the map.
+						 */
+						entry = NULL;
+					} else {
+						if (start < (entry->vme_next)->vme_start) {
+							start = entry->vme_end;
+							start = vm_map_round_page(start,
+							    VM_MAP_PAGE_MASK(map));
+						} else {
+							/*
+							 * Need to do a lookup.
+							 */
+							entry = NULL;
+						}
+					}
+				}
+
+				if (entry == NULL) {
+					vm_map_entry_t  tmp_entry;
+					if (vm_map_lookup_entry(map, start, &tmp_entry)) {
+						assert(!entry_for_jit);
+						start = tmp_entry->vme_end;
+						start = vm_map_round_page(start,
+						    VM_MAP_PAGE_MASK(map));
+					}
+					entry = tmp_entry;
+				}
+			}
 		}
 
 		/*
@@ -1319,61 +2585,102 @@ vm_map_enter(
 		 */
 
 		while (TRUE) {
-			register vm_map_entry_t	next;
+			vm_map_entry_t  next;
 
-		    	/*
+			/*
 			 *	Find the end of the proposed new region.
 			 *	Be sure we didn't go beyond the end, or
 			 *	wrap around the address.
 			 */
 
 			end = ((start + mask) & ~mask);
-			if (end < start)
+			end = vm_map_round_page(end,
+			    VM_MAP_PAGE_MASK(map));
+			if (end < start) {
 				RETURN(KERN_NO_SPACE);
+			}
 			start = end;
+			assert(VM_MAP_PAGE_ALIGNED(start,
+			    VM_MAP_PAGE_MASK(map)));
 			end += size;
 
-			if ((end > map->max_offset) || (end < start)) {
+			/* We want an entire page of empty space, but don't increase the allocation size. */
+			desired_empty_end = vm_map_round_page(end, VM_MAP_PAGE_MASK(map));
+
+			if ((desired_empty_end > effective_max_offset) || (desired_empty_end < start)) {
 				if (map->wait_for_space) {
-					if (size <= (map->max_offset -
-						     map->min_offset)) {
+					assert(!keep_map_locked);
+					if (size <= (effective_max_offset -
+					    effective_min_offset)) {
 						assert_wait((event_t)map,
-							    THREAD_ABORTSAFE);
+						    THREAD_ABORTSAFE);
 						vm_map_unlock(map);
-						thread_block((void (*)(void))0);
+						map_locked = FALSE;
+						thread_block(THREAD_CONTINUE_NULL);
 						goto StartAgain;
 					}
 				}
 				RETURN(KERN_NO_SPACE);
 			}
 
-			/*
-			 *	If there are no more entries, we must win.
-			 */
-
 			next = entry->vme_next;
-			if (next == vm_map_to_entry(map))
-				break;
 
-			/*
-			 *	If there is another entry, it must be
-			 *	after the end of the potential new region.
-			 */
+			if (map->holelistenabled) {
+				if (entry->vme_end >= desired_empty_end) {
+					break;
+				}
+			} else {
+				/*
+				 *	If there are no more entries, we must win.
+				 *
+				 *	OR
+				 *
+				 *	If there is another entry, it must be
+				 *	after the end of the potential new region.
+				 */
 
-			if (next->vme_start >= end)
-				break;
+				if (next == vm_map_to_entry(map)) {
+					break;
+				}
+
+				if (next->vme_start >= desired_empty_end) {
+					break;
+				}
+			}
 
 			/*
 			 *	Didn't fit -- move to the next entry.
 			 */
 
 			entry = next;
-			start = entry->vme_end;
+
+			if (map->holelistenabled) {
+				if (entry == CAST_TO_VM_MAP_ENTRY(map->holes_list)) {
+					/*
+					 * Wrapped around
+					 */
+					result = KERN_NO_SPACE;
+					goto BailOut;
+				}
+				start = entry->vme_start;
+			} else {
+				start = entry->vme_end;
+			}
+
+			start = vm_map_round_page(start,
+			    VM_MAP_PAGE_MASK(map));
+		}
+
+		if (map->holelistenabled) {
+			if (vm_map_lookup_entry(map, entry->vme_start, &entry)) {
+				panic("Found an existing entry (%p) instead of potential hole at address: 0x%llx.\n", entry, (unsigned long long)entry->vme_start);
+			}
 		}
+
 		*address = start;
+		assert(VM_MAP_PAGE_ALIGNED(*address,
+		    VM_MAP_PAGE_MASK(map)));
 	} else {
-		vm_map_entry_t		temp_entry;
-
 		/*
 		 *	Verify that:
 		 *		the address doesn't itself violate
@@ -1381,8 +2688,10 @@ vm_map_enter(
 		 */
 
 		vm_map_lock(map);
-		if ((start & mask) != 0)
+		map_locked = TRUE;
+		if ((start & mask) != 0) {
 			RETURN(KERN_NO_SPACE);
+		}
 
 		/*
 		 *	...	the address is within bounds
@@ -1390,20 +2699,106 @@ vm_map_enter(
 
 		end = start + size;
 
-		if ((start < map->min_offset) ||
-		    (end > map->max_offset) ||
+		if ((start < effective_min_offset) ||
+		    (end > effective_max_offset) ||
 		    (start >= end)) {
 			RETURN(KERN_INVALID_ADDRESS);
 		}
 
+		if (overwrite && zap_old_map != VM_MAP_NULL) {
+			int remove_flags;
+			/*
+			 * Fixed mapping and "overwrite" flag: attempt to
+			 * remove all existing mappings in the specified
+			 * address range, saving them in our "zap_old_map".
+			 */
+			remove_flags = VM_MAP_REMOVE_SAVE_ENTRIES;
+			remove_flags |= VM_MAP_REMOVE_NO_MAP_ALIGN;
+			if (vmk_flags.vmkf_overwrite_immutable) {
+				/* we can overwrite immutable mappings */
+				remove_flags |= VM_MAP_REMOVE_IMMUTABLE;
+			}
+			(void) vm_map_delete(map, start, end,
+			    remove_flags,
+			    zap_old_map);
+		}
+
 		/*
 		 *	...	the starting address isn't allocated
 		 */
 
-		if (vm_map_lookup_entry(map, start, &temp_entry))
-			RETURN(KERN_NO_SPACE);
+		if (vm_map_lookup_entry(map, start, &entry)) {
+			if (!(vmk_flags.vmkf_already)) {
+				RETURN(KERN_NO_SPACE);
+			}
+			/*
+			 * Check if what's already there is what we want.
+			 */
+			tmp_start = start;
+			tmp_offset = offset;
+			if (entry->vme_start < start) {
+				tmp_start -= start - entry->vme_start;
+				tmp_offset -= start - entry->vme_start;
+			}
+			for (; entry->vme_start < end;
+			    entry = entry->vme_next) {
+				/*
+				 * Check if the mapping's attributes
+				 * match the existing map entry.
+				 */
+				if (entry == vm_map_to_entry(map) ||
+				    entry->vme_start != tmp_start ||
+				    entry->is_sub_map != is_submap ||
+				    VME_OFFSET(entry) != tmp_offset ||
+				    entry->needs_copy != needs_copy ||
+				    entry->protection != cur_protection ||
+				    entry->max_protection != max_protection ||
+				    entry->inheritance != inheritance ||
+				    entry->iokit_acct != iokit_acct ||
+				    VME_ALIAS(entry) != alias) {
+					/* not the same mapping ! */
+					RETURN(KERN_NO_SPACE);
+				}
+				/*
+				 * Check if the same object is being mapped.
+				 */
+				if (is_submap) {
+					if (VME_SUBMAP(entry) !=
+					    (vm_map_t) object) {
+						/* not the same submap */
+						RETURN(KERN_NO_SPACE);
+					}
+				} else {
+					if (VME_OBJECT(entry) != object) {
+						/* not the same VM object... */
+						vm_object_t obj2;
+
+						obj2 = VME_OBJECT(entry);
+						if ((obj2 == VM_OBJECT_NULL ||
+						    obj2->internal) &&
+						    (object == VM_OBJECT_NULL ||
+						    object->internal)) {
+							/*
+							 * ... but both are
+							 * anonymous memory,
+							 * so equivalent.
+							 */
+						} else {
+							RETURN(KERN_NO_SPACE);
+						}
+					}
+				}
 
-		entry = temp_entry;
+				tmp_offset += entry->vme_end - entry->vme_start;
+				tmp_start += entry->vme_end - entry->vme_start;
+				if (entry->vme_end >= end) {
+					/* reached the end of our mapping */
+					break;
+				}
+			}
+			/* it all matches:  let's use what's already there ! */
+			RETURN(KERN_MEMORY_PRESENT);
+		}
 
 		/*
 		 *	...	the next region doesn't overlap the
@@ -1411,8 +2806,9 @@ vm_map_enter(
 		 */
 
 		if ((entry->vme_next != vm_map_to_entry(map)) &&
-		    (entry->vme_next->vme_start < end))
+		    (entry->vme_next->vme_start < end)) {
 			RETURN(KERN_NO_SPACE);
+		}
 	}
 
 	/*
@@ -1428,4498 +2824,9319 @@ vm_map_enter(
 	/*
 	 *	See whether we can avoid creating a new entry (and object) by
 	 *	extending one of our neighbors.  [So far, we only attempt to
-	 *	extend from below.]
+	 *	extend from below.]  Note that we can never extend/join
+	 *	purgable objects because they need to remain distinct
+	 *	entities in order to implement their "volatile object"
+	 *	semantics.
 	 */
 
-	if ((object == VM_OBJECT_NULL) &&
+	if (purgable ||
+	    entry_for_jit ||
+	    vm_memory_malloc_no_cow(user_alias)) {
+		if (object == VM_OBJECT_NULL) {
+			object = vm_object_allocate(size);
+			object->copy_strategy = MEMORY_OBJECT_COPY_NONE;
+			object->true_share = FALSE;
+			if (purgable) {
+				task_t owner;
+				object->purgable = VM_PURGABLE_NONVOLATILE;
+				if (map->pmap == kernel_pmap) {
+					/*
+					 * Purgeable mappings made in a kernel
+					 * map are "owned" by the kernel itself
+					 * rather than the current user task
+					 * because they're likely to be used by
+					 * more than this user task (see
+					 * execargs_purgeable_allocate(), for
+					 * example).
+					 */
+					owner = kernel_task;
+				} else {
+					owner = current_task();
+				}
+				assert(object->vo_owner == NULL);
+				assert(object->resident_page_count == 0);
+				assert(object->wired_page_count == 0);
+				vm_object_lock(object);
+				vm_purgeable_nonvolatile_enqueue(object, owner);
+				vm_object_unlock(object);
+			}
+			offset = (vm_object_offset_t)0;
+		}
+	} else if ((is_submap == FALSE) &&
+	    (object == VM_OBJECT_NULL) &&
 	    (entry != vm_map_to_entry(map)) &&
 	    (entry->vme_end == start) &&
 	    (!entry->is_shared) &&
 	    (!entry->is_sub_map) &&
-	    (entry->alias == alias) &&
-	    (entry->inheritance == inheritance) &&
+	    (!entry->in_transition) &&
+	    (!entry->needs_wakeup) &&
+	    (entry->behavior == VM_BEHAVIOR_DEFAULT) &&
 	    (entry->protection == cur_protection) &&
 	    (entry->max_protection == max_protection) &&
-	    (entry->behavior == VM_BEHAVIOR_DEFAULT) &&
-	    (entry->in_transition == 0) &&
-	    ((entry->vme_end - entry->vme_start) + size < NO_COALESCE_LIMIT) &&
-	    (entry->wired_count == 0)) { /* implies user_wired_count == 0 */
-		if (vm_object_coalesce(entry->object.vm_object,
-				VM_OBJECT_NULL,
-				entry->offset,
-				(vm_object_offset_t) 0,
-				(vm_size_t)(entry->vme_end - entry->vme_start),
-				(vm_size_t)(end - entry->vme_end))) {
-
+	    (entry->inheritance == inheritance) &&
+	    ((user_alias == VM_MEMORY_REALLOC) ||
+	    (VME_ALIAS(entry) == alias)) &&
+	    (entry->no_cache == no_cache) &&
+	    (entry->permanent == permanent) &&
+	    /* no coalescing for immutable executable mappings */
+	    !((entry->protection & VM_PROT_EXECUTE) &&
+	    entry->permanent) &&
+	    (!entry->superpage_size && !superpage_size) &&
+	    /*
+	     * No coalescing if not map-aligned, to avoid propagating
+	     * that condition any further than needed:
+	     */
+	    (!entry->map_aligned || !clear_map_aligned) &&
+	    (!entry->zero_wired_pages) &&
+	    (!entry->used_for_jit && !entry_for_jit) &&
+	    (!entry->pmap_cs_associated) &&
+	    (entry->iokit_acct == iokit_acct) &&
+	    (!entry->vme_resilient_codesign) &&
+	    (!entry->vme_resilient_media) &&
+	    (!entry->vme_atomic) &&
+	    (entry->vme_no_copy_on_read == no_copy_on_read) &&
+
+	    ((entry->vme_end - entry->vme_start) + size <=
+	    (user_alias == VM_MEMORY_REALLOC ?
+	    ANON_CHUNK_SIZE :
+	    NO_COALESCE_LIMIT)) &&
+
+	    (entry->wired_count == 0)) {        /* implies user_wired_count == 0 */
+		if (vm_object_coalesce(VME_OBJECT(entry),
+		    VM_OBJECT_NULL,
+		    VME_OFFSET(entry),
+		    (vm_object_offset_t) 0,
+		    (vm_map_size_t)(entry->vme_end - entry->vme_start),
+		    (vm_map_size_t)(end - entry->vme_end))) {
 			/*
 			 *	Coalesced the two objects - can extend
 			 *	the previous map entry to include the
 			 *	new range.
 			 */
 			map->size += (end - entry->vme_end);
+			assert(entry->vme_start < end);
+			assert(VM_MAP_PAGE_ALIGNED(end,
+			    VM_MAP_PAGE_MASK(map)));
+			if (__improbable(vm_debug_events)) {
+				DTRACE_VM5(map_entry_extend, vm_map_t, map, vm_map_entry_t, entry, vm_address_t, entry->vme_start, vm_address_t, entry->vme_end, vm_address_t, end);
+			}
 			entry->vme_end = end;
-			UPDATE_FIRST_FREE(map, map->first_free);
+			if (map->holelistenabled) {
+				vm_map_store_update_first_free(map, entry, TRUE);
+			} else {
+				vm_map_store_update_first_free(map, map->first_free, TRUE);
+			}
+			new_mapping_established = TRUE;
 			RETURN(KERN_SUCCESS);
 		}
 	}
 
-	/*
-	 *	Create a new entry
-	 */
+	step = superpage_size ? SUPERPAGE_SIZE : (end - start);
+	new_entry = NULL;
+
+	for (tmp2_start = start; tmp2_start < end; tmp2_start += step) {
+		tmp2_end = tmp2_start + step;
+		/*
+		 *	Create a new entry
+		 *
+		 * XXX FBDP
+		 * The reserved "page zero" in each process's address space can
+		 * be arbitrarily large.  Splitting it into separate objects and
+		 * therefore different VM map entries serves no purpose and just
+		 * slows down operations on the VM map, so let's not split the
+		 * allocation into chunks if the max protection is NONE.  That
+		 * memory should never be accessible, so it will never get to the
+		 * default pager.
+		 */
+		tmp_start = tmp2_start;
+		if (object == VM_OBJECT_NULL &&
+		    size > chunk_size &&
+		    max_protection != VM_PROT_NONE &&
+		    superpage_size == 0) {
+			tmp_end = tmp_start + chunk_size;
+		} else {
+			tmp_end = tmp2_end;
+		}
+		do {
+			new_entry = vm_map_entry_insert(
+				map, entry, tmp_start, tmp_end,
+				object, offset, needs_copy,
+				FALSE, FALSE,
+				cur_protection, max_protection,
+				VM_BEHAVIOR_DEFAULT,
+				(entry_for_jit)? VM_INHERIT_NONE: inheritance,
+				0,
+				no_cache,
+				permanent,
+				no_copy_on_read,
+				superpage_size,
+				clear_map_aligned,
+				is_submap,
+				entry_for_jit,
+				alias);
+
+			assert((object != kernel_object) || (VM_KERN_MEMORY_NONE != alias));
+
+			if (resilient_codesign &&
+			    !((cur_protection | max_protection) &
+			    (VM_PROT_WRITE | VM_PROT_EXECUTE))) {
+				new_entry->vme_resilient_codesign = TRUE;
+			}
 
-	{ /**/
-	register vm_map_entry_t	new_entry;
+			if (resilient_media &&
+			    (object == VM_OBJECT_NULL ||
+			    object->internal)) {
+				new_entry->vme_resilient_media = TRUE;
+			}
 
-	new_entry = vm_map_entry_insert(map, entry, start, end, object,
-					offset, needs_copy, FALSE, FALSE,
-					cur_protection, max_protection,
-					VM_BEHAVIOR_DEFAULT, inheritance, 0);
-	new_entry->alias = alias;
-	vm_map_unlock(map);
+			assert(!new_entry->iokit_acct);
+			if (!is_submap &&
+			    object != VM_OBJECT_NULL &&
+			    (object->purgable != VM_PURGABLE_DENY ||
+			    object->vo_ledger_tag)) {
+				assert(new_entry->use_pmap);
+				assert(!new_entry->iokit_acct);
+				/*
+				 * Turn off pmap accounting since
+				 * purgeable (or tagged) objects have their
+				 * own ledgers.
+				 */
+				new_entry->use_pmap = FALSE;
+			} else if (!is_submap &&
+			    iokit_acct &&
+			    object != VM_OBJECT_NULL &&
+			    object->internal) {
+				/* alternate accounting */
+				assert(!new_entry->iokit_acct);
+				assert(new_entry->use_pmap);
+				new_entry->iokit_acct = TRUE;
+				new_entry->use_pmap = FALSE;
+				DTRACE_VM4(
+					vm_map_iokit_mapped_region,
+					vm_map_t, map,
+					vm_map_offset_t, new_entry->vme_start,
+					vm_map_offset_t, new_entry->vme_end,
+					int, VME_ALIAS(new_entry));
+				vm_map_iokit_mapped_region(
+					map,
+					(new_entry->vme_end -
+					new_entry->vme_start));
+			} else if (!is_submap) {
+				assert(!new_entry->iokit_acct);
+				assert(new_entry->use_pmap);
+			}
 
-	/*	Wire down the new entry if the user
-	 *	requested all new map entries be wired.
-	 */
-	if (map->wiring_required) {
-		result = vm_map_wire(map, start, end,
-				    new_entry->protection, TRUE);
-		return(result);
-	}
+			if (is_submap) {
+				vm_map_t        submap;
+				boolean_t       submap_is_64bit;
+				boolean_t       use_pmap;
+
+				assert(new_entry->is_sub_map);
+				assert(!new_entry->use_pmap);
+				assert(!new_entry->iokit_acct);
+				submap = (vm_map_t) object;
+				submap_is_64bit = vm_map_is_64bit(submap);
+				use_pmap = vmk_flags.vmkf_nested_pmap;
+#ifndef NO_NESTED_PMAP
+				if (use_pmap && submap->pmap == NULL) {
+					ledger_t ledger = map->pmap->ledger;
+					/* we need a sub pmap to nest... */
+					submap->pmap = pmap_create_options(ledger, 0,
+					    submap_is_64bit ? PMAP_CREATE_64BIT : 0);
+					if (submap->pmap == NULL) {
+						/* let's proceed without nesting... */
+					}
+#if     defined(__arm__) || defined(__arm64__)
+					else {
+						pmap_set_nested(submap->pmap);
+					}
+#endif
+				}
+				if (use_pmap && submap->pmap != NULL) {
+					kr = pmap_nest(map->pmap,
+					    submap->pmap,
+					    tmp_start,
+					    tmp_start,
+					    tmp_end - tmp_start);
+					if (kr != KERN_SUCCESS) {
+						printf("vm_map_enter: "
+						    "pmap_nest(0x%llx,0x%llx) "
+						    "error 0x%x\n",
+						    (long long)tmp_start,
+						    (long long)tmp_end,
+						    kr);
+					} else {
+						/* we're now nested ! */
+						new_entry->use_pmap = TRUE;
+						pmap_empty = FALSE;
+					}
+				}
+#endif /* NO_NESTED_PMAP */
+			}
+			entry = new_entry;
+
+			if (superpage_size) {
+				vm_page_t pages, m;
+				vm_object_t sp_object;
+				vm_object_offset_t sp_offset;
+
+				VME_OFFSET_SET(entry, 0);
+
+				/* allocate one superpage */
+				kr = cpm_allocate(SUPERPAGE_SIZE, &pages, 0, SUPERPAGE_NBASEPAGES - 1, TRUE, 0);
+				if (kr != KERN_SUCCESS) {
+					/* deallocate whole range... */
+					new_mapping_established = TRUE;
+					/* ... but only up to "tmp_end" */
+					size -= end - tmp_end;
+					RETURN(kr);
+				}
 
-	if ((object != VM_OBJECT_NULL) &&
-	    (vm_map_pmap_enter_enable) &&
-	    (!anywhere)	 &&
-	    (!needs_copy) && 
-	    (size < (128*1024))) {
-		vm_map_pmap_enter(map, start, end, 
-				  object, offset, cur_protection);
+				/* create one vm_object per superpage */
+				sp_object = vm_object_allocate((vm_map_size_t)(entry->vme_end - entry->vme_start));
+				sp_object->phys_contiguous = TRUE;
+				sp_object->vo_shadow_offset = (vm_object_offset_t)VM_PAGE_GET_PHYS_PAGE(pages) * PAGE_SIZE;
+				VME_OBJECT_SET(entry, sp_object);
+				assert(entry->use_pmap);
+
+				/* enter the base pages into the object */
+				vm_object_lock(sp_object);
+				for (sp_offset = 0;
+				    sp_offset < SUPERPAGE_SIZE;
+				    sp_offset += PAGE_SIZE) {
+					m = pages;
+					pmap_zero_page(VM_PAGE_GET_PHYS_PAGE(m));
+					pages = NEXT_PAGE(m);
+					*(NEXT_PAGE_PTR(m)) = VM_PAGE_NULL;
+					vm_page_insert_wired(m, sp_object, sp_offset, VM_KERN_MEMORY_OSFMK);
+				}
+				vm_object_unlock(sp_object);
+			}
+		} while (tmp_end != tmp2_end &&
+		    (tmp_start = tmp_end) &&
+		    (tmp_end = (tmp2_end - tmp_end > chunk_size) ?
+		    tmp_end + chunk_size : tmp2_end));
 	}
 
-	return(result);
-	} /**/
+	new_mapping_established = TRUE;
 
- BailOut: ;
-	vm_map_unlock(map);
-	return(result);
+BailOut:
+	assert(map_locked == TRUE);
 
-#undef	RETURN
-}
+	if (result == KERN_SUCCESS) {
+		vm_prot_t pager_prot;
+		memory_object_t pager;
+
+#if DEBUG
+		if (pmap_empty &&
+		    !(vmk_flags.vmkf_no_pmap_check)) {
+			assert(vm_map_pmap_is_empty(map,
+			    *address,
+			    *address + size));
+		}
+#endif /* DEBUG */
 
-/*
- *	vm_map_clip_start:	[ internal use only ]
- *
- *	Asserts that the given entry begins at or after
- *	the specified address; if necessary,
- *	it splits the entry into two.
- */
-#ifndef i386
-#define vm_map_clip_start(map, entry, startaddr) 			\
-MACRO_BEGIN 								\
-	vm_map_t VMCS_map;						\
-	vm_map_entry_t VMCS_entry;					\
-	vm_offset_t VMCS_startaddr;					\
-	VMCS_map = (map);						\
-	VMCS_entry = (entry);						\
-	VMCS_startaddr = (startaddr);					\
-	if (VMCS_startaddr > VMCS_entry->vme_start) { 			\
-		if(entry->use_pmap) {					\
-	   		vm_offset_t	pmap_base_addr;			\
-	   		vm_offset_t	pmap_end_addr;			\
-									\
-	   		pmap_base_addr = 0xF0000000 & entry->vme_start;	\
-	   		pmap_end_addr = (pmap_base_addr + 0x10000000) - 1; \
-   	   		pmap_unnest(map->pmap, pmap_base_addr,		\
-			       	(pmap_end_addr - pmap_base_addr) + 1);	\
-			entry->use_pmap = FALSE;			\
-		}							\
-		_vm_map_clip_start(&VMCS_map->hdr,VMCS_entry,VMCS_startaddr);\
-	}								\
-	UPDATE_FIRST_FREE(VMCS_map, VMCS_map->first_free);		\
-MACRO_END
-#else
-#define vm_map_clip_start(map, entry, startaddr) 			\
-MACRO_BEGIN 								\
-	vm_map_t VMCS_map;						\
-	vm_map_entry_t VMCS_entry;					\
-	vm_offset_t VMCS_startaddr;					\
-	VMCS_map = (map);						\
-	VMCS_entry = (entry);						\
-	VMCS_startaddr = (startaddr);					\
-	if (VMCS_startaddr > VMCS_entry->vme_start) { 			\
-		_vm_map_clip_start(&VMCS_map->hdr,VMCS_entry,VMCS_startaddr);\
-	}								\
-	UPDATE_FIRST_FREE(VMCS_map, VMCS_map->first_free);		\
-MACRO_END
-#endif
+		/*
+		 * For "named" VM objects, let the pager know that the
+		 * memory object is being mapped.  Some pagers need to keep
+		 * track of this, to know when they can reclaim the memory
+		 * object, for example.
+		 * VM calls memory_object_map() for each mapping (specifying
+		 * the protection of each mapping) and calls
+		 * memory_object_last_unmap() when all the mappings are gone.
+		 */
+		pager_prot = max_protection;
+		if (needs_copy) {
+			/*
+			 * Copy-On-Write mapping: won't modify
+			 * the memory object.
+			 */
+			pager_prot &= ~VM_PROT_WRITE;
+		}
+		if (!is_submap &&
+		    object != VM_OBJECT_NULL &&
+		    object->named &&
+		    object->pager != MEMORY_OBJECT_NULL) {
+			vm_object_lock(object);
+			pager = object->pager;
+			if (object->named &&
+			    pager != MEMORY_OBJECT_NULL) {
+				assert(object->pager_ready);
+				vm_object_mapping_wait(object, THREAD_UNINT);
+				vm_object_mapping_begin(object);
+				vm_object_unlock(object);
 
-#define vm_map_copy_clip_start(copy, entry, startaddr) \
-	MACRO_BEGIN \
-	if ((startaddr) > (entry)->vme_start) \
-		_vm_map_clip_start(&(copy)->cpy_hdr,(entry),(startaddr)); \
-	MACRO_END
+				kr = memory_object_map(pager, pager_prot);
+				assert(kr == KERN_SUCCESS);
 
-/*
- *	This routine is called only when it is known that
- *	the entry must be split.
- */
-void
-_vm_map_clip_start(
-	register struct vm_map_header	*map_header,
-	register vm_map_entry_t		entry,
-	register vm_offset_t		start)
-{
-	register vm_map_entry_t	new_entry;
-
-	/*
-	 *	Split off the front portion --
-	 *	note that we must insert the new
-	 *	entry BEFORE this one, so that
-	 *	this entry has the specified starting
-	 *	address.
-	 */
-
-	new_entry = _vm_map_entry_create(map_header);
-	vm_map_entry_copy_full(new_entry, entry);
-
-	new_entry->vme_end = start;
-	entry->offset += (start - entry->vme_start);
-	entry->vme_start = start;
-
-	_vm_map_entry_link(map_header, entry->vme_prev, new_entry);
-
-	if (entry->is_sub_map)
-	 	vm_map_reference(new_entry->object.sub_map);
-	else
-		vm_object_reference(new_entry->object.vm_object);
-}
-
-
-/*
- *	vm_map_clip_end:	[ internal use only ]
- *
- *	Asserts that the given entry ends at or before
- *	the specified address; if necessary,
- *	it splits the entry into two.
- */
-#ifndef i386
-#define vm_map_clip_end(map, entry, endaddr) 				\
-MACRO_BEGIN 								\
-	vm_map_t VMCE_map;						\
-	vm_map_entry_t VMCE_entry;					\
-	vm_offset_t VMCE_endaddr;					\
-	VMCE_map = (map);						\
-	VMCE_entry = (entry);						\
-	VMCE_endaddr = (endaddr);					\
-	if (VMCE_endaddr < VMCE_entry->vme_end) { 			\
-		if(entry->use_pmap) {					\
-	   		vm_offset_t	pmap_base_addr;			\
-	   		vm_offset_t	pmap_end_addr;			\
-									\
-	   		pmap_base_addr = 0xF0000000 & entry->vme_start;	\
-	   		pmap_end_addr = (pmap_base_addr + 0x10000000) - 1; \
-   	   		pmap_unnest(map->pmap, pmap_base_addr,		\
-			       	(pmap_end_addr - pmap_base_addr) + 1);	\
-			entry->use_pmap = FALSE;			\
-		}							\
-		_vm_map_clip_end(&VMCE_map->hdr,VMCE_entry,VMCE_endaddr); \
-	}								\
-	UPDATE_FIRST_FREE(VMCE_map, VMCE_map->first_free);		\
-MACRO_END
-#else
-#define vm_map_clip_end(map, entry, endaddr) 				\
-MACRO_BEGIN 								\
-	vm_map_t VMCE_map;						\
-	vm_map_entry_t VMCE_entry;					\
-	vm_offset_t VMCE_endaddr;					\
-	VMCE_map = (map);						\
-	VMCE_entry = (entry);						\
-	VMCE_endaddr = (endaddr);					\
-	if (VMCE_endaddr < VMCE_entry->vme_end) { 			\
-		_vm_map_clip_end(&VMCE_map->hdr,VMCE_entry,VMCE_endaddr); \
-	}								\
-	UPDATE_FIRST_FREE(VMCE_map, VMCE_map->first_free);		\
-MACRO_END
-#endif
+				vm_object_lock(object);
+				vm_object_mapping_end(object);
+			}
+			vm_object_unlock(object);
+		}
+	}
 
-#define vm_map_copy_clip_end(copy, entry, endaddr) \
-	MACRO_BEGIN \
-	if ((endaddr) < (entry)->vme_end) \
-		_vm_map_clip_end(&(copy)->cpy_hdr,(entry),(endaddr)); \
-	MACRO_END
+	assert(map_locked == TRUE);
 
-/*
- *	This routine is called only when it is known that
- *	the entry must be split.
- */
-void
-_vm_map_clip_end(
-	register struct vm_map_header	*map_header,
-	register vm_map_entry_t		entry,
-	register vm_offset_t		end)
-{
-	register vm_map_entry_t	new_entry;
+	if (!keep_map_locked) {
+		vm_map_unlock(map);
+		map_locked = FALSE;
+	}
 
 	/*
-	 *	Create a new entry and insert it
-	 *	AFTER the specified entry
+	 * We can't hold the map lock if we enter this block.
 	 */
 
-	new_entry = _vm_map_entry_create(map_header);
-	vm_map_entry_copy_full(new_entry, entry);
-
-	new_entry->vme_start = entry->vme_end = end;
-	new_entry->offset += (end - entry->vme_start);
+	if (result == KERN_SUCCESS) {
+		/*	Wire down the new entry if the user
+		 *	requested all new map entries be wired.
+		 */
+		if ((map->wiring_required) || (superpage_size)) {
+			assert(!keep_map_locked);
+			pmap_empty = FALSE; /* pmap won't be empty */
+			kr = vm_map_wire_kernel(map, start, end,
+			    new_entry->protection, VM_KERN_MEMORY_MLOCK,
+			    TRUE);
+			result = kr;
+		}
 
-	_vm_map_entry_link(map_header, entry, new_entry);
+	}
 
-	if (entry->is_sub_map)
-	 	vm_map_reference(new_entry->object.sub_map);
-	else
-		vm_object_reference(new_entry->object.vm_object);
-}
+	if (result != KERN_SUCCESS) {
+		if (new_mapping_established) {
+			/*
+			 * We have to get rid of the new mappings since we
+			 * won't make them available to the user.
+			 * Try to do that atomically, to minimize the risk
+			 * that someone else creates new mappings in that range.
+			 */
+			zap_new_map = vm_map_create(PMAP_NULL,
+			    *address,
+			    *address + size,
+			    map->hdr.entries_pageable);
+			vm_map_set_page_shift(zap_new_map,
+			    VM_MAP_PAGE_SHIFT(map));
+			vm_map_disable_hole_optimization(zap_new_map);
+
+			if (!map_locked) {
+				vm_map_lock(map);
+				map_locked = TRUE;
+			}
+			(void) vm_map_delete(map, *address, *address + size,
+			    (VM_MAP_REMOVE_SAVE_ENTRIES |
+			    VM_MAP_REMOVE_NO_MAP_ALIGN),
+			    zap_new_map);
+		}
+		if (zap_old_map != VM_MAP_NULL &&
+		    zap_old_map->hdr.nentries != 0) {
+			vm_map_entry_t  entry1, entry2;
 
+			/*
+			 * The new mapping failed.  Attempt to restore
+			 * the old mappings, saved in the "zap_old_map".
+			 */
+			if (!map_locked) {
+				vm_map_lock(map);
+				map_locked = TRUE;
+			}
 
-/*
- *	VM_MAP_RANGE_CHECK:	[ internal use only ]
- *
- *	Asserts that the starting and ending region
- *	addresses fall within the valid range of the map.
- */
-#define	VM_MAP_RANGE_CHECK(map, start, end)		\
-		{					\
-		if (start < vm_map_min(map))		\
-			start = vm_map_min(map);	\
-		if (end > vm_map_max(map))		\
-			end = vm_map_max(map);		\
-		if (start > end)			\
-			start = end;			\
+			/* first check if the coast is still clear */
+			start = vm_map_first_entry(zap_old_map)->vme_start;
+			end = vm_map_last_entry(zap_old_map)->vme_end;
+			if (vm_map_lookup_entry(map, start, &entry1) ||
+			    vm_map_lookup_entry(map, end, &entry2) ||
+			    entry1 != entry2) {
+				/*
+				 * Part of that range has already been
+				 * re-mapped:  we can't restore the old
+				 * mappings...
+				 */
+				vm_map_enter_restore_failures++;
+			} else {
+				/*
+				 * Transfer the saved map entries from
+				 * "zap_old_map" to the original "map",
+				 * inserting them all after "entry1".
+				 */
+				for (entry2 = vm_map_first_entry(zap_old_map);
+				    entry2 != vm_map_to_entry(zap_old_map);
+				    entry2 = vm_map_first_entry(zap_old_map)) {
+					vm_map_size_t entry_size;
+
+					entry_size = (entry2->vme_end -
+					    entry2->vme_start);
+					vm_map_store_entry_unlink(zap_old_map,
+					    entry2);
+					zap_old_map->size -= entry_size;
+					vm_map_store_entry_link(map, entry1, entry2,
+					    VM_MAP_KERNEL_FLAGS_NONE);
+					map->size += entry_size;
+					entry1 = entry2;
+				}
+				if (map->wiring_required) {
+					/*
+					 * XXX TODO: we should rewire the
+					 * old pages here...
+					 */
+				}
+				vm_map_enter_restore_successes++;
+			}
 		}
-
-/*
- *	vm_map_range_check:	[ internal use only ]
- *	
- *	Check that the region defined by the specified start and
- *	end addresses are wholly contained within a single map
- *	entry or set of adjacent map entries of the spacified map,
- *	i.e. the specified region contains no unmapped space.
- *	If any or all of the region is unmapped, FALSE is returned.
- *	Otherwise, TRUE is returned and if the output argument 'entry'
- *	is not NULL it points to the map entry containing the start
- *	of the region.
- *
- *	The map is locked for reading on entry and is left locked.
- */
-boolean_t
-vm_map_range_check(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	vm_map_entry_t		*entry)
-{
-	vm_map_entry_t		cur;
-	register vm_offset_t	prev;
+	}
 
 	/*
-	 * 	Basic sanity checks first
+	 * The caller is responsible for releasing the lock if it requested to
+	 * keep the map locked.
 	 */
-	if (start < vm_map_min(map) || end > vm_map_max(map) || start > end)
-		return (FALSE);
+	if (map_locked && !keep_map_locked) {
+		vm_map_unlock(map);
+	}
 
 	/*
-	 * 	Check first if the region starts within a valid
-	 *	mapping for the map.
+	 * Get rid of the "zap_maps" and all the map entries that
+	 * they may still contain.
 	 */
-	if (!vm_map_lookup_entry(map, start, &cur))
-		return (FALSE);
+	if (zap_old_map != VM_MAP_NULL) {
+		vm_map_destroy(zap_old_map, VM_MAP_REMOVE_NO_PMAP_CLEANUP);
+		zap_old_map = VM_MAP_NULL;
+	}
+	if (zap_new_map != VM_MAP_NULL) {
+		vm_map_destroy(zap_new_map, VM_MAP_REMOVE_NO_PMAP_CLEANUP);
+		zap_new_map = VM_MAP_NULL;
+	}
 
-	/*
-	 *	Optimize for the case that the region is contained 
-	 *	in a single map entry.
-	 */
-	if (entry != (vm_map_entry_t *) NULL)
-		*entry = cur;
-	if (end <= cur->vme_end)
-		return (TRUE);
+	return result;
 
-	/*
-	 * 	If the region is not wholly contained within a
-	 * 	single entry, walk the entries looking for holes.
-	 */
-	prev = cur->vme_end;
-	cur = cur->vme_next;
-	while ((cur != vm_map_to_entry(map)) && (prev == cur->vme_start)) {
-		if (end <= cur->vme_end)
-			return (TRUE);
-		prev = cur->vme_end;
-		cur = cur->vme_next;
-	}
-	return (FALSE);
+#undef  RETURN
 }
 
-/*
- *	vm_map_submap:		[ kernel use only ]
- *
- *	Mark the given range as handled by a subordinate map.
- *
- *	This range must have been created with vm_map_find using
- *	the vm_submap_object, and no other operations may have been
- *	performed on this range prior to calling vm_map_submap.
- *
- *	Only a limited number of operations can be performed
- *	within this rage after calling vm_map_submap:
- *		vm_fault
- *	[Don't try vm_map_copyin!]
- *
- *	To remove a submapping, one must first remove the
- *	range from the superior map, and then destroy the
- *	submap (if desired).  [Better yet, don't try it.]
- */
+#if __arm64__
+extern const struct memory_object_pager_ops fourk_pager_ops;
 kern_return_t
-vm_map_submap(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	vm_map_t		submap,
-	vm_offset_t		offset,
-	boolean_t		use_pmap)
+vm_map_enter_fourk(
+	vm_map_t                map,
+	vm_map_offset_t         *address,       /* IN/OUT */
+	vm_map_size_t           size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                alias,
+	vm_object_t             object,
+	vm_object_offset_t      offset,
+	boolean_t               needs_copy,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_inherit_t            inheritance)
 {
-	vm_map_entry_t		entry;
-	register kern_return_t	result = KERN_INVALID_ARGUMENT;
-	register vm_object_t	object;
-
-	vm_map_lock(map);
-
-	VM_MAP_RANGE_CHECK(map, start, end);
-
-	if (vm_map_lookup_entry(map, start, &entry)) {
-		vm_map_clip_start(map, entry, start);
+	vm_map_entry_t          entry, new_entry;
+	vm_map_offset_t         start, fourk_start;
+	vm_map_offset_t         end, fourk_end;
+	vm_map_size_t           fourk_size;
+	kern_return_t           result = KERN_SUCCESS;
+	vm_map_t                zap_old_map = VM_MAP_NULL;
+	vm_map_t                zap_new_map = VM_MAP_NULL;
+	boolean_t               map_locked = FALSE;
+	boolean_t               pmap_empty = TRUE;
+	boolean_t               new_mapping_established = FALSE;
+	boolean_t               keep_map_locked = vmk_flags.vmkf_keep_map_locked;
+	boolean_t               anywhere = ((flags & VM_FLAGS_ANYWHERE) != 0);
+	boolean_t               purgable = ((flags & VM_FLAGS_PURGABLE) != 0);
+	boolean_t               overwrite = ((flags & VM_FLAGS_OVERWRITE) != 0);
+	boolean_t               no_cache = ((flags & VM_FLAGS_NO_CACHE) != 0);
+	boolean_t               is_submap = vmk_flags.vmkf_submap;
+	boolean_t               permanent = vmk_flags.vmkf_permanent;
+	boolean_t               no_copy_on_read = vmk_flags.vmkf_permanent;
+	boolean_t               entry_for_jit = vmk_flags.vmkf_map_jit;
+//	boolean_t		iokit_acct = vmk_flags.vmkf_iokit_acct;
+	unsigned int            superpage_size = ((flags & VM_FLAGS_SUPERPAGE_MASK) >> VM_FLAGS_SUPERPAGE_SHIFT);
+	vm_map_offset_t         effective_min_offset, effective_max_offset;
+	kern_return_t           kr;
+	boolean_t               clear_map_aligned = FALSE;
+	memory_object_t         fourk_mem_obj;
+	vm_object_t             fourk_object;
+	vm_map_offset_t         fourk_pager_offset;
+	int                     fourk_pager_index_start, fourk_pager_index_num;
+	int                     cur_idx;
+	boolean_t               fourk_copy;
+	vm_object_t             copy_object;
+	vm_object_offset_t      copy_offset;
+
+	fourk_mem_obj = MEMORY_OBJECT_NULL;
+	fourk_object = VM_OBJECT_NULL;
+
+	if (superpage_size) {
+		return KERN_NOT_SUPPORTED;
 	}
-	else
-		entry = entry->vme_next;
 
-	if(entry == vm_map_to_entry(map)) {
-		vm_map_unlock(map);
-		return KERN_INVALID_ARGUMENT;
+	if ((cur_protection & VM_PROT_WRITE) &&
+	    (cur_protection & VM_PROT_EXECUTE) &&
+#if !CONFIG_EMBEDDED
+	    map != kernel_map &&
+	    cs_process_enforcement(NULL) &&
+#endif /* !CONFIG_EMBEDDED */
+	    !entry_for_jit) {
+		DTRACE_VM3(cs_wx,
+		    uint64_t, 0,
+		    uint64_t, 0,
+		    vm_prot_t, cur_protection);
+		printf("CODE SIGNING: %d[%s] %s: curprot cannot be write+execute. "
+		    "turning off execute\n",
+		    proc_selfpid(),
+		    (current_task()->bsd_info
+		    ? proc_name_address(current_task()->bsd_info)
+		    : "?"),
+		    __FUNCTION__);
+		cur_protection &= ~VM_PROT_EXECUTE;
 	}
 
-	vm_map_clip_end(map, entry, end);
-
-	if ((entry->vme_start == start) && (entry->vme_end == end) &&
-	    (!entry->is_sub_map) &&
-	    ((object = entry->object.vm_object) == vm_submap_object) &&
-	    (object->resident_page_count == 0) &&
-	    (object->copy == VM_OBJECT_NULL) &&
-	    (object->shadow == VM_OBJECT_NULL) &&
-	    (!object->pager_created)) {
-		entry->offset = (vm_object_offset_t)offset;
-		entry->object.vm_object = VM_OBJECT_NULL;
-		vm_object_deallocate(object);
-		entry->is_sub_map = TRUE;
-		vm_map_reference(entry->object.sub_map = submap);
-#ifndef i386
-		if ((use_pmap) && (offset == 0)) {
-			/* nest if platform code will allow */
-			result = pmap_nest(map->pmap, (entry->object.sub_map)->pmap, 
-							start, end - start);
-			if(result)
-				panic("pmap_nest failed!");
-			entry->use_pmap = TRUE;
+	/*
+	 * If the task has requested executable lockdown,
+	 * deny any new executable mapping.
+	 */
+	if (map->map_disallow_new_exec == TRUE) {
+		if (cur_protection & VM_PROT_EXECUTE) {
+			return KERN_PROTECTION_FAILURE;
 		}
-#endif
-#ifdef i386
-		pmap_remove(map->pmap, start, end);
-#endif
-		result = KERN_SUCCESS;
 	}
-	vm_map_unlock(map);
 
-	return(result);
-}
+	if (is_submap) {
+		return KERN_NOT_SUPPORTED;
+	}
+	if (vmk_flags.vmkf_already) {
+		return KERN_NOT_SUPPORTED;
+	}
+	if (purgable || entry_for_jit) {
+		return KERN_NOT_SUPPORTED;
+	}
 
-/*
- *	vm_map_protect:
- *
- *	Sets the protection of the specified address
- *	region in the target map.  If "set_max" is
- *	specified, the maximum protection is to be set;
- *	otherwise, only the current protection is affected.
- */
-kern_return_t
-vm_map_protect(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	register vm_prot_t	new_prot,
-	register boolean_t	set_max)
-{
-	register vm_map_entry_t		current;
-	register vm_offset_t		prev;
-	vm_map_entry_t			entry;
-	vm_prot_t			new_max;
-	boolean_t			clip;
-
-	XPR(XPR_VM_MAP,
-		"vm_map_protect, 0x%X start 0x%X end 0x%X, new 0x%X %d",
-		(integer_t)map, start, end, new_prot, set_max);
+	effective_min_offset = map->min_offset;
 
-	vm_map_lock(map);
+	if (vmk_flags.vmkf_beyond_max) {
+		return KERN_NOT_SUPPORTED;
+	} else {
+		effective_max_offset = map->max_offset;
+	}
 
-	/*
-	 * 	Lookup the entry.  If it doesn't start in a valid
-	 *	entry, return an error.  Remember if we need to
-	 *	clip the entry.  We don't do it here because we don't
-	 *	want to make any changes until we've scanned the 
-	 *	entire range below for address and protection
-	 *	violations.
-	 */
-	if (!(clip = vm_map_lookup_entry(map, start, &entry))) {
-		vm_map_unlock(map);
-		return(KERN_INVALID_ADDRESS);
+	if (size == 0 ||
+	    (offset & FOURK_PAGE_MASK) != 0) {
+		*address = 0;
+		return KERN_INVALID_ARGUMENT;
 	}
 
-	/*
-	 *	Make a first pass to check for protection and address
-	 *	violations.
-	 */
+#define RETURN(value)   { result = value; goto BailOut; }
 
-	current = entry;
-	prev = current->vme_start;
-	while ((current != vm_map_to_entry(map)) &&
-	       (current->vme_start < end)) {
+	assert(VM_MAP_PAGE_ALIGNED(*address, FOURK_PAGE_MASK));
+	assert(VM_MAP_PAGE_ALIGNED(size, FOURK_PAGE_MASK));
 
+	if (!anywhere && overwrite) {
+		return KERN_NOT_SUPPORTED;
+	}
+	if (!anywhere && overwrite) {
 		/*
-		 * If there is a hole, return an error.
+		 * Create a temporary VM map to hold the old mappings in the
+		 * affected area while we create the new one.
+		 * This avoids releasing the VM map lock in
+		 * vm_map_entry_delete() and allows atomicity
+		 * when we want to replace some mappings with a new one.
+		 * It also allows us to restore the old VM mappings if the
+		 * new mapping fails.
 		 */
-		if (current->vme_start != prev) {
-			vm_map_unlock(map);
-			return(KERN_INVALID_ADDRESS);
-		}
-
-		new_max = current->max_protection;
-		if(new_prot & VM_PROT_COPY) {
-			new_max |= VM_PROT_WRITE;
-			if ((new_prot & (new_max | VM_PROT_COPY)) != new_prot) {
-				vm_map_unlock(map);
-				return(KERN_PROTECTION_FAILURE);
-			}
-		} else {
-			if ((new_prot & new_max) != new_prot) {
-				vm_map_unlock(map);
-				return(KERN_PROTECTION_FAILURE);
-			}
-		}
-
-		prev = current->vme_end;
-		current = current->vme_next;
-	}
-	if (end > prev) {
-		vm_map_unlock(map);
-		return(KERN_INVALID_ADDRESS);
+		zap_old_map = vm_map_create(PMAP_NULL,
+		    *address,
+		    *address + size,
+		    map->hdr.entries_pageable);
+		vm_map_set_page_shift(zap_old_map, VM_MAP_PAGE_SHIFT(map));
+		vm_map_disable_hole_optimization(zap_old_map);
 	}
 
-	/*
-	 *	Go back and fix up protections.
-	 *	Clip to start here if the range starts within
-	 *	the entry.
-	 */
+	fourk_start = *address;
+	fourk_size = size;
+	fourk_end = fourk_start + fourk_size;
 
-	current = entry;
-	if (clip) {
-		vm_map_clip_start(map, entry, start);
-	}
-	while ((current != vm_map_to_entry(map)) &&
-	       (current->vme_start < end)) {
+	start = vm_map_trunc_page(*address, VM_MAP_PAGE_MASK(map));
+	end = vm_map_round_page(fourk_end, VM_MAP_PAGE_MASK(map));
+	size = end - start;
 
-		vm_prot_t	old_prot;
+	if (anywhere) {
+		return KERN_NOT_SUPPORTED;
+	} else {
+		/*
+		 *	Verify that:
+		 *		the address doesn't itself violate
+		 *		the mask requirement.
+		 */
 
-		vm_map_clip_end(map, current, end);
+		vm_map_lock(map);
+		map_locked = TRUE;
+		if ((start & mask) != 0) {
+			RETURN(KERN_NO_SPACE);
+		}
 
-		old_prot = current->protection;
+		/*
+		 *	...	the address is within bounds
+		 */
+
+		end = start + size;
 
-		if(new_prot & VM_PROT_COPY) {
-			/* caller is asking specifically to copy the      */
-			/* mapped data, this implies that max protection  */
-			/* will include write.  Caller must be prepared   */
-			/* for loss of shared memory communication in the */
-			/* target area after taking this step */
-			current->needs_copy = TRUE;
-			current->max_protection |= VM_PROT_WRITE;
+		if ((start < effective_min_offset) ||
+		    (end > effective_max_offset) ||
+		    (start >= end)) {
+			RETURN(KERN_INVALID_ADDRESS);
 		}
 
-		if (set_max)
-			current->protection =
-				(current->max_protection = 
-					new_prot & ~VM_PROT_COPY) &
-					old_prot;
-		else
-			current->protection = new_prot & ~VM_PROT_COPY;
+		if (overwrite && zap_old_map != VM_MAP_NULL) {
+			/*
+			 * Fixed mapping and "overwrite" flag: attempt to
+			 * remove all existing mappings in the specified
+			 * address range, saving them in our "zap_old_map".
+			 */
+			(void) vm_map_delete(map, start, end,
+			    (VM_MAP_REMOVE_SAVE_ENTRIES |
+			    VM_MAP_REMOVE_NO_MAP_ALIGN),
+			    zap_old_map);
+		}
 
 		/*
-		 *	Update physical map if necessary.
-		 *	If the request is to turn off write protection, 
-		 *	we won't do it for real (in pmap). This is because 
-		 *	it would cause copy-on-write to fail.  We've already 
-		 *	set, the new protection in the map, so if a 
-		 *	write-protect fault occurred, it will be fixed up 
-		 *	properly, COW or not.
+		 *	...	the starting address isn't allocated
 		 */
-	 	/* the 256M hack for existing hardware limitations */
-		if (current->protection != old_prot) {
-	 	   if(current->is_sub_map && current->use_pmap) {
-			vm_offset_t	pmap_base_addr;
-			vm_offset_t	pmap_end_addr;
-			vm_map_entry_t	local_entry;
-
-			pmap_base_addr = 0xF0000000 & current->vme_start;
-			pmap_end_addr = (pmap_base_addr + 0x10000000) - 1;
-#ifndef i386
-			if(!vm_map_lookup_entry(map, 
-					pmap_base_addr, &local_entry))
-			   panic("vm_map_protect: nested pmap area is missing");
-			   while ((local_entry != vm_map_to_entry(map)) &&
-	       	  	          (local_entry->vme_start < pmap_end_addr)) {
-				local_entry->use_pmap = FALSE;
-				local_entry = local_entry->vme_next;
-			   }
-			   pmap_unnest(map->pmap, pmap_base_addr,
-			       		(pmap_end_addr - pmap_base_addr) + 1);
-#endif
-		   }
-		   if (!(current->protection & VM_PROT_WRITE)) {
-			/* Look one level in we support nested pmaps */
-			/* from mapped submaps which are direct entries */
-			/* in our map */
-			if(current->is_sub_map && current->use_pmap) {
-				pmap_protect(current->object.sub_map->pmap, 
-					current->vme_start,
-					current->vme_end,
-					current->protection);
+		if (vm_map_lookup_entry(map, start, &entry)) {
+			vm_object_t cur_object, shadow_object;
+
+			/*
+			 * We might already have some 4K mappings
+			 * in a 16K page here.
+			 */
+
+			if (entry->vme_end - entry->vme_start
+			    != SIXTEENK_PAGE_SIZE) {
+				RETURN(KERN_NO_SPACE);
+			}
+			if (entry->is_sub_map) {
+				RETURN(KERN_NO_SPACE);
+			}
+			if (VME_OBJECT(entry) == VM_OBJECT_NULL) {
+				RETURN(KERN_NO_SPACE);
+			}
+
+			/* go all the way down the shadow chain */
+			cur_object = VME_OBJECT(entry);
+			vm_object_lock(cur_object);
+			while (cur_object->shadow != VM_OBJECT_NULL) {
+				shadow_object = cur_object->shadow;
+				vm_object_lock(shadow_object);
+				vm_object_unlock(cur_object);
+				cur_object = shadow_object;
+				shadow_object = VM_OBJECT_NULL;
+			}
+			if (cur_object->internal ||
+			    cur_object->pager == NULL) {
+				vm_object_unlock(cur_object);
+				RETURN(KERN_NO_SPACE);
+			}
+			if (cur_object->pager->mo_pager_ops
+			    != &fourk_pager_ops) {
+				vm_object_unlock(cur_object);
+				RETURN(KERN_NO_SPACE);
+			}
+			fourk_object = cur_object;
+			fourk_mem_obj = fourk_object->pager;
+
+			/* keep the "4K" object alive */
+			vm_object_reference_locked(fourk_object);
+			vm_object_unlock(fourk_object);
+
+			/* merge permissions */
+			entry->protection |= cur_protection;
+			entry->max_protection |= max_protection;
+			if ((entry->protection & (VM_PROT_WRITE |
+			    VM_PROT_EXECUTE)) ==
+			    (VM_PROT_WRITE | VM_PROT_EXECUTE) &&
+			    fourk_binary_compatibility_unsafe &&
+			    fourk_binary_compatibility_allow_wx) {
+				/* write+execute: need to be "jit" */
+				entry->used_for_jit = TRUE;
+			}
+
+			goto map_in_fourk_pager;
+		}
+
+		/*
+		 *	...	the next region doesn't overlap the
+		 *		end point.
+		 */
+
+		if ((entry->vme_next != vm_map_to_entry(map)) &&
+		    (entry->vme_next->vme_start < end)) {
+			RETURN(KERN_NO_SPACE);
+		}
+	}
+
+	/*
+	 *	At this point,
+	 *		"start" and "end" should define the endpoints of the
+	 *			available new range, and
+	 *		"entry" should refer to the region before the new
+	 *			range, and
+	 *
+	 *		the map should be locked.
+	 */
+
+	/* create a new "4K" pager */
+	fourk_mem_obj = fourk_pager_create();
+	fourk_object = fourk_pager_to_vm_object(fourk_mem_obj);
+	assert(fourk_object);
+
+	/* keep the "4K" object alive */
+	vm_object_reference(fourk_object);
+
+	/* create a "copy" object, to map the "4K" object copy-on-write */
+	fourk_copy = TRUE;
+	result = vm_object_copy_strategically(fourk_object,
+	    0,
+	    end - start,
+	    &copy_object,
+	    &copy_offset,
+	    &fourk_copy);
+	assert(result == KERN_SUCCESS);
+	assert(copy_object != VM_OBJECT_NULL);
+	assert(copy_offset == 0);
+
+	/* take a reference on the copy object, for this mapping */
+	vm_object_reference(copy_object);
+
+	/* map the "4K" pager's copy object */
+	new_entry =
+	    vm_map_entry_insert(map, entry,
+	    vm_map_trunc_page(start,
+	    VM_MAP_PAGE_MASK(map)),
+	    vm_map_round_page(end,
+	    VM_MAP_PAGE_MASK(map)),
+	    copy_object,
+	    0,                         /* offset */
+	    FALSE,                         /* needs_copy */
+	    FALSE,
+	    FALSE,
+	    cur_protection, max_protection,
+	    VM_BEHAVIOR_DEFAULT,
+	    ((entry_for_jit)
+	    ? VM_INHERIT_NONE
+	    : inheritance),
+	    0,
+	    no_cache,
+	    permanent,
+	    no_copy_on_read,
+	    superpage_size,
+	    clear_map_aligned,
+	    is_submap,
+	    FALSE,                         /* jit */
+	    alias);
+	entry = new_entry;
+
+#if VM_MAP_DEBUG_FOURK
+	if (vm_map_debug_fourk) {
+		printf("FOURK_PAGER: map %p [0x%llx:0x%llx] new pager %p\n",
+		    map,
+		    (uint64_t) entry->vme_start,
+		    (uint64_t) entry->vme_end,
+		    fourk_mem_obj);
+	}
+#endif /* VM_MAP_DEBUG_FOURK */
+
+	new_mapping_established = TRUE;
+
+map_in_fourk_pager:
+	/* "map" the original "object" where it belongs in the "4K" pager */
+	fourk_pager_offset = (fourk_start & SIXTEENK_PAGE_MASK);
+	fourk_pager_index_start = (int) (fourk_pager_offset / FOURK_PAGE_SIZE);
+	if (fourk_size > SIXTEENK_PAGE_SIZE) {
+		fourk_pager_index_num = 4;
+	} else {
+		fourk_pager_index_num = (int) (fourk_size / FOURK_PAGE_SIZE);
+	}
+	if (fourk_pager_index_start + fourk_pager_index_num > 4) {
+		fourk_pager_index_num = 4 - fourk_pager_index_start;
+	}
+	for (cur_idx = 0;
+	    cur_idx < fourk_pager_index_num;
+	    cur_idx++) {
+		vm_object_t             old_object;
+		vm_object_offset_t      old_offset;
+
+		kr = fourk_pager_populate(fourk_mem_obj,
+		    TRUE,                       /* overwrite */
+		    fourk_pager_index_start + cur_idx,
+		    object,
+		    (object
+		    ? (offset +
+		    (cur_idx * FOURK_PAGE_SIZE))
+		    : 0),
+		    &old_object,
+		    &old_offset);
+#if VM_MAP_DEBUG_FOURK
+		if (vm_map_debug_fourk) {
+			if (old_object == (vm_object_t) -1 &&
+			    old_offset == (vm_object_offset_t) -1) {
+				printf("FOURK_PAGER: map %p [0x%llx:0x%llx] "
+				    "pager [%p:0x%llx] "
+				    "populate[%d] "
+				    "[object:%p,offset:0x%llx]\n",
+				    map,
+				    (uint64_t) entry->vme_start,
+				    (uint64_t) entry->vme_end,
+				    fourk_mem_obj,
+				    VME_OFFSET(entry),
+				    fourk_pager_index_start + cur_idx,
+				    object,
+				    (object
+				    ? (offset + (cur_idx * FOURK_PAGE_SIZE))
+				    : 0));
 			} else {
-				pmap_protect(map->pmap, current->vme_start,
-					current->vme_end,
-					current->protection);
+				printf("FOURK_PAGER: map %p [0x%llx:0x%llx] "
+				    "pager [%p:0x%llx] "
+				    "populate[%d] [object:%p,offset:0x%llx] "
+				    "old [%p:0x%llx]\n",
+				    map,
+				    (uint64_t) entry->vme_start,
+				    (uint64_t) entry->vme_end,
+				    fourk_mem_obj,
+				    VME_OFFSET(entry),
+				    fourk_pager_index_start + cur_idx,
+				    object,
+				    (object
+				    ? (offset + (cur_idx * FOURK_PAGE_SIZE))
+				    : 0),
+				    old_object,
+				    old_offset);
 			}
-		   }
 		}
-		current = current->vme_next;
+#endif /* VM_MAP_DEBUG_FOURK */
+
+		assert(kr == KERN_SUCCESS);
+		if (object != old_object &&
+		    object != VM_OBJECT_NULL &&
+		    object != (vm_object_t) -1) {
+			vm_object_reference(object);
+		}
+		if (object != old_object &&
+		    old_object != VM_OBJECT_NULL &&
+		    old_object != (vm_object_t) -1) {
+			vm_object_deallocate(old_object);
+		}
 	}
 
-	vm_map_unlock(map);
-	return(KERN_SUCCESS);
-}
+BailOut:
+	assert(map_locked == TRUE);
 
-/*
- *	vm_map_inherit:
- *
- *	Sets the inheritance of the specified address
- *	range in the target map.  Inheritance
- *	affects how the map will be shared with
- *	child maps at the time of vm_map_fork.
- */
-kern_return_t
-vm_map_inherit(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	register vm_inherit_t	new_inheritance)
-{
-	register vm_map_entry_t	entry;
-	vm_map_entry_t	temp_entry;
+	if (fourk_object != VM_OBJECT_NULL) {
+		vm_object_deallocate(fourk_object);
+		fourk_object = VM_OBJECT_NULL;
+		fourk_mem_obj = MEMORY_OBJECT_NULL;
+	}
 
-	vm_map_lock(map);
+	if (result == KERN_SUCCESS) {
+		vm_prot_t pager_prot;
+		memory_object_t pager;
+
+#if DEBUG
+		if (pmap_empty &&
+		    !(vmk_flags.vmkf_no_pmap_check)) {
+			assert(vm_map_pmap_is_empty(map,
+			    *address,
+			    *address + size));
+		}
+#endif /* DEBUG */
 
-	VM_MAP_RANGE_CHECK(map, start, end);
+		/*
+		 * For "named" VM objects, let the pager know that the
+		 * memory object is being mapped.  Some pagers need to keep
+		 * track of this, to know when they can reclaim the memory
+		 * object, for example.
+		 * VM calls memory_object_map() for each mapping (specifying
+		 * the protection of each mapping) and calls
+		 * memory_object_last_unmap() when all the mappings are gone.
+		 */
+		pager_prot = max_protection;
+		if (needs_copy) {
+			/*
+			 * Copy-On-Write mapping: won't modify
+			 * the memory object.
+			 */
+			pager_prot &= ~VM_PROT_WRITE;
+		}
+		if (!is_submap &&
+		    object != VM_OBJECT_NULL &&
+		    object->named &&
+		    object->pager != MEMORY_OBJECT_NULL) {
+			vm_object_lock(object);
+			pager = object->pager;
+			if (object->named &&
+			    pager != MEMORY_OBJECT_NULL) {
+				assert(object->pager_ready);
+				vm_object_mapping_wait(object, THREAD_UNINT);
+				vm_object_mapping_begin(object);
+				vm_object_unlock(object);
 
-	if (vm_map_lookup_entry(map, start, &temp_entry)) {
-		entry = temp_entry;
-		vm_map_clip_start(map, entry, start);
+				kr = memory_object_map(pager, pager_prot);
+				assert(kr == KERN_SUCCESS);
+
+				vm_object_lock(object);
+				vm_object_mapping_end(object);
+			}
+			vm_object_unlock(object);
+		}
+		if (!is_submap &&
+		    fourk_object != VM_OBJECT_NULL &&
+		    fourk_object->named &&
+		    fourk_object->pager != MEMORY_OBJECT_NULL) {
+			vm_object_lock(fourk_object);
+			pager = fourk_object->pager;
+			if (fourk_object->named &&
+			    pager != MEMORY_OBJECT_NULL) {
+				assert(fourk_object->pager_ready);
+				vm_object_mapping_wait(fourk_object,
+				    THREAD_UNINT);
+				vm_object_mapping_begin(fourk_object);
+				vm_object_unlock(fourk_object);
+
+				kr = memory_object_map(pager, VM_PROT_READ);
+				assert(kr == KERN_SUCCESS);
+
+				vm_object_lock(fourk_object);
+				vm_object_mapping_end(fourk_object);
+			}
+			vm_object_unlock(fourk_object);
+		}
 	}
-	else {
-		temp_entry = temp_entry->vme_next;
-		entry = temp_entry;
+
+	assert(map_locked == TRUE);
+
+	if (!keep_map_locked) {
+		vm_map_unlock(map);
+		map_locked = FALSE;
 	}
 
-	/* first check entire range for submaps which can't support the */
-	/* given inheritance. */
-	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
-		if(entry->is_sub_map) {
-			if(new_inheritance == VM_INHERIT_COPY)
-				return(KERN_INVALID_ARGUMENT);
+	/*
+	 * We can't hold the map lock if we enter this block.
+	 */
+
+	if (result == KERN_SUCCESS) {
+		/*	Wire down the new entry if the user
+		 *	requested all new map entries be wired.
+		 */
+		if ((map->wiring_required) || (superpage_size)) {
+			assert(!keep_map_locked);
+			pmap_empty = FALSE; /* pmap won't be empty */
+			kr = vm_map_wire_kernel(map, start, end,
+			    new_entry->protection, VM_KERN_MEMORY_MLOCK,
+			    TRUE);
+			result = kr;
 		}
 
-		entry = entry->vme_next;
 	}
 
-	entry = temp_entry;
+	if (result != KERN_SUCCESS) {
+		if (new_mapping_established) {
+			/*
+			 * We have to get rid of the new mappings since we
+			 * won't make them available to the user.
+			 * Try and do that atomically, to minimize the risk
+			 * that someone else creates new mappings in that range.
+			 */
+			zap_new_map = vm_map_create(PMAP_NULL,
+			    *address,
+			    *address + size,
+			    map->hdr.entries_pageable);
+			vm_map_set_page_shift(zap_new_map,
+			    VM_MAP_PAGE_SHIFT(map));
+			vm_map_disable_hole_optimization(zap_new_map);
+
+			if (!map_locked) {
+				vm_map_lock(map);
+				map_locked = TRUE;
+			}
+			(void) vm_map_delete(map, *address, *address + size,
+			    (VM_MAP_REMOVE_SAVE_ENTRIES |
+			    VM_MAP_REMOVE_NO_MAP_ALIGN),
+			    zap_new_map);
+		}
+		if (zap_old_map != VM_MAP_NULL &&
+		    zap_old_map->hdr.nentries != 0) {
+			vm_map_entry_t  entry1, entry2;
 
-	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
-		vm_map_clip_end(map, entry, end);
+			/*
+			 * The new mapping failed.  Attempt to restore
+			 * the old mappings, saved in the "zap_old_map".
+			 */
+			if (!map_locked) {
+				vm_map_lock(map);
+				map_locked = TRUE;
+			}
 
-		entry->inheritance = new_inheritance;
+			/* first check if the coast is still clear */
+			start = vm_map_first_entry(zap_old_map)->vme_start;
+			end = vm_map_last_entry(zap_old_map)->vme_end;
+			if (vm_map_lookup_entry(map, start, &entry1) ||
+			    vm_map_lookup_entry(map, end, &entry2) ||
+			    entry1 != entry2) {
+				/*
+				 * Part of that range has already been
+				 * re-mapped:  we can't restore the old
+				 * mappings...
+				 */
+				vm_map_enter_restore_failures++;
+			} else {
+				/*
+				 * Transfer the saved map entries from
+				 * "zap_old_map" to the original "map",
+				 * inserting them all after "entry1".
+				 */
+				for (entry2 = vm_map_first_entry(zap_old_map);
+				    entry2 != vm_map_to_entry(zap_old_map);
+				    entry2 = vm_map_first_entry(zap_old_map)) {
+					vm_map_size_t entry_size;
+
+					entry_size = (entry2->vme_end -
+					    entry2->vme_start);
+					vm_map_store_entry_unlink(zap_old_map,
+					    entry2);
+					zap_old_map->size -= entry_size;
+					vm_map_store_entry_link(map, entry1, entry2,
+					    VM_MAP_KERNEL_FLAGS_NONE);
+					map->size += entry_size;
+					entry1 = entry2;
+				}
+				if (map->wiring_required) {
+					/*
+					 * XXX TODO: we should rewire the
+					 * old pages here...
+					 */
+				}
+				vm_map_enter_restore_successes++;
+			}
+		}
+	}
 
-		entry = entry->vme_next;
+	/*
+	 * The caller is responsible for releasing the lock if it requested to
+	 * keep the map locked.
+	 */
+	if (map_locked && !keep_map_locked) {
+		vm_map_unlock(map);
 	}
 
-	vm_map_unlock(map);
-	return(KERN_SUCCESS);
+	/*
+	 * Get rid of the "zap_maps" and all the map entries that
+	 * they may still contain.
+	 */
+	if (zap_old_map != VM_MAP_NULL) {
+		vm_map_destroy(zap_old_map, VM_MAP_REMOVE_NO_PMAP_CLEANUP);
+		zap_old_map = VM_MAP_NULL;
+	}
+	if (zap_new_map != VM_MAP_NULL) {
+		vm_map_destroy(zap_new_map, VM_MAP_REMOVE_NO_PMAP_CLEANUP);
+		zap_new_map = VM_MAP_NULL;
+	}
+
+	return result;
+
+#undef  RETURN
 }
+#endif /* __arm64__ */
 
 /*
- *	vm_map_wire:
- *
- *	Sets the pageability of the specified address range in the
- *	target map as wired.  Regions specified as not pageable require
- *	locked-down physical memory and physical page maps.  The
- *	access_type variable indicates types of accesses that must not
- *	generate page faults.  This is checked against protection of
- *	memory being locked-down.
- *
- *	The map must not be locked, but a reference must remain to the
- *	map throughout the call.
+ * Counters for the prefault optimization.
  */
-kern_return_t
-vm_map_wire_nested(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	register vm_prot_t	access_type,
-	boolean_t		user_wire,
-	pmap_t			map_pmap)
-{
-	register vm_map_entry_t	entry;
-	struct vm_map_entry	*first_entry, tmp_entry;
-	vm_map_t		pmap_map;
-	register vm_offset_t	s,e;
-	kern_return_t		rc;
-	boolean_t		need_wakeup;
-	boolean_t		main_map = FALSE;
-	boolean_t		interruptible_state;
-	thread_t		cur_thread;
-	unsigned int		last_timestamp;
-	vm_size_t		size;
-
-	vm_map_lock(map);
-	if(map_pmap == NULL)
-		main_map = TRUE;
-	last_timestamp = map->timestamp;
+int64_t vm_prefault_nb_pages = 0;
+int64_t vm_prefault_nb_bailout = 0;
+
+static kern_return_t
+vm_map_enter_mem_object_helper(
+	vm_map_t                target_map,
+	vm_map_offset_t         *address,
+	vm_map_size_t           initial_size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	ipc_port_t              port,
+	vm_object_offset_t      offset,
+	boolean_t               copy,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_inherit_t            inheritance,
+	upl_page_list_ptr_t     page_list,
+	unsigned int            page_list_count)
+{
+	vm_map_address_t        map_addr;
+	vm_map_size_t           map_size;
+	vm_object_t             object;
+	vm_object_size_t        size;
+	kern_return_t           result;
+	boolean_t               mask_cur_protection, mask_max_protection;
+	boolean_t               kernel_prefault, try_prefault = (page_list_count != 0);
+	vm_map_offset_t         offset_in_mapping = 0;
+#if __arm64__
+	boolean_t               fourk = vmk_flags.vmkf_fourk;
+#endif /* __arm64__ */
+
+	assertf(vmk_flags.__vmkf_unused == 0, "vmk_flags unused=0x%x\n", vmk_flags.__vmkf_unused);
+
+	mask_cur_protection = cur_protection & VM_PROT_IS_MASK;
+	mask_max_protection = max_protection & VM_PROT_IS_MASK;
+	cur_protection &= ~VM_PROT_IS_MASK;
+	max_protection &= ~VM_PROT_IS_MASK;
 
-	VM_MAP_RANGE_CHECK(map, start, end);
-	assert(page_aligned(start));
-	assert(page_aligned(end));
-	if (start == end) {
-		/* We wired what the caller asked for, zero pages */
-		vm_map_unlock(map);
-		return KERN_SUCCESS;
+	/*
+	 * Check arguments for validity
+	 */
+	if ((target_map == VM_MAP_NULL) ||
+	    (cur_protection & ~VM_PROT_ALL) ||
+	    (max_protection & ~VM_PROT_ALL) ||
+	    (inheritance > VM_INHERIT_LAST_VALID) ||
+	    (try_prefault && (copy || !page_list)) ||
+	    initial_size == 0) {
+		return KERN_INVALID_ARGUMENT;
 	}
 
-	if (vm_map_lookup_entry(map, start, &first_entry)) {
-		entry = first_entry;
-		/* vm_map_clip_start will be done later. */
-	} else {
-		/* Start address is not in map */
-		vm_map_unlock(map);
-		return(KERN_INVALID_ADDRESS);
+#if __arm64__
+	if (fourk) {
+		map_addr = vm_map_trunc_page(*address, FOURK_PAGE_MASK);
+		map_size = vm_map_round_page(initial_size, FOURK_PAGE_MASK);
+	} else
+#endif /* __arm64__ */
+	{
+		map_addr = vm_map_trunc_page(*address,
+		    VM_MAP_PAGE_MASK(target_map));
+		map_size = vm_map_round_page(initial_size,
+		    VM_MAP_PAGE_MASK(target_map));
 	}
+	size = vm_object_round_page(initial_size);
 
-	s=start;
-	need_wakeup = FALSE;
-	cur_thread = current_thread();
-	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
-		/*
-		 * If another thread is wiring/unwiring this entry then
-		 * block after informing other thread to wake us up.
-		 */
-		if (entry->in_transition) {
-			/*
-			 * We have not clipped the entry.  Make sure that
-			 * the start address is in range so that the lookup
-			 * below will succeed.
-			 */
-			s = entry->vme_start < start? start: entry->vme_start;
+	/*
+	 * Find the vm object (if any) corresponding to this port.
+	 */
+	if (!IP_VALID(port)) {
+		object = VM_OBJECT_NULL;
+		offset = 0;
+		copy = FALSE;
+	} else if (ip_kotype(port) == IKOT_NAMED_ENTRY) {
+		vm_named_entry_t        named_entry;
+
+		named_entry = (vm_named_entry_t) port->ip_kobject;
+
+		if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+		    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+			offset += named_entry->data_offset;
+		}
 
-			entry->needs_wakeup = TRUE;
+		/* a few checks to make sure user is obeying rules */
+		if (size == 0) {
+			if (offset >= named_entry->size) {
+				return KERN_INVALID_RIGHT;
+			}
+			size = named_entry->size - offset;
+		}
+		if (mask_max_protection) {
+			max_protection &= named_entry->protection;
+		}
+		if (mask_cur_protection) {
+			cur_protection &= named_entry->protection;
+		}
+		if ((named_entry->protection & max_protection) !=
+		    max_protection) {
+			return KERN_INVALID_RIGHT;
+		}
+		if ((named_entry->protection & cur_protection) !=
+		    cur_protection) {
+			return KERN_INVALID_RIGHT;
+		}
+		if (offset + size < offset) {
+			/* overflow */
+			return KERN_INVALID_ARGUMENT;
+		}
+		if (named_entry->size < (offset + initial_size)) {
+			return KERN_INVALID_ARGUMENT;
+		}
 
-			/*
-			 * wake up anybody waiting on entries that we have
-			 * already wired.
-			 */
-			if (need_wakeup) {
-				vm_map_entry_wakeup(map);
-				need_wakeup = FALSE;
+		if (named_entry->is_copy) {
+			/* for a vm_map_copy, we can only map it whole */
+			if ((size != named_entry->size) &&
+			    (vm_map_round_page(size,
+			    VM_MAP_PAGE_MASK(target_map)) ==
+			    named_entry->size)) {
+				/* XXX FBDP use the rounded size... */
+				size = vm_map_round_page(
+					size,
+					VM_MAP_PAGE_MASK(target_map));
 			}
-			/*
-			 * User wiring is interruptible
-			 */
-			vm_map_entry_wait(map, 
-					  (user_wire) ? THREAD_ABORTSAFE :
-					                THREAD_UNINT);
-			if (user_wire && cur_thread->wait_result ==
-							THREAD_INTERRUPTED) {
+
+			if (!(flags & VM_FLAGS_ANYWHERE) &&
+			    (offset != 0 ||
+			    size != named_entry->size)) {
 				/*
-				 * undo the wirings we have done so far
-				 * We do not clear the needs_wakeup flag,
-				 * because we cannot tell if we were the
-				 * only one waiting.
+				 * XXX for a mapping at a "fixed" address,
+				 * we can't trim after mapping the whole
+				 * memory entry, so reject a request for a
+				 * partial mapping.
 				 */
-				vm_map_unwire(map, start, s, user_wire);
-				return(KERN_FAILURE);
+				return KERN_INVALID_ARGUMENT;
 			}
+		}
 
-			vm_map_lock(map);
-			/*
-			 * Cannot avoid a lookup here. reset timestamp.
-			 */
-			last_timestamp = map->timestamp;
+		/* the caller's parameter offset is defined to be the */
+		/* offset from beginning of named entry offset in object */
+		offset = offset + named_entry->offset;
 
+		if (!VM_MAP_PAGE_ALIGNED(size,
+		    VM_MAP_PAGE_MASK(target_map))) {
 			/*
-			 * The entry could have been clipped, look it up again.
-			 * Worse that can happen is, it may not exist anymore.
+			 * Let's not map more than requested;
+			 * vm_map_enter() will handle this "not map-aligned"
+			 * case.
 			 */
-			if (!vm_map_lookup_entry(map, s, &first_entry)) {
-				if (!user_wire)
-					panic("vm_map_wire: re-lookup failed");
+			map_size = size;
+		}
+
+		named_entry_lock(named_entry);
+		if (named_entry->is_sub_map) {
+			vm_map_t                submap;
+
+			if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+			    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+				panic("VM_FLAGS_RETURN_DATA_ADDR not expected for submap.");
+			}
 
+			submap = named_entry->backing.map;
+			vm_map_lock(submap);
+			vm_map_reference(submap);
+			vm_map_unlock(submap);
+			named_entry_unlock(named_entry);
+
+			vmk_flags.vmkf_submap = TRUE;
+
+			result = vm_map_enter(target_map,
+			    &map_addr,
+			    map_size,
+			    mask,
+			    flags,
+			    vmk_flags,
+			    tag,
+			    (vm_object_t)(uintptr_t) submap,
+			    offset,
+			    copy,
+			    cur_protection,
+			    max_protection,
+			    inheritance);
+			if (result != KERN_SUCCESS) {
+				vm_map_deallocate(submap);
+			} else {
 				/*
-				 * User: undo everything upto the previous
-				 * entry.  let vm_map_unwire worry about
-				 * checking the validity of the range.
+				 * No need to lock "submap" just to check its
+				 * "mapped" flag: that flag is never reset
+				 * once it's been set and if we race, we'll
+				 * just end up setting it twice, which is OK.
 				 */
-				vm_map_unlock(map);
-				vm_map_unwire(map, start, s, user_wire);
-				return(KERN_FAILURE);
+				if (submap->mapped_in_other_pmaps == FALSE &&
+				    vm_map_pmap(submap) != PMAP_NULL &&
+				    vm_map_pmap(submap) !=
+				    vm_map_pmap(target_map)) {
+					/*
+					 * This submap is being mapped in a map
+					 * that uses a different pmap.
+					 * Set its "mapped_in_other_pmaps" flag
+					 * to indicate that we now need to
+					 * remove mappings from all pmaps rather
+					 * than just the submap's pmap.
+					 */
+					vm_map_lock(submap);
+					submap->mapped_in_other_pmaps = TRUE;
+					vm_map_unlock(submap);
+				}
+				*address = map_addr;
+			}
+			return result;
+		} else if (named_entry->is_copy) {
+			kern_return_t   kr;
+			vm_map_copy_t   copy_map;
+			vm_map_entry_t  copy_entry;
+			vm_map_offset_t copy_addr;
+
+			if (flags & ~(VM_FLAGS_FIXED |
+			    VM_FLAGS_ANYWHERE |
+			    VM_FLAGS_OVERWRITE |
+			    VM_FLAGS_RETURN_4K_DATA_ADDR |
+			    VM_FLAGS_RETURN_DATA_ADDR |
+			    VM_FLAGS_ALIAS_MASK)) {
+				named_entry_unlock(named_entry);
+				return KERN_INVALID_ARGUMENT;
 			}
-			entry = first_entry;
-			continue;
-		}
-		
-		if(entry->is_sub_map) {
-			vm_offset_t	sub_start;
-			vm_offset_t	sub_end;
-			vm_offset_t	local_end;
-			pmap_t		pmap;
-			
-			vm_map_clip_start(map, entry, start);
-			vm_map_clip_end(map, entry, end);
 
-			sub_start += entry->offset;
-			sub_end = entry->vme_end - entry->vme_start;
-			sub_end += entry->offset;
-			
-			local_end = entry->vme_end;
-			if(map_pmap == NULL) {
-				if(entry->use_pmap) {
-					pmap = entry->object.sub_map->pmap;
-				} else {
-					pmap = map->pmap;
+			if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+			    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+				offset_in_mapping = offset - vm_object_trunc_page(offset);
+				if (flags & VM_FLAGS_RETURN_4K_DATA_ADDR) {
+					offset_in_mapping &= ~((signed)(0xFFF));
 				}
-				if (entry->wired_count) {
-					if (entry->wired_count 
-							>= MAX_WIRE_COUNT)
-					panic("vm_map_wire: too many wirings");
-
-					if (user_wire &&
-			    			entry->user_wired_count 
-							>= MAX_WIRE_COUNT) {
-				   	   vm_map_unlock(map);
-				   	   vm_map_unwire(map, start,
-						entry->vme_start, user_wire);
-				   	   return(KERN_FAILURE);
-					}
-					if (!user_wire || 
-					      (entry->user_wired_count++ == 0))
-						entry->wired_count++;
-					entry = entry->vme_next;
-					continue;
+				offset = vm_object_trunc_page(offset);
+				map_size = vm_object_round_page(offset + offset_in_mapping + initial_size) - offset;
+			}
 
-				} else {
-					vm_object_t		object;
-					vm_object_offset_t	offset_hi;
-					vm_object_offset_t	offset_lo;
-					vm_object_offset_t	offset;
-					vm_prot_t		prot;
-					boolean_t		wired;
-					vm_behavior_t		behavior;
-					vm_offset_t		local_start;
-					vm_map_entry_t		local_entry;
-					vm_map_version_t	 version;
-					vm_map_t		lookup_map;
-
-					/* call vm_map_lookup_locked to */
-					/* cause any needs copy to be   */
-					/* evaluated */
-					local_start = entry->vme_start;
-					lookup_map = map;
-					vm_map_lock_write_to_read(map);
-					if(vm_map_lookup_locked(
-						&lookup_map, local_start, 
-						VM_PROT_WRITE,
-						&version, &object,
-						&offset, &prot, &wired,
-						&behavior, &offset_lo,
-						&offset_hi, &pmap_map)) {
-						
-						vm_map_unlock(lookup_map);
-				   	   	vm_map_unwire(map, start,
-						   entry->vme_start, user_wire);
-				   	   	return(KERN_FAILURE);
-					}
-					if(pmap_map != lookup_map)
-						vm_map_unlock(pmap_map);
-					if(lookup_map != map) {
-						vm_map_unlock(lookup_map);
-						vm_map_lock(map);
-					} else {
-						vm_map_unlock(map);
-						vm_map_lock(map);
-					}
-					last_timestamp = 
-						version.main_timestamp;
-					vm_object_unlock(object);
-					if (vm_map_lookup_entry(map, 
-						local_start, &local_entry)) {
-						vm_map_unlock(map);
-				   	   	vm_map_unwire(map, start,
-						   entry->vme_start, user_wire);
-				   	   	return(KERN_FAILURE);
+			copy_map = named_entry->backing.copy;
+			assert(copy_map->type == VM_MAP_COPY_ENTRY_LIST);
+			if (copy_map->type != VM_MAP_COPY_ENTRY_LIST) {
+				/* unsupported type; should not happen */
+				printf("vm_map_enter_mem_object: "
+				    "memory_entry->backing.copy "
+				    "unsupported type 0x%x\n",
+				    copy_map->type);
+				named_entry_unlock(named_entry);
+				return KERN_INVALID_ARGUMENT;
+			}
+
+			/* reserve a contiguous range */
+			kr = vm_map_enter(target_map,
+			    &map_addr,
+			    /* map whole mem entry, trim later: */
+			    named_entry->size,
+			    mask,
+			    flags & (VM_FLAGS_ANYWHERE |
+			    VM_FLAGS_OVERWRITE |
+			    VM_FLAGS_RETURN_4K_DATA_ADDR |
+			    VM_FLAGS_RETURN_DATA_ADDR),
+			    vmk_flags,
+			    tag,
+			    VM_OBJECT_NULL,
+			    0,
+			    FALSE,               /* copy */
+			    cur_protection,
+			    max_protection,
+			    inheritance);
+			if (kr != KERN_SUCCESS) {
+				named_entry_unlock(named_entry);
+				return kr;
+			}
+
+			copy_addr = map_addr;
+
+			for (copy_entry = vm_map_copy_first_entry(copy_map);
+			    copy_entry != vm_map_copy_to_entry(copy_map);
+			    copy_entry = copy_entry->vme_next) {
+				int                     remap_flags;
+				vm_map_kernel_flags_t   vmk_remap_flags;
+				vm_map_t                copy_submap;
+				vm_object_t             copy_object;
+				vm_map_size_t           copy_size;
+				vm_object_offset_t      copy_offset;
+				int                     copy_vm_alias;
+
+				remap_flags = 0;
+				vmk_remap_flags = VM_MAP_KERNEL_FLAGS_NONE;
+
+				copy_object = VME_OBJECT(copy_entry);
+				copy_offset = VME_OFFSET(copy_entry);
+				copy_size = (copy_entry->vme_end -
+				    copy_entry->vme_start);
+				VM_GET_FLAGS_ALIAS(flags, copy_vm_alias);
+				if (copy_vm_alias == 0) {
+					/*
+					 * Caller does not want a specific
+					 * alias for this new mapping:  use
+					 * the alias of the original mapping.
+					 */
+					copy_vm_alias = VME_ALIAS(copy_entry);
+				}
+
+				/* sanity check */
+				if ((copy_addr + copy_size) >
+				    (map_addr +
+				    named_entry->size /* XXX full size */)) {
+					/* over-mapping too much !? */
+					kr = KERN_INVALID_ARGUMENT;
+					/* abort */
+					break;
+				}
+
+				/* take a reference on the object */
+				if (copy_entry->is_sub_map) {
+					vmk_remap_flags.vmkf_submap = TRUE;
+					copy_submap = VME_SUBMAP(copy_entry);
+					vm_map_lock(copy_submap);
+					vm_map_reference(copy_submap);
+					vm_map_unlock(copy_submap);
+					copy_object = (vm_object_t)(uintptr_t) copy_submap;
+				} else if (!copy &&
+				    copy_object != VM_OBJECT_NULL &&
+				    (copy_entry->needs_copy ||
+				    copy_object->shadowed ||
+				    (!copy_object->true_share &&
+				    !copy_entry->is_shared &&
+				    copy_object->vo_size > copy_size))) {
+					/*
+					 * We need to resolve our side of this
+					 * "symmetric" copy-on-write now; we
+					 * need a new object to map and share,
+					 * instead of the current one which
+					 * might still be shared with the
+					 * original mapping.
+					 *
+					 * Note: A "vm_map_copy_t" does not
+					 * have a lock but we're protected by
+					 * the named entry's lock here.
+					 */
+					// assert(copy_object->copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC);
+					VME_OBJECT_SHADOW(copy_entry, copy_size);
+					if (!copy_entry->needs_copy &&
+					    copy_entry->protection & VM_PROT_WRITE) {
+						vm_prot_t prot;
+
+						prot = copy_entry->protection & ~VM_PROT_WRITE;
+						vm_object_pmap_protect(copy_object,
+						    copy_offset,
+						    copy_size,
+						    PMAP_NULL,
+						    0,
+						    prot);
 					}
-					/* did we have a change of type? */
-					if (!local_entry->is_sub_map)
-						continue;
-					entry = local_entry;
-					if (user_wire)
-						entry->user_wired_count++;
-					entry->wired_count++;
 
-					entry->in_transition = TRUE;
+					copy_entry->needs_copy = FALSE;
+					copy_entry->is_shared = TRUE;
+					copy_object = VME_OBJECT(copy_entry);
+					copy_offset = VME_OFFSET(copy_entry);
+					vm_object_lock(copy_object);
+					vm_object_reference_locked(copy_object);
+					if (copy_object->copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC) {
+						/* we're about to make a shared mapping of this object */
+						copy_object->copy_strategy = MEMORY_OBJECT_COPY_DELAY;
+						copy_object->true_share = TRUE;
+					}
+					vm_object_unlock(copy_object);
+				} else {
+					/*
+					 * We already have the right object
+					 * to map.
+					 */
+					copy_object = VME_OBJECT(copy_entry);
+					vm_object_reference(copy_object);
+				}
 
-					vm_map_unlock(map);
-					rc = vm_map_wire_nested(
-						entry->object.sub_map, 
-						sub_start, sub_end,
-						access_type, 
-						user_wire, pmap);
-					vm_map_lock(map);
-					last_timestamp = map->timestamp;
+				/* over-map the object into destination */
+				remap_flags |= flags;
+				remap_flags |= VM_FLAGS_FIXED;
+				remap_flags |= VM_FLAGS_OVERWRITE;
+				remap_flags &= ~VM_FLAGS_ANYWHERE;
+				if (!copy && !copy_entry->is_sub_map) {
+					/*
+					 * copy-on-write should have been
+					 * resolved at this point, or we would
+					 * end up sharing instead of copying.
+					 */
+					assert(!copy_entry->needs_copy);
+				}
+#if !CONFIG_EMBEDDED
+				if (copy_entry->used_for_jit) {
+					vmk_remap_flags.vmkf_map_jit = TRUE;
+				}
+#endif /* !CONFIG_EMBEDDED */
+				kr = vm_map_enter(target_map,
+				    &copy_addr,
+				    copy_size,
+				    (vm_map_offset_t) 0,
+				    remap_flags,
+				    vmk_remap_flags,
+				    copy_vm_alias,
+				    copy_object,
+				    copy_offset,
+				    ((copy_object == NULL) ? FALSE : copy),
+				    cur_protection,
+				    max_protection,
+				    inheritance);
+				if (kr != KERN_SUCCESS) {
+					if (copy_entry->is_sub_map) {
+						vm_map_deallocate(copy_submap);
+					} else {
+						vm_object_deallocate(copy_object);
+					}
+					/* abort */
+					break;
 				}
-			} else {
-				vm_map_unlock(map);
-				rc = vm_map_wire_nested(entry->object.sub_map, 
-						sub_start, sub_end,
-						access_type, 
-						user_wire, pmap);
-				vm_map_lock(map);
-				last_timestamp = map->timestamp;
-			}
-			s = entry->vme_start;
-			e = entry->vme_end;
-			if (last_timestamp+1 != map->timestamp) {
-			/*
-			 * Find the entry again.  It could have been clipped
-			 * after we unlocked the map.
-			 */
-		 	   	if (!vm_map_lookup_entry(map, local_end,
-							 &first_entry))
-					panic("vm_map_wire: re-lookup failed");
 
-		   		entry = first_entry;
+				/* next mapping */
+				copy_addr += copy_size;
 			}
 
-			last_timestamp = map->timestamp;
-			while ((entry != vm_map_to_entry(map)) &&
-		       		     (entry->vme_start < e)) {
-				assert(entry->in_transition);
-				entry->in_transition = FALSE;
-				if (entry->needs_wakeup) {
-					entry->needs_wakeup = FALSE;
-					need_wakeup = TRUE;
+			if (kr == KERN_SUCCESS) {
+				if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+				    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+					*address = map_addr + offset_in_mapping;
+				} else {
+					*address = map_addr;
 				}
-				if (rc != KERN_SUCCESS) {/* from vm_*_wire */
-				   if(main_map) {
-					if (user_wire)
-						entry->user_wired_count--;
-					entry->wired_count--;
-				   }
+
+				if (offset) {
+					/*
+					 * Trim in front, from 0 to "offset".
+					 */
+					vm_map_remove(target_map,
+					    map_addr,
+					    map_addr + offset,
+					    VM_MAP_REMOVE_NO_FLAGS);
+					*address += offset;
+				}
+				if (offset + map_size < named_entry->size) {
+					/*
+					 * Trim in back, from
+					 * "offset + map_size" to
+					 * "named_entry->size".
+					 */
+					vm_map_remove(target_map,
+					    (map_addr +
+					    offset + map_size),
+					    (map_addr +
+					    named_entry->size),
+					    VM_MAP_REMOVE_NO_FLAGS);
 				}
-				entry = entry->vme_next;
 			}
-			if (rc != KERN_SUCCESS) {	/* from vm_*_wire */
-				vm_map_unlock(map);
-				if (need_wakeup)
-					vm_map_entry_wakeup(map);
-				/*
-				 * undo everything upto the previous entry.
-				 */
-				(void)vm_map_unwire(map, start, s, user_wire);
-				return rc;
+			named_entry_unlock(named_entry);
+
+			if (kr != KERN_SUCCESS) {
+				if (!(flags & VM_FLAGS_OVERWRITE)) {
+					/* deallocate the contiguous range */
+					(void) vm_deallocate(target_map,
+					    map_addr,
+					    map_size);
+				}
 			}
-			continue;
-		}
 
-		/*
-		 * If this entry is already wired then increment
-		 * the appropriate wire reference count.
-		 */
-		if (entry->wired_count && main_map) {
-			/* sanity check: wired_count is a short */
-			if (entry->wired_count >= MAX_WIRE_COUNT)
-				panic("vm_map_wire: too many wirings");
+			return kr;
+		} else {
+			unsigned int    access;
+			vm_prot_t       protections;
+			unsigned int    wimg_mode;
 
-			if (user_wire &&
-			    entry->user_wired_count >= MAX_WIRE_COUNT) {
-				vm_map_unlock(map);
-				vm_map_unwire(map, start,
-						entry->vme_start, user_wire);
-				return(KERN_FAILURE);
+			/* we are mapping a VM object */
+
+			protections = named_entry->protection & VM_PROT_ALL;
+			access = GET_MAP_MEM(named_entry->protection);
+
+			if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+			    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+				offset_in_mapping = offset - vm_object_trunc_page(offset);
+				if (flags & VM_FLAGS_RETURN_4K_DATA_ADDR) {
+					offset_in_mapping &= ~((signed)(0xFFF));
+				}
+				offset = vm_object_trunc_page(offset);
+				map_size = vm_object_round_page(offset + offset_in_mapping + initial_size) - offset;
 			}
-			/*
-			 * entry is already wired down, get our reference
-			 * after clipping to our range.
-			 */
-			vm_map_clip_start(map, entry, start);
-			vm_map_clip_end(map, entry, end);
-			if (!user_wire || (entry->user_wired_count++ == 0))
-				entry->wired_count++;
 
-			entry = entry->vme_next;
-			continue;
-		}
+			object = named_entry->backing.object;
+			assert(object != VM_OBJECT_NULL);
+			vm_object_lock(object);
+			named_entry_unlock(named_entry);
 
-		/*
-		 * Unwired entry or wire request transmitted via submap
-		 */
+			vm_object_reference_locked(object);
 
+			wimg_mode = object->wimg_bits;
+			vm_prot_to_wimg(access, &wimg_mode);
+			if (object->wimg_bits != wimg_mode) {
+				vm_object_change_wimg_mode(object, wimg_mode);
+			}
 
+			vm_object_unlock(object);
+		}
+	} else if (ip_kotype(port) == IKOT_MEMORY_OBJECT) {
 		/*
-		 * Perform actions of vm_map_lookup that need the write
-		 * lock on the map: create a shadow object for a
-		 * copy-on-write region, or an object for a zero-fill
-		 * region.
-		 */
-		size = entry->vme_end - entry->vme_start;
-		/*
-		 * If wiring a copy-on-write page, we need to copy it now
-		 * even if we're only (currently) requesting read access.
-		 * This is aggressive, but once it's wired we can't move it.
+		 * JMM - This is temporary until we unify named entries
+		 * and raw memory objects.
+		 *
+		 * Detected fake ip_kotype for a memory object.  In
+		 * this case, the port isn't really a port at all, but
+		 * instead is just a raw memory object.
 		 */
-		if (entry->needs_copy) {
-			vm_object_shadow(&entry->object.vm_object,
-					 &entry->offset, size);
-			entry->needs_copy = FALSE;
-		} else if (entry->object.vm_object == VM_OBJECT_NULL) {
-			entry->object.vm_object = vm_object_allocate(size);
-			entry->offset = (vm_object_offset_t)0;
+		if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+		    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+			panic("VM_FLAGS_RETURN_DATA_ADDR not expected for raw memory object.");
 		}
 
-		vm_map_clip_start(map, entry, start);
-		vm_map_clip_end(map, entry, end);
+		object = memory_object_to_vm_object((memory_object_t)port);
+		if (object == VM_OBJECT_NULL) {
+			return KERN_INVALID_OBJECT;
+		}
+		vm_object_reference(object);
+
+		/* wait for object (if any) to be ready */
+		if (object != VM_OBJECT_NULL) {
+			if (object == kernel_object) {
+				printf("Warning: Attempt to map kernel object"
+				    " by a non-private kernel entity\n");
+				return KERN_INVALID_OBJECT;
+			}
+			if (!object->pager_ready) {
+				vm_object_lock(object);
 
-		s = entry->vme_start;
-		e = entry->vme_end;
+				while (!object->pager_ready) {
+					vm_object_wait(object,
+					    VM_OBJECT_EVENT_PAGER_READY,
+					    THREAD_UNINT);
+					vm_object_lock(object);
+				}
+				vm_object_unlock(object);
+			}
+		}
+	} else {
+		return KERN_INVALID_OBJECT;
+	}
+
+	if (object != VM_OBJECT_NULL &&
+	    object->named &&
+	    object->pager != MEMORY_OBJECT_NULL &&
+	    object->copy_strategy != MEMORY_OBJECT_COPY_NONE) {
+		memory_object_t pager;
+		vm_prot_t       pager_prot;
+		kern_return_t   kr;
 
 		/*
-		 * Check for holes and protection mismatch.
-		 * Holes: Next entry should be contiguous unless this
-		 *	  is the end of the region.
-		 * Protection: Access requested must be allowed, unless
-		 *	wiring is by protection class
+		 * For "named" VM objects, let the pager know that the
+		 * memory object is being mapped.  Some pagers need to keep
+		 * track of this, to know when they can reclaim the memory
+		 * object, for example.
+		 * VM calls memory_object_map() for each mapping (specifying
+		 * the protection of each mapping) and calls
+		 * memory_object_last_unmap() when all the mappings are gone.
 		 */
-		if ((((entry->vme_end < end) &&
-		     ((entry->vme_next == vm_map_to_entry(map)) ||
-		      (entry->vme_next->vme_start > entry->vme_end))) ||
-		     ((entry->protection & access_type) != access_type))) {
+		pager_prot = max_protection;
+		if (copy) {
 			/*
-			 * Found a hole or protection problem.
-			 * Unwire the region we wired so far.
+			 * Copy-On-Write mapping: won't modify the
+			 * memory object.
 			 */
-			if (start != entry->vme_start) {
-				vm_map_unlock(map);
-				vm_map_unwire(map, start, s, user_wire);
-			} else {
-				vm_map_unlock(map);
-			}
-			return((entry->protection&access_type) != access_type?
-				KERN_PROTECTION_FAILURE: KERN_INVALID_ADDRESS);
+			pager_prot &= ~VM_PROT_WRITE;
 		}
+		vm_object_lock(object);
+		pager = object->pager;
+		if (object->named &&
+		    pager != MEMORY_OBJECT_NULL &&
+		    object->copy_strategy != MEMORY_OBJECT_COPY_NONE) {
+			assert(object->pager_ready);
+			vm_object_mapping_wait(object, THREAD_UNINT);
+			vm_object_mapping_begin(object);
+			vm_object_unlock(object);
 
-		assert(entry->wired_count == 0 && entry->user_wired_count == 0);
+			kr = memory_object_map(pager, pager_prot);
+			assert(kr == KERN_SUCCESS);
 
-		if(main_map) {
-			if (user_wire)
-				entry->user_wired_count++;
-			entry->wired_count++;
+			vm_object_lock(object);
+			vm_object_mapping_end(object);
 		}
+		vm_object_unlock(object);
+	}
 
-		entry->in_transition = TRUE;
-
-		/*
-		 * This entry might get split once we unlock the map.
-		 * In vm_fault_wire(), we need the current range as
-		 * defined by this entry.  In order for this to work
-		 * along with a simultaneous clip operation, we make a
-		 * temporary copy of this entry and use that for the
-		 * wiring.  Note that the underlying objects do not
-		 * change during a clip.
-		 */
-		tmp_entry = *entry;
+	/*
+	 *	Perform the copy if requested
+	 */
 
-		/*
-		 * The in_transition state guarentees that the entry
-		 * (or entries for this range, if split occured) will be
-		 * there when the map lock is acquired for the second time.
-		 */
-		vm_map_unlock(map);
+	if (copy) {
+		vm_object_t             new_object;
+		vm_object_offset_t      new_offset;
 
-		if (!user_wire && cur_thread != THREAD_NULL) {
-			interruptible_state = cur_thread->interruptible;
-			cur_thread->interruptible = FALSE;
-		}
-		  
-		if(map_pmap)
-			rc = vm_fault_wire(map, &tmp_entry, map_pmap);
-		else
-			rc = vm_fault_wire(map, &tmp_entry, map->pmap);
+		result = vm_object_copy_strategically(object, offset,
+		    map_size,
+		    &new_object, &new_offset,
+		    &copy);
 
-		if (!user_wire && cur_thread != THREAD_NULL)
-			cur_thread->interruptible = interruptible_state;
 
-		vm_map_lock(map);
+		if (result == KERN_MEMORY_RESTART_COPY) {
+			boolean_t success;
+			boolean_t src_needs_copy;
 
-		if (last_timestamp+1 != map->timestamp) {
 			/*
-			 * Find the entry again.  It could have been clipped
-			 * after we unlocked the map.
+			 * XXX
+			 * We currently ignore src_needs_copy.
+			 * This really is the issue of how to make
+			 * MEMORY_OBJECT_COPY_SYMMETRIC safe for
+			 * non-kernel users to use. Solution forthcoming.
+			 * In the meantime, since we don't allow non-kernel
+			 * memory managers to specify symmetric copy,
+			 * we won't run into problems here.
 			 */
-			if (!vm_map_lookup_entry(map, tmp_entry.vme_start,
-								&first_entry))
-				panic("vm_map_wire: re-lookup failed");
-
-			entry = first_entry;
+			new_object = object;
+			new_offset = offset;
+			success = vm_object_copy_quickly(&new_object,
+			    new_offset,
+			    map_size,
+			    &src_needs_copy,
+			    &copy);
+			assert(success);
+			result = KERN_SUCCESS;
 		}
+		/*
+		 *	Throw away the reference to the
+		 *	original object, as it won't be mapped.
+		 */
 
-		last_timestamp = map->timestamp;
+		vm_object_deallocate(object);
 
-		while ((entry != vm_map_to_entry(map)) &&
-		       (entry->vme_start < tmp_entry.vme_end)) {
-			assert(entry->in_transition);
-			entry->in_transition = FALSE;
-			if (entry->needs_wakeup) {
-				entry->needs_wakeup = FALSE;
-				need_wakeup = TRUE;
-			}
-			if (rc != KERN_SUCCESS) {	/* from vm_*_wire */
-				if(main_map) {
-					if (user_wire)
-						entry->user_wired_count--;
-					entry->wired_count--;
-				}
-			}
-			entry = entry->vme_next;
+		if (result != KERN_SUCCESS) {
+			return result;
 		}
 
-		if (rc != KERN_SUCCESS) {		/* from vm_*_wire */
-			vm_map_unlock(map);
-			if (need_wakeup)
-				vm_map_entry_wakeup(map);
-			/*
-			 * undo everything upto the previous entry.
-			 */
-			(void)vm_map_unwire(map, start, s, user_wire);
-			return rc;
-		}
-	} /* end while loop through map entries */
-	vm_map_unlock(map);
+		object = new_object;
+		offset = new_offset;
+	}
 
 	/*
-	 * wake up anybody waiting on entries we wired.
+	 * If non-kernel users want to try to prefault pages, the mapping and prefault
+	 * need to be atomic.
 	 */
-	if (need_wakeup)
-		vm_map_entry_wakeup(map);
+	kernel_prefault = (try_prefault && vm_kernel_map_is_kernel(target_map));
+	vmk_flags.vmkf_keep_map_locked = (try_prefault && !kernel_prefault);
+
+#if __arm64__
+	if (fourk) {
+		/* map this object in a "4K" pager */
+		result = vm_map_enter_fourk(target_map,
+		    &map_addr,
+		    map_size,
+		    (vm_map_offset_t) mask,
+		    flags,
+		    vmk_flags,
+		    tag,
+		    object,
+		    offset,
+		    copy,
+		    cur_protection,
+		    max_protection,
+		    inheritance);
+	} else
+#endif /* __arm64__ */
+	{
+		result = vm_map_enter(target_map,
+		    &map_addr, map_size,
+		    (vm_map_offset_t)mask,
+		    flags,
+		    vmk_flags,
+		    tag,
+		    object, offset,
+		    copy,
+		    cur_protection, max_protection,
+		    inheritance);
+	}
+	if (result != KERN_SUCCESS) {
+		vm_object_deallocate(object);
+	}
+
+	/*
+	 * Try to prefault, and do not forget to release the vm map lock.
+	 */
+	if (result == KERN_SUCCESS && try_prefault) {
+		mach_vm_address_t va = map_addr;
+		kern_return_t kr = KERN_SUCCESS;
+		unsigned int i = 0;
+		int pmap_options;
+
+		pmap_options = kernel_prefault ? 0 : PMAP_OPTIONS_NOWAIT;
+		if (object->internal) {
+			pmap_options |= PMAP_OPTIONS_INTERNAL;
+		}
+
+		for (i = 0; i < page_list_count; ++i) {
+			if (!UPL_VALID_PAGE(page_list, i)) {
+				if (kernel_prefault) {
+					assertf(FALSE, "kernel_prefault && !UPL_VALID_PAGE");
+					result = KERN_MEMORY_ERROR;
+					break;
+				}
+			} else {
+				/*
+				 * If this function call failed, we should stop
+				 * trying to optimize, other calls are likely
+				 * going to fail too.
+				 *
+				 * We are not going to report an error for such
+				 * failure though. That's an optimization, not
+				 * something critical.
+				 */
+				kr = pmap_enter_options(target_map->pmap,
+				    va, UPL_PHYS_PAGE(page_list, i),
+				    cur_protection, VM_PROT_NONE,
+				    0, TRUE, pmap_options, NULL);
+				if (kr != KERN_SUCCESS) {
+					OSIncrementAtomic64(&vm_prefault_nb_bailout);
+					if (kernel_prefault) {
+						result = kr;
+					}
+					break;
+				}
+				OSIncrementAtomic64(&vm_prefault_nb_pages);
+			}
 
-	return(KERN_SUCCESS);
+			/* Next virtual address */
+			va += PAGE_SIZE;
+		}
+		if (vmk_flags.vmkf_keep_map_locked) {
+			vm_map_unlock(target_map);
+		}
+	}
 
+	if (flags & (VM_FLAGS_RETURN_DATA_ADDR |
+	    VM_FLAGS_RETURN_4K_DATA_ADDR)) {
+		*address = map_addr + offset_in_mapping;
+	} else {
+		*address = map_addr;
+	}
+	return result;
 }
 
 kern_return_t
-vm_map_wire(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	register vm_prot_t	access_type,
-	boolean_t		user_wire)
-{
-
-	kern_return_t	kret;
-
-#ifdef ppc
-        /*
-	 * the calls to mapping_prealloc and mapping_relpre
-	 * (along with the VM_MAP_RANGE_CHECK to insure a
-	 * resonable range was passed in) are
-	 * currently necessary because
-	 * we haven't enabled kernel pre-emption
-	 * and/or the pmap_enter cannot purge and re-use
-	 * existing mappings
-	 */
-	VM_MAP_RANGE_CHECK(map, start, end);
-        mapping_prealloc(end - start);
-#endif
-	kret = vm_map_wire_nested(map, start, end, access_type, 
-						user_wire, (pmap_t)NULL);
-#ifdef ppc
-	mapping_relpre();
+vm_map_enter_mem_object(
+	vm_map_t                target_map,
+	vm_map_offset_t         *address,
+	vm_map_size_t           initial_size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	ipc_port_t              port,
+	vm_object_offset_t      offset,
+	boolean_t               copy,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_inherit_t            inheritance)
+{
+	kern_return_t ret;
+	/* Thin wrapper: forward every caller argument unchanged to vm_map_enter_mem_object_helper(), supplying no page list (NULL, 0). */
+	ret = vm_map_enter_mem_object_helper(target_map,
+	    address,
+	    initial_size,
+	    mask,
+	    flags,
+	    vmk_flags,
+	    tag,
+	    port,
+	    offset,
+	    copy,
+	    cur_protection,
+	    max_protection,
+	    inheritance,
+	    NULL,                /* slot where vm_map_enter_mem_object_prefault() passes page_list */
+	    0);                  /* slot where vm_map_enter_mem_object_prefault() passes page_list_count */
+	/* KASAN builds only: on success, with a non-NULL address and a target map using kernel_pmap, hand *address and initial_size to kasan_notify_address(). */
+#if KASAN
+	if (ret == KERN_SUCCESS && address && target_map->pmap == kernel_pmap) {
+		kasan_notify_address(*address, initial_size);
+	}
 #endif
-	return kret;
+
+	return ret;              /* the helper's return code, unmodified */
 }
 
-/*
- *	vm_map_unwire:
- *
- *	Sets the pageability of the specified address range in the target
- *	as pageable.  Regions specified must have been wired previously.
- *
- *	The map must not be locked, but a reference must remain to the map
- *	throughout the call.
- *
- *	Kernel will panic on failures.  User unwire ignores holes and
- *	unwired and intransition entries to avoid losing memory by leaving
- *	it unwired.
- */
 kern_return_t
-vm_map_unwire_nested(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	boolean_t		user_wire,
-	pmap_t			map_pmap)
-{
-	register vm_map_entry_t	entry;
-	struct vm_map_entry	*first_entry, tmp_entry;
-	boolean_t		need_wakeup;
-	boolean_t		main_map = FALSE;
-	unsigned int		last_timestamp;
+vm_map_enter_mem_object_prefault(
+	vm_map_t                target_map,
+	vm_map_offset_t         *address,
+	vm_map_size_t           initial_size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	ipc_port_t              port,
+	vm_object_offset_t      offset,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	upl_page_list_ptr_t     page_list,
+	unsigned int            page_list_count)
+{
+	kern_return_t ret;
+	/* Same helper call as vm_map_enter_mem_object(), but with the caller's page list; this entry point has no copy/inheritance parameters, so fixed values are passed for them. */
+	ret = vm_map_enter_mem_object_helper(target_map,
+	    address,
+	    initial_size,
+	    mask,
+	    flags,
+	    vmk_flags,
+	    tag,
+	    port,
+	    offset,
+	    FALSE,               /* copy */
+	    cur_protection,
+	    max_protection,
+	    VM_INHERIT_DEFAULT,  /* inheritance */
+	    page_list,
+	    page_list_count);
+	/* KASAN builds only: on success, with a non-NULL address and a target map using kernel_pmap, hand *address and initial_size to kasan_notify_address(). */
+#if KASAN
+	if (ret == KERN_SUCCESS && address && target_map->pmap == kernel_pmap) {
+		kasan_notify_address(*address, initial_size);
+	}
+#endif
 
-	vm_map_lock(map);
-	if(map_pmap == NULL)
-		main_map = TRUE;
-	last_timestamp = map->timestamp;
+	return ret;              /* the helper's return code, unmodified */
+}
 
-	VM_MAP_RANGE_CHECK(map, start, end);
-	assert(page_aligned(start));
-	assert(page_aligned(end));
 
-	if (vm_map_lookup_entry(map, start, &first_entry)) {
-		entry = first_entry;
-		/*	vm_map_clip_start will be done later. */
-	}
-	else {
-		/*	Start address is not in map. */
-		vm_map_unlock(map);
-		return(KERN_INVALID_ADDRESS);
+kern_return_t
+vm_map_enter_mem_object_control(
+	vm_map_t                target_map,
+	vm_map_offset_t         *address,
+	vm_map_size_t           initial_size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	memory_object_control_t control,
+	vm_object_offset_t      offset,
+	boolean_t               copy,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_inherit_t            inheritance)
+{
+	vm_map_address_t        map_addr;
+	vm_map_size_t           map_size;
+	vm_object_t             object;
+	vm_object_size_t        size;
+	kern_return_t           result;
+	memory_object_t         pager;
+	vm_prot_t               pager_prot;
+	kern_return_t           kr;
+#if __arm64__
+	boolean_t               fourk = vmk_flags.vmkf_fourk;
+#endif /* __arm64__ */
+
+	/*
+	 * Check arguments for validity
+	 */
+	if ((target_map == VM_MAP_NULL) ||
+	    (cur_protection & ~VM_PROT_ALL) ||
+	    (max_protection & ~VM_PROT_ALL) ||
+	    (inheritance > VM_INHERIT_LAST_VALID) ||
+	    initial_size == 0) {
+		return KERN_INVALID_ARGUMENT;
 	}
 
-	need_wakeup = FALSE;
-	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
-		if (entry->in_transition) {
-			/*
-			 * 1)
-			 * Another thread is wiring down this entry. Note
-			 * that if it is not for the other thread we would
-			 * be unwiring an unwired entry.  This is not
-			 * permitted.  If we wait, we will be unwiring memory
-			 * we did not wire.
-			 *
-			 * 2)
-			 * Another thread is unwiring this entry.  We did not
-			 * have a reference to it, because if we did, this
-			 * entry will not be getting unwired now.
-			 */
-			if (!user_wire)
-				panic("vm_map_unwire: in_transition entry");
+#if __arm64__
+	if (fourk) {
+		map_addr = vm_map_trunc_page(*address,
+		    FOURK_PAGE_MASK);
+		map_size = vm_map_round_page(initial_size,
+		    FOURK_PAGE_MASK);
+	} else
+#endif /* __arm64__ */
+	{
+		map_addr = vm_map_trunc_page(*address,
+		    VM_MAP_PAGE_MASK(target_map));
+		map_size = vm_map_round_page(initial_size,
+		    VM_MAP_PAGE_MASK(target_map));
+	}
+	size = vm_object_round_page(initial_size);
 
-			entry = entry->vme_next;
-			continue;
-		}
+	object = memory_object_control_to_vm_object(control);
 
-		if(entry->is_sub_map) {
-			vm_offset_t	sub_start;
-			vm_offset_t	sub_end;
-			vm_offset_t	local_end;
-			pmap_t		pmap;
-			
+	if (object == VM_OBJECT_NULL) {
+		return KERN_INVALID_OBJECT;
+	}
 
-			vm_map_clip_start(map, entry, start);
-			vm_map_clip_end(map, entry, end);
+	if (object == kernel_object) {
+		printf("Warning: Attempt to map kernel object"
+		    " by a non-private kernel entity\n");
+		return KERN_INVALID_OBJECT;
+	}
 
-			sub_start = entry->offset;
-			sub_end = entry->vme_end - entry->vme_start;
-			sub_end += entry->offset;
-			local_end = entry->vme_end;
-			if(map_pmap == NULL) {
-			   if(entry->use_pmap) {
-					pmap = entry->object.sub_map->pmap;
-			   } else {
-					pmap = map->pmap;
-			   }
-			   if (entry->wired_count == 0 ||
-		   	       (user_wire && entry->user_wired_count == 0)) {
-				if (!user_wire)
-				   panic("vm_map_unwire: entry is unwired");
-			      entry = entry->vme_next;
-			      continue;
-			   }
-
-			   /*
-		 	    * Check for holes
-		 	    * Holes: Next entry should be contiguous unless
-		 	    * this is the end of the region.
-		 	    */
-			   if (((entry->vme_end < end) && 
-		    		((entry->vme_next == vm_map_to_entry(map)) ||
-		     		(entry->vme_next->vme_start 
-						> entry->vme_end)))) {
-				if (!user_wire)
-				  panic("vm_map_unwire: non-contiguous region");
-/*
-				entry = entry->vme_next;
-				continue;
-*/
-			   }
+	vm_object_lock(object);
+	object->ref_count++;
+	vm_object_res_reference(object);
 
-			   if (!user_wire || (--entry->user_wired_count == 0))
-				entry->wired_count--;
+	/*
+	 * For "named" VM objects, let the pager know that the
+	 * memory object is being mapped.  Some pagers need to keep
+	 * track of this, to know when they can reclaim the memory
+	 * object, for example.
+	 * VM calls memory_object_map() for each mapping (specifying
+	 * the protection of each mapping) and calls
+	 * memory_object_last_unmap() when all the mappings are gone.
+	 */
+	pager_prot = max_protection;
+	if (copy) {
+		pager_prot &= ~VM_PROT_WRITE;
+	}
+	pager = object->pager;
+	if (object->named &&
+	    pager != MEMORY_OBJECT_NULL &&
+	    object->copy_strategy != MEMORY_OBJECT_COPY_NONE) {
+		assert(object->pager_ready);
+		vm_object_mapping_wait(object, THREAD_UNINT);
+		vm_object_mapping_begin(object);
+		vm_object_unlock(object);
 
-			   if (entry->wired_count != 0) {
-				entry = entry->vme_next;
-				continue;
-			   }
+		kr = memory_object_map(pager, pager_prot);
+		assert(kr == KERN_SUCCESS);
 
-			   entry->in_transition = TRUE;
-			   tmp_entry = *entry;/* see comment in vm_map_wire() */
+		vm_object_lock(object);
+		vm_object_mapping_end(object);
+	}
+	vm_object_unlock(object);
 
-			   /*
-		 	    * We can unlock the map now. The in_transition state
-		 	    * guarantees existance of the entry.
-		 	    */
-			   vm_map_unlock(map);
-			   vm_map_unwire_nested(entry->object.sub_map, 
-					sub_start, sub_end, user_wire, pmap);
-			   vm_map_lock(map);
+	/*
+	 *	Perform the copy if requested
+	 */
 
-			   if (last_timestamp+1 != map->timestamp) {
-				/*
-				 * Find the entry again.  It could have been 
-				 * clipped or deleted after we unlocked the map.
-			 	 */
-				if (!vm_map_lookup_entry(map, 
-						tmp_entry.vme_start,
-							&first_entry)) {
-					if (!user_wire)
-				          panic("vm_map_unwire: re-lookup failed");
-					entry = first_entry->vme_next;
-				} else
-					entry = first_entry;
-			   }
-			   last_timestamp = map->timestamp;
-
-			   /*
-		 	    * clear transition bit for all constituent entries
-		 	    * that were in the original entry (saved in 
-			    * tmp_entry).  Also check for waiters.
-		 	    */
-			   while ((entry != vm_map_to_entry(map)) &&
-		       		(entry->vme_start < tmp_entry.vme_end)) {
-				assert(entry->in_transition);
-				entry->in_transition = FALSE;
-				if (entry->needs_wakeup) {
-					entry->needs_wakeup = FALSE;
-					need_wakeup = TRUE;
-				}
-				entry = entry->vme_next;
-			   }
-			   continue;
-			} else {
-			   vm_map_unlock(map);
-			   vm_map_unwire_nested(entry->object.sub_map, 
-					sub_start, sub_end, user_wire, pmap);
-			   vm_map_lock(map);
+	if (copy) {
+		vm_object_t             new_object;
+		vm_object_offset_t      new_offset;
 
-			   if (last_timestamp+1 != map->timestamp) {
-				/*
-				 * Find the entry again.  It could have been 
-				 * clipped or deleted after we unlocked the map.
-			 	 */
-				if (!vm_map_lookup_entry(map, 
-						tmp_entry.vme_start,
-							&first_entry)) {
-					if (!user_wire)
-				          panic("vm_map_unwire: re-lookup failed");
-					entry = first_entry->vme_next;
-				} else
-					entry = first_entry;
-			   }
-			   last_timestamp = map->timestamp;
-			}
-		}
+		result = vm_object_copy_strategically(object, offset, size,
+		    &new_object, &new_offset,
+		    &copy);
 
 
-		if (main_map && (entry->wired_count == 0 ||
-		   (user_wire && entry->user_wired_count == 0))) {
-			if (!user_wire)
-				panic("vm_map_unwire: entry is unwired");
+		if (result == KERN_MEMORY_RESTART_COPY) {
+			boolean_t success;
+			boolean_t src_needs_copy;
 
-			entry = entry->vme_next;
-			continue;
+			/*
+			 * XXX
+			 * We currently ignore src_needs_copy.
+			 * This really is the issue of how to make
+			 * MEMORY_OBJECT_COPY_SYMMETRIC safe for
+			 * non-kernel users to use. Solution forthcoming.
+			 * In the meantime, since we don't allow non-kernel
+			 * memory managers to specify symmetric copy,
+			 * we won't run into problems here.
+			 */
+			new_object = object;
+			new_offset = offset;
+			success = vm_object_copy_quickly(&new_object,
+			    new_offset, size,
+			    &src_needs_copy,
+			    &copy);
+			assert(success);
+			result = KERN_SUCCESS;
 		}
-		
-		assert(entry->wired_count > 0 &&
-			(!user_wire || entry->user_wired_count > 0));
-
-		vm_map_clip_start(map, entry, start);
-		vm_map_clip_end(map, entry, end);
-
 		/*
-		 * Check for holes
-		 * Holes: Next entry should be contiguous unless
-		 *	  this is the end of the region.
+		 *	Throw away the reference to the
+		 *	original object, as it won't be mapped.
 		 */
-		if (((entry->vme_end < end) && 
-		    ((entry->vme_next == vm_map_to_entry(map)) ||
-		     (entry->vme_next->vme_start > entry->vme_end)))) {
 
-			if (!user_wire)
-				panic("vm_map_unwire: non-contiguous region");
-			entry = entry->vme_next;
-			continue;
-		}
-
-		if(main_map) {
-		   if (!user_wire || (--entry->user_wired_count == 0))
-			entry->wired_count--;
-
-		   if (entry->wired_count != 0) {
-			entry = entry->vme_next;
-			continue;
-		   }
-		}
-
-		entry->in_transition = TRUE;
-		tmp_entry = *entry;	/* see comment in vm_map_wire() */
+		vm_object_deallocate(object);
 
-		/*
-		 * We can unlock the map now. The in_transition state
-		 * guarantees existance of the entry.
-		 */
-		vm_map_unlock(map);
-		if(map_pmap) {
-			vm_fault_unwire(map, &tmp_entry, FALSE, map_pmap);
-		} else {
-			vm_fault_unwire(map, &tmp_entry, FALSE, map->pmap);
+		if (result != KERN_SUCCESS) {
+			return result;
 		}
-		vm_map_lock(map);
 
-		if (last_timestamp+1 != map->timestamp) {
-			/*
-			 * Find the entry again.  It could have been clipped
-			 * or deleted after we unlocked the map.
-			 */
-			if (!vm_map_lookup_entry(map, tmp_entry.vme_start,
-								&first_entry)) {
-				if (!user_wire)
-				       panic("vm_map_unwire: re-lookup failed");
-				entry = first_entry->vme_next;
-			} else
-				entry = first_entry;
-		}
-		last_timestamp = map->timestamp;
+		object = new_object;
+		offset = new_offset;
+	}
 
-		/*
-		 * clear transition bit for all constituent entries that
-		 * were in the original entry (saved in tmp_entry).  Also
-		 * check for waiters.
-		 */
-		while ((entry != vm_map_to_entry(map)) &&
-		       (entry->vme_start < tmp_entry.vme_end)) {
-			assert(entry->in_transition);
-			entry->in_transition = FALSE;
-			if (entry->needs_wakeup) {
-				entry->needs_wakeup = FALSE;
-				need_wakeup = TRUE;
-			}
-			entry = entry->vme_next;
-		}
+#if __arm64__
+	if (fourk) {
+		result = vm_map_enter_fourk(target_map,
+		    &map_addr,
+		    map_size,
+		    (vm_map_offset_t)mask,
+		    flags,
+		    vmk_flags,
+		    tag,
+		    object, offset,
+		    copy,
+		    cur_protection, max_protection,
+		    inheritance);
+	} else
+#endif /* __arm64__ */
+	{
+		result = vm_map_enter(target_map,
+		    &map_addr, map_size,
+		    (vm_map_offset_t)mask,
+		    flags,
+		    vmk_flags,
+		    tag,
+		    object, offset,
+		    copy,
+		    cur_protection, max_protection,
+		    inheritance);
 	}
-	vm_map_unlock(map);
-	/*
-	 * wake up anybody waiting on entries that we have unwired.
-	 */
-	if (need_wakeup)
-		vm_map_entry_wakeup(map);
-	return(KERN_SUCCESS);
+	if (result != KERN_SUCCESS) {
+		vm_object_deallocate(object);
+	}
+	*address = map_addr;
 
+	return result;
 }
 
-kern_return_t
-vm_map_unwire(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	boolean_t		user_wire)
-{
-	return vm_map_unwire_nested(map, start, end, user_wire, (pmap_t)NULL);
-}
 
+#if     VM_CPM
+
+#ifdef MACH_ASSERT
+extern pmap_paddr_t     avail_start, avail_end;
+#endif
 
 /*
- *	vm_map_entry_delete:	[ internal use only ]
+ *	Allocate memory in the specified map, with the caveat that
+ *	the memory is physically contiguous.  This call may fail
+ *	if the system can't find sufficient contiguous memory.
+ *	This call may cause or lead to heart-stopping amounts of
+ *	paging activity.
  *
- *	Deallocate the given entry from the target map.
- */		
-void
-vm_map_entry_delete(
-	register vm_map_t	map,
-	register vm_map_entry_t	entry)
+ *	Memory obtained from this call should be freed in the
+ *	normal way, viz., via vm_deallocate.
+ */
+kern_return_t
+vm_map_enter_cpm(
+	vm_map_t                map,
+	vm_map_offset_t *addr,
+	vm_map_size_t           size,
+	int                     flags)
 {
-	register vm_offset_t	s, e;
-	register vm_object_t	object;
-	register vm_map_t	submap;
-	extern vm_object_t	kernel_object;
+	vm_object_t             cpm_obj;
+	pmap_t                  pmap;
+	vm_page_t               m, pages;
+	kern_return_t           kr;
+	vm_map_offset_t         va, start, end, offset;
+#if     MACH_ASSERT
+	vm_map_offset_t         prev_addr = 0;
+#endif  /* MACH_ASSERT */
 
-	s = entry->vme_start;
-	e = entry->vme_end;
-	assert(page_aligned(s));
-	assert(page_aligned(e));
-	assert(entry->wired_count == 0);
-	assert(entry->user_wired_count == 0);
+	boolean_t               anywhere = ((VM_FLAGS_ANYWHERE & flags) != 0);
+	vm_tag_t tag;
 
-	if (entry->is_sub_map) {
-		object = NULL;
-		submap = entry->object.sub_map;
+	VM_GET_FLAGS_ALIAS(flags, tag);
+
+	if (size == 0) {
+		*addr = 0;
+		return KERN_SUCCESS;
+	}
+	if (anywhere) {
+		*addr = vm_map_min(map);
 	} else {
-		submap = NULL;
-		object = entry->object.vm_object;
+		*addr = vm_map_trunc_page(*addr,
+		    VM_MAP_PAGE_MASK(map));
 	}
+	size = vm_map_round_page(size,
+	    VM_MAP_PAGE_MASK(map));
 
-	vm_map_entry_unlink(map, entry);
-	map->size -= e - s;
+	/*
+	 * LP64todo - cpm_allocate should probably allow
+	 * allocations of >4GB, but not with the current
+	 * algorithm, so just cast down the size for now.
+	 */
+	if (size > VM_MAX_ADDRESS) {
+		return KERN_RESOURCE_SHORTAGE;
+	}
+	if ((kr = cpm_allocate(CAST_DOWN(vm_size_t, size),
+	    &pages, 0, 0, TRUE, flags)) != KERN_SUCCESS) {
+		return kr;
+	}
 
-	vm_map_entry_dispose(map, entry);
+	cpm_obj = vm_object_allocate((vm_object_size_t)size);
+	assert(cpm_obj != VM_OBJECT_NULL);
+	assert(cpm_obj->internal);
+	assert(cpm_obj->vo_size == (vm_object_size_t)size);
+	assert(cpm_obj->can_persist == FALSE);
+	assert(cpm_obj->pager_created == FALSE);
+	assert(cpm_obj->pageout == FALSE);
+	assert(cpm_obj->shadow == VM_OBJECT_NULL);
 
-	vm_map_unlock(map);
 	/*
-	 *	Deallocate the object only after removing all
-	 *	pmap entries pointing to its pages.
+	 *	Insert pages into object.
 	 */
-	if (submap)
-		vm_map_deallocate(submap);
-	else
-	 	vm_object_deallocate(object);
 
-}
+	vm_object_lock(cpm_obj);
+	for (offset = 0; offset < size; offset += PAGE_SIZE) {
+		m = pages;
+		pages = NEXT_PAGE(m);
+		*(NEXT_PAGE_PTR(m)) = VM_PAGE_NULL;
+
+		assert(!m->vmp_gobbled);
+		assert(!m->vmp_wanted);
+		assert(!m->vmp_pageout);
+		assert(!m->vmp_tabled);
+		assert(VM_PAGE_WIRED(m));
+		assert(m->vmp_busy);
+		assert(VM_PAGE_GET_PHYS_PAGE(m) >= (avail_start >> PAGE_SHIFT) && VM_PAGE_GET_PHYS_PAGE(m) <= (avail_end >> PAGE_SHIFT));
+
+		m->vmp_busy = FALSE;
+		vm_page_insert(m, cpm_obj, offset);
+	}
+	assert(cpm_obj->resident_page_count == size / PAGE_SIZE);
+	vm_object_unlock(cpm_obj);
 
-void
-vm_map_submap_pmap_clean(
-	vm_map_t	map,
-	vm_offset_t	start,
-	vm_offset_t	end,
-	vm_map_t	sub_map,
-	vm_offset_t	offset)
-{
-	vm_offset_t	submap_start;
-	vm_offset_t	submap_end;
-	vm_offset_t	addr;
-	vm_size_t	remove_size;
-	vm_map_entry_t	entry;
+	/*
+	 *	Hang onto a reference on the object in case a
+	 *	multi-threaded application for some reason decides
+	 *	to deallocate the portion of the address space into
+	 *	which we will insert this object.
+	 *
+	 *	Unfortunately, we must insert the object now before
+	 *	we can talk to the pmap module about which addresses
+	 *	must be wired down.  Hence, the race with a multi-
+	 *	threaded app.
+	 */
+	vm_object_reference(cpm_obj);
 
-	submap_end = offset + (end - start);
-	submap_start = offset;
-	if(vm_map_lookup_entry(sub_map, offset, &entry)) {
-			
-		remove_size = (entry->vme_end - entry->vme_start);
-		if(offset > entry->vme_start)
-			remove_size -= offset - entry->vme_start;
-			
+	/*
+	 *	Insert object into map.
+	 */
 
-		if(submap_end < entry->vme_end) {
-			remove_size -=
-				entry->vme_end - submap_end;
-		}
-		if(entry->is_sub_map) {
-			vm_map_submap_pmap_clean(
-				sub_map,
-				start,
-				start + remove_size,
-				entry->object.sub_map,
-				entry->offset);
-		} else {
-			pmap_remove(map->pmap, start, start + remove_size);
-		}
+	kr = vm_map_enter(
+		map,
+		addr,
+		size,
+		(vm_map_offset_t)0,
+		flags,
+		VM_MAP_KERNEL_FLAGS_NONE,
+		cpm_obj,
+		(vm_object_offset_t)0,
+		FALSE,
+		VM_PROT_ALL,
+		VM_PROT_ALL,
+		VM_INHERIT_DEFAULT);
+
+	if (kr != KERN_SUCCESS) {
+		/*
+		 *	A CPM object doesn't have can_persist set,
+		 *	so all we have to do is deallocate it to
+		 *	free up these pages.
+		 */
+		assert(cpm_obj->pager_created == FALSE);
+		assert(cpm_obj->can_persist == FALSE);
+		assert(cpm_obj->pageout == FALSE);
+		assert(cpm_obj->shadow == VM_OBJECT_NULL);
+		vm_object_deallocate(cpm_obj); /* kill acquired ref */
+		vm_object_deallocate(cpm_obj); /* kill creation ref */
 	}
 
-	entry = entry->vme_next;
-	
-	while((entry != vm_map_to_entry(sub_map)) 
-			&& (entry->vme_start < submap_end)) {
-		remove_size = (entry->vme_end - entry->vme_start); 
-		if(submap_end < entry->vme_end) {
-			remove_size -= entry->vme_end - submap_end;
+	/*
+	 *	Inform the physical mapping system that the
+	 *	range of addresses may not fault, so that
+	 *	page tables and such can be locked down as well.
+	 */
+	start = *addr;
+	end = start + size;
+	pmap = vm_map_pmap(map);
+	pmap_pageable(pmap, start, end, FALSE);
+
+	/*
+	 *	Enter each page into the pmap, to avoid faults.
+	 *	Note that this loop could be coded more efficiently,
+	 *	if the need arose, rather than looking up each page
+	 *	again.
+	 */
+	for (offset = 0, va = start; offset < size;
+	    va += PAGE_SIZE, offset += PAGE_SIZE) {
+		int type_of_fault;
+
+		vm_object_lock(cpm_obj);
+		m = vm_page_lookup(cpm_obj, (vm_object_offset_t)offset);
+		assert(m != VM_PAGE_NULL);
+
+		vm_page_zero_fill(m);
+
+		type_of_fault = DBG_ZERO_FILL_FAULT;
+
+		vm_fault_enter(m, pmap, va, VM_PROT_ALL, VM_PROT_WRITE,
+		    VM_PAGE_WIRED(m),
+		    FALSE,                             /* change_wiring */
+		    VM_KERN_MEMORY_NONE,                             /* tag - not wiring */
+		    FALSE,                             /* no_cache */
+		    FALSE,                             /* cs_bypass */
+		    0,                                 /* user_tag */
+		    0,                             /* pmap_options */
+		    NULL,                              /* need_retry */
+		    &type_of_fault);
+
+		vm_object_unlock(cpm_obj);
+	}
+
+#if     MACH_ASSERT
+	/*
+	 *	Verify ordering in address space.
+	 */
+	for (offset = 0; offset < size; offset += PAGE_SIZE) {
+		vm_object_lock(cpm_obj);
+		m = vm_page_lookup(cpm_obj, (vm_object_offset_t)offset);
+		vm_object_unlock(cpm_obj);
+		if (m == VM_PAGE_NULL) {
+			panic("vm_allocate_cpm:  obj %p off 0x%llx no page",
+			    cpm_obj, (uint64_t)offset);
 		}
-		if(entry->is_sub_map) {
-			vm_map_submap_pmap_clean(
-				sub_map,
-				(start + entry->vme_start) - offset,
-				((start + entry->vme_start) - offset) + remove_size,
-				entry->object.sub_map,
-				entry->offset);
-		} else {
-			pmap_remove(map->pmap, 
-				(start + entry->vme_start) - offset,
-				((start + entry->vme_start) - offset) + remove_size);
+		assert(m->vmp_tabled);
+		assert(!m->vmp_busy);
+		assert(!m->vmp_wanted);
+		assert(!m->vmp_fictitious);
+		assert(!m->vmp_private);
+		assert(!m->vmp_absent);
+		assert(!m->vmp_error);
+		assert(!m->vmp_cleaning);
+		assert(!m->vmp_laundry);
+		assert(!m->vmp_precious);
+		assert(!m->vmp_clustered);
+		if (offset != 0) {
+			if (VM_PAGE_GET_PHYS_PAGE(m) != prev_addr + 1) {
+				printf("start 0x%llx end 0x%llx va 0x%llx\n",
+				    (uint64_t)start, (uint64_t)end, (uint64_t)va);
+				printf("obj %p off 0x%llx\n", cpm_obj, (uint64_t)offset);
+				printf("m %p prev_address 0x%llx\n", m, (uint64_t)prev_addr);
+				panic("vm_allocate_cpm:  pages not contig!");
+			}
 		}
-		entry = entry->vme_next;
-	} 
-	return;
+		prev_addr = VM_PAGE_GET_PHYS_PAGE(m);
+	}
+#endif  /* MACH_ASSERT */
+
+	vm_object_deallocate(cpm_obj); /* kill extra ref */
+
+	return kr;
 }
 
+
+#else   /* VM_CPM */
+
 /*
- *	vm_map_delete:	[ internal use only ]
- *
- *	Deallocates the given address range from the target map.
- *	Removes all user wirings. Unwires one kernel wiring if
- *	VM_MAP_REMOVE_KUNWIRE is set.  Waits for kernel wirings to go
- *	away if VM_MAP_REMOVE_WAIT_FOR_KWIRE is set.  Sleeps
- *	interruptibly if VM_MAP_REMOVE_INTERRUPTIBLE is set.
- *
- *	This routine is called with map locked and leaves map locked.
+ *	Interface is defined in all cases, but unless the kernel
+ *	is built explicitly for this option, the interface does
+ *	nothing.
  */
+
 kern_return_t
-vm_map_delete(
-	register vm_map_t	map,
-	vm_offset_t		start,
-	register vm_offset_t	end,
-	int			flags)
+vm_map_enter_cpm(
+	__unused vm_map_t       map,
+	__unused vm_map_offset_t        *addr,
+	__unused vm_map_size_t  size,
+	__unused int            flags)
 {
-	vm_map_entry_t		entry, next;
-	struct	 vm_map_entry	*first_entry, tmp_entry;
-	register vm_offset_t	s, e;
-	register vm_object_t	object;
-	boolean_t		need_wakeup;
-	unsigned int		last_timestamp = ~0; /* unlikely value */
-	int			interruptible;
-	extern vm_map_t		kernel_map;
+	return KERN_FAILURE;
+}
+#endif /* VM_CPM */
 
-	interruptible = (flags & VM_MAP_REMOVE_INTERRUPTIBLE) ? 
-	  		THREAD_ABORTSAFE : THREAD_UNINT;
+/* Not used without nested pmaps */
+#ifndef NO_NESTED_PMAP
+/*
+ * Clip and unnest a portion of a nested submap mapping.
+ */
 
-	/*
-	 * All our DMA I/O operations in IOKit are currently done by
-	 * wiring through the map entries of the task requesting the I/O.
-	 * Because of this, we must always wait for kernel wirings
-	 * to go away on the entries before deleting them.
-	 *
-	 * Any caller who wants to actually remove a kernel wiring
-	 * should explicitly set the VM_MAP_REMOVE_KUNWIRE flag to
-	 * properly remove one wiring instead of blasting through
-	 * them all.
-	 */
-	flags |= VM_MAP_REMOVE_WAIT_FOR_KWIRE;
+
+static void
+vm_map_clip_unnest(
+	vm_map_t        map,
+	vm_map_entry_t  entry,
+	vm_map_offset_t start_unnest,
+	vm_map_offset_t end_unnest)
+{
+	vm_map_offset_t old_start_unnest = start_unnest;
+	vm_map_offset_t old_end_unnest = end_unnest;
+
+	assert(entry->is_sub_map);
+	assert(VME_SUBMAP(entry) != NULL);
+	assert(entry->use_pmap);
 
 	/*
-	 *	Find the start of the region, and clip it
+	 * Query the platform for the optimal unnest range.
+	 * DRK: There's some duplication of effort here, since
+	 * callers may have adjusted the range to some extent. This
+	 * routine was introduced to support 1GiB subtree nesting
+	 * for x86 platforms, which can also nest on 2MiB boundaries
+	 * depending on size/alignment.
 	 */
-	if (vm_map_lookup_entry(map, start, &first_entry)) {
-		entry = first_entry;
-		vm_map_clip_start(map, entry, start);
+	if (pmap_adjust_unnest_parameters(map->pmap, &start_unnest, &end_unnest)) {
+		assert(VME_SUBMAP(entry)->is_nested_map);
+		assert(!VME_SUBMAP(entry)->disable_vmentry_reuse);
+		log_unnest_badness(map,
+		    old_start_unnest,
+		    old_end_unnest,
+		    VME_SUBMAP(entry)->is_nested_map,
+		    (entry->vme_start +
+		    VME_SUBMAP(entry)->lowest_unnestable_start -
+		    VME_OFFSET(entry)));
+	}
 
-		/*
-		 *	Fix the lookup hint now, rather than each
-		 *	time through the loop.
-		 */
-		SAVE_HINT(map, entry->vme_prev);
-	} else {
-		entry = first_entry->vme_next;
+	if (entry->vme_start > start_unnest ||
+	    entry->vme_end < end_unnest) {
+		panic("vm_map_clip_unnest(0x%llx,0x%llx): "
+		    "bad nested entry: start=0x%llx end=0x%llx\n",
+		    (long long)start_unnest, (long long)end_unnest,
+		    (long long)entry->vme_start, (long long)entry->vme_end);
 	}
 
-	need_wakeup = FALSE;
-	/*
-	 *	Step through all entries in this region
-	 */
-	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
-
-		vm_map_clip_end(map, entry, end);
-		if (entry->in_transition) {
-			/*
-			 * Another thread is wiring/unwiring this entry.
-			 * Let the other thread know we are waiting.
-			 */
-			s = entry->vme_start;
-			entry->needs_wakeup = TRUE;
-
-			/*
-			 * wake up anybody waiting on entries that we have
-			 * already unwired/deleted.
-			 */
-			if (need_wakeup) {
-				vm_map_entry_wakeup(map);
-				need_wakeup = FALSE;
-			}
-
-			vm_map_entry_wait(map, interruptible);
-
-			if (interruptible &&
-			   current_thread()->wait_result == THREAD_INTERRUPTED)
-				/*
-				 * We do not clear the needs_wakeup flag,
-				 * since we cannot tell if we were the only one.
-				 */
-				return KERN_ABORTED;
+	if (start_unnest > entry->vme_start) {
+		_vm_map_clip_start(&map->hdr,
+		    entry,
+		    start_unnest);
+		if (map->holelistenabled) {
+			vm_map_store_update_first_free(map, NULL, FALSE);
+		} else {
+			vm_map_store_update_first_free(map, map->first_free, FALSE);
+		}
+	}
+	if (entry->vme_end > end_unnest) {
+		_vm_map_clip_end(&map->hdr,
+		    entry,
+		    end_unnest);
+		if (map->holelistenabled) {
+			vm_map_store_update_first_free(map, NULL, FALSE);
+		} else {
+			vm_map_store_update_first_free(map, map->first_free, FALSE);
+		}
+	}
 
-			vm_map_lock(map);
-			/*
-			 * Cannot avoid a lookup here. reset timestamp.
-			 */
-			last_timestamp = map->timestamp;
+	pmap_unnest(map->pmap,
+	    entry->vme_start,
+	    entry->vme_end - entry->vme_start);
+	if ((map->mapped_in_other_pmaps) && os_ref_get_count(&map->map_refcnt) != 0) {
+		/* clean up parent map/maps */
+		vm_map_submap_pmap_clean(
+			map, entry->vme_start,
+			entry->vme_end,
+			VME_SUBMAP(entry),
+			VME_OFFSET(entry));
+	}
+	entry->use_pmap = FALSE;
+	if ((map->pmap != kernel_pmap) &&
+	    (VME_ALIAS(entry) == VM_MEMORY_SHARED_PMAP)) {
+		VME_ALIAS_SET(entry, VM_MEMORY_UNSHARED_PMAP);
+	}
+}
+#endif  /* NO_NESTED_PMAP */
 
-			/*
-			 * The entry could have been clipped or it
-			 * may not exist anymore.  Look it up again.
-			 */
-			if (!vm_map_lookup_entry(map, s, &first_entry)) {
-				assert((map != kernel_map) && 
-				       (!entry->is_sub_map));
-				/*
-				 * User: use the next entry
-				 */
-				entry = first_entry->vme_next;
-			} else {
-				entry = first_entry;
-				SAVE_HINT(map, entry->vme_prev);
-			}
-			continue;
-		} /* end in_transition */
+/*
+ *	vm_map_clip_start:	[ internal use only ]
+ *
+ *	Asserts that the given entry begins at or after
+ *	the specified address; if necessary,
+ *	it splits the entry into two.
+ */
+void
+vm_map_clip_start(
+	vm_map_t        map,
+	vm_map_entry_t  entry,
+	vm_map_offset_t startaddr)
+{
+#ifndef NO_NESTED_PMAP
+	if (entry->is_sub_map &&
+	    entry->use_pmap &&
+	    startaddr >= entry->vme_start) {
+		vm_map_offset_t start_unnest, end_unnest;
 
-		if (entry->wired_count) {
-			/*
-			 * 	Remove a kernel wiring if requested or if
-			 *	there are user wirings.
-			 */
-			if ((flags & VM_MAP_REMOVE_KUNWIRE) || 
-			   (entry->user_wired_count > 0))
-				entry->wired_count--;
+		/*
+		 * Make sure "startaddr" is no longer in a nested range
+		 * before we clip.  Unnest only the minimum range the platform
+		 * can handle.
+		 * vm_map_clip_unnest may perform additional adjustments to
+		 * the unnest range.
+		 */
+		start_unnest = startaddr & ~(pmap_nesting_size_min - 1);
+		end_unnest = start_unnest + pmap_nesting_size_min;
+		vm_map_clip_unnest(map, entry, start_unnest, end_unnest);
+	}
+#endif /* NO_NESTED_PMAP */
+	if (startaddr > entry->vme_start) {
+		if (VME_OBJECT(entry) &&
+		    !entry->is_sub_map &&
+		    VME_OBJECT(entry)->phys_contiguous) {
+			pmap_remove(map->pmap,
+			    (addr64_t)(entry->vme_start),
+			    (addr64_t)(entry->vme_end));
+		}
+		if (entry->vme_atomic) {
+			panic("Attempting to clip an atomic VM entry! (map: %p, entry: %p)\n", map, entry);
+		}
 
-			/* remove all user wire references */
-			entry->user_wired_count = 0;
+		DTRACE_VM5(
+			vm_map_clip_start,
+			vm_map_t, map,
+			vm_map_offset_t, entry->vme_start,
+			vm_map_offset_t, entry->vme_end,
+			vm_map_offset_t, startaddr,
+			int, VME_ALIAS(entry));
+
+		_vm_map_clip_start(&map->hdr, entry, startaddr);
+		if (map->holelistenabled) {
+			vm_map_store_update_first_free(map, NULL, FALSE);
+		} else {
+			vm_map_store_update_first_free(map, map->first_free, FALSE);
+		}
+	}
+}
 
-			if (entry->wired_count != 0) {
-				assert((map != kernel_map) && 
-				       (!entry->is_sub_map));
-				/*
-				 * Cannot continue.  Typical case is when
-				 * a user thread has physical io pending on
-				 * on this page.  Either wait for the
-				 * kernel wiring to go away or return an
-				 * error.
-				 */
-				if (flags & VM_MAP_REMOVE_WAIT_FOR_KWIRE) {
 
-					s = entry->vme_start;
-					entry->needs_wakeup = TRUE;
-					vm_map_entry_wait(map, interruptible);
+#define vm_map_copy_clip_start(copy, entry, startaddr) \
+	MACRO_BEGIN \
+	if ((startaddr) > (entry)->vme_start) \
+	        _vm_map_clip_start(&(copy)->cpy_hdr,(entry),(startaddr)); \
+	MACRO_END
 
-					if (interruptible &&
-			   		    current_thread()->wait_result == 
-							THREAD_INTERRUPTED)
-						/*
-				 	 	 * We do not clear the 
-						 * needs_wakeup flag, since we 
-						 * cannot tell if we were the 
-						 * only one.
-				 	 	 */
-						return KERN_ABORTED;
+/*
+ *	This routine is called only when it is known that
+ *	the entry must be split.
+ */
+static void
+_vm_map_clip_start(
+	struct vm_map_header    *map_header,
+	vm_map_entry_t          entry,
+	vm_map_offset_t         start)
+{
+	vm_map_entry_t  new_entry;
 
-					vm_map_lock(map);
-					/*
-			 	 	 * Cannot avoid a lookup here. reset 
-					 * timestamp.
-			 	 	 */
-					last_timestamp = map->timestamp;
+	/*
+	 *	Split off the front portion --
+	 *	note that we must insert the new
+	 *	entry BEFORE this one, so that
+	 *	this entry has the specified starting
+	 *	address.
+	 */
 
-					/*
-			 		 * The entry could have been clipped or
-					 * it may not exist anymore.  Look it
-					 * up again.
-			 		 */
-					if (!vm_map_lookup_entry(map, s, 
-								&first_entry)) {
-						assert((map != kernel_map) && 
-				       		(!entry->is_sub_map));
-						/*
-				 		 * User: use the next entry
-				 		 */
-						entry = first_entry->vme_next;
-					} else {
-						entry = first_entry;
-						SAVE_HINT(map, entry->vme_prev);
-					}
-					continue;
-				}
-				else {
-					return KERN_FAILURE;
-				}
-			}
+	if (entry->map_aligned) {
+		assert(VM_MAP_PAGE_ALIGNED(start,
+		    VM_MAP_HDR_PAGE_MASK(map_header)));
+	}
 
-			entry->in_transition = TRUE;
-			/*
-			 * copy current entry.  see comment in vm_map_wire()
-			 */
-			tmp_entry = *entry;
-			s = entry->vme_start;
-			e = entry->vme_end;
+	new_entry = _vm_map_entry_create(map_header, !map_header->entries_pageable);
+	vm_map_entry_copy_full(new_entry, entry);
 
-			/*
-			 * We can unlock the map now. The in_transition
-			 * state guarentees existance of the entry.
-			 */
-			vm_map_unlock(map);
-			vm_fault_unwire(map, &tmp_entry,
-				tmp_entry.object.vm_object == kernel_object,
-				map->pmap);
-			vm_map_lock(map);
+	new_entry->vme_end = start;
+	assert(new_entry->vme_start < new_entry->vme_end);
+	VME_OFFSET_SET(entry, VME_OFFSET(entry) + (start - entry->vme_start));
+	assert(start < entry->vme_end);
+	entry->vme_start = start;
 
-			if (last_timestamp+1 != map->timestamp) {
-				/*
-				 * Find the entry again.  It could have
-				 * been clipped after we unlocked the map.
-				 */
-				if (!vm_map_lookup_entry(map, s, &first_entry)){
-					assert((map != kernel_map) && 
-				       	       (!entry->is_sub_map));
-					first_entry = first_entry->vme_next;
-				} else {
-					SAVE_HINT(map, entry->vme_prev);
-				}
-			} else {
-				SAVE_HINT(map, entry->vme_prev);
-				first_entry = entry;
-			}
+	_vm_map_store_entry_link(map_header, entry->vme_prev, new_entry);
 
-			last_timestamp = map->timestamp;
+	if (entry->is_sub_map) {
+		vm_map_reference(VME_SUBMAP(new_entry));
+	} else {
+		vm_object_reference(VME_OBJECT(new_entry));
+	}
+}
 
-			entry = first_entry;
-			while ((entry != vm_map_to_entry(map)) &&
-			       (entry->vme_start < tmp_entry.vme_end)) {
-				assert(entry->in_transition);
-				entry->in_transition = FALSE;
-				if (entry->needs_wakeup) {
-					entry->needs_wakeup = FALSE;
-					need_wakeup = TRUE;
-				}
-				entry = entry->vme_next;
-			}
-			/*
-			 * We have unwired the entry(s).  Go back and
-			 * delete them.
-			 */
-			entry = first_entry;
-			continue;
-		}
 
-		/* entry is unwired */
-		assert(entry->wired_count == 0);
-		assert(entry->user_wired_count == 0);
+/*
+ *	vm_map_clip_end:	[ internal use only ]
+ *
+ *	Asserts that the given entry ends at or before
+ *	the specified address; if necessary,
+ *	it splits the entry into two.
+ */
+void
+vm_map_clip_end(
+	vm_map_t        map,
+	vm_map_entry_t  entry,
+	vm_map_offset_t endaddr)
+{
+	if (endaddr > entry->vme_end) {
+		/*
+		 * Within the scope of this clipping, limit "endaddr" to
+		 * the end of this map entry...
+		 */
+		endaddr = entry->vme_end;
+	}
+#ifndef NO_NESTED_PMAP
+	if (entry->is_sub_map && entry->use_pmap) {
+		vm_map_offset_t start_unnest, end_unnest;
 
-		if ((!entry->is_sub_map &&
-		    entry->object.vm_object != kernel_object) ||
-		    entry->is_sub_map) {
-			if(entry->is_sub_map) {
-			   if(entry->use_pmap) {
-#ifndef i386
-				pmap_unnest(map->pmap, entry->vme_start,
-				        entry->vme_end - entry->vme_start);
-#endif
-			   } else {
-				vm_map_submap_pmap_clean(
-					map, entry->vme_start, entry->vme_end,
-					entry->object.sub_map,
-					entry->offset);
-			   }
-			} else {
-				pmap_remove(map->pmap, 
-					entry->vme_start, entry->vme_end);
-			}
+		/*
+		 * Make sure the range between the start of this entry and
+		 * the new "endaddr" is no longer nested before we clip.
+		 * Unnest only the minimum range the platform can handle.
+		 * vm_map_clip_unnest may perform additional adjustments to
+		 * the unnest range.
+		 */
+		start_unnest = entry->vme_start;
+		end_unnest =
+		    (endaddr + pmap_nesting_size_min - 1) &
+		    ~(pmap_nesting_size_min - 1);
+		vm_map_clip_unnest(map, entry, start_unnest, end_unnest);
+	}
+#endif /* NO_NESTED_PMAP */
+	if (endaddr < entry->vme_end) {
+		if (VME_OBJECT(entry) &&
+		    !entry->is_sub_map &&
+		    VME_OBJECT(entry)->phys_contiguous) {
+			pmap_remove(map->pmap,
+			    (addr64_t)(entry->vme_start),
+			    (addr64_t)(entry->vme_end));
 		}
-
-		next = entry->vme_next;
-		s = next->vme_start;
-		last_timestamp = map->timestamp;
-		vm_map_entry_delete(map, entry);
-		/* vm_map_entry_delete unlocks the map */
-		vm_map_lock(map);
-		entry = next;
-
-		if(entry == vm_map_to_entry(map)) {
-			break;
+		if (entry->vme_atomic) {
+			panic("Attempting to clip an atomic VM entry! (map: %p, entry: %p)\n", map, entry);
 		}
-		if (last_timestamp+1 != map->timestamp) {
-			/*
-			 * we are responsible for deleting everything
-			 * from the give space, if someone has interfered
-			 * we pick up where we left off, back fills should
-			 * be all right for anyone except map_delete and
-			 * we have to assume that the task has been fully
-			 * disabled before we get here
-			 */
-        		if (!vm_map_lookup_entry(map, s, &entry)){
-	               		entry = entry->vme_next;
-        		} else {
-				 SAVE_HINT(map, entry->vme_prev);
-       		 	}
-			/* 
-			 * others can not only allocate behind us, we can 
-			 * also see coalesce while we don't have the map lock 
-			 */
-			if(entry == vm_map_to_entry(map)) {
-				break;
-			}
-			vm_map_clip_start(map, entry, s);
+		DTRACE_VM5(
+			vm_map_clip_end,
+			vm_map_t, map,
+			vm_map_offset_t, entry->vme_start,
+			vm_map_offset_t, entry->vme_end,
+			vm_map_offset_t, endaddr,
+			int, VME_ALIAS(entry));
+
+		_vm_map_clip_end(&map->hdr, entry, endaddr);
+		if (map->holelistenabled) {
+			vm_map_store_update_first_free(map, NULL, FALSE);
+		} else {
+			vm_map_store_update_first_free(map, map->first_free, FALSE);
 		}
-		last_timestamp = map->timestamp;
 	}
+}
 
-	if (map->wait_for_space)
-		thread_wakeup((event_t) map);
-	/*
-	 * wake up anybody waiting on entries that we have already deleted.
-	 */
-	if (need_wakeup)
-		vm_map_entry_wakeup(map);
 
-	return KERN_SUCCESS;
-}
+#define vm_map_copy_clip_end(copy, entry, endaddr) \
+	MACRO_BEGIN \
+	if ((endaddr) < (entry)->vme_end) \
+	        _vm_map_clip_end(&(copy)->cpy_hdr,(entry),(endaddr)); \
+	MACRO_END
 
 /*
- *	vm_map_remove:
- *
- *	Remove the given address range from the target map.
- *	This is the exported form of vm_map_delete.
+ *	This routine is called only when it is known that
+ *	the entry must be split.
  */
-kern_return_t
-vm_map_remove(
-	register vm_map_t	map,
-	register vm_offset_t	start,
-	register vm_offset_t	end,
-	register boolean_t	flags)
+static void
+_vm_map_clip_end(
+	struct vm_map_header    *map_header,
+	vm_map_entry_t          entry,
+	vm_map_offset_t         end)
 {
-	register kern_return_t	result;
+	vm_map_entry_t  new_entry;
 
-	vm_map_lock(map);
-	VM_MAP_RANGE_CHECK(map, start, end);
-	result = vm_map_delete(map, start, end, flags);
-	vm_map_unlock(map);
+	/*
+	 *	Create a new entry and insert it
+	 *	AFTER the specified entry
+	 */
 
-	return(result);
-}
+	if (entry->map_aligned) {
+		assert(VM_MAP_PAGE_ALIGNED(end,
+		    VM_MAP_HDR_PAGE_MASK(map_header)));
+	}
 
+	new_entry = _vm_map_entry_create(map_header, !map_header->entries_pageable);
+	vm_map_entry_copy_full(new_entry, entry);
 
-/*
- *	Routine:	vm_map_copy_discard
- *
- *	Description:
- *		Dispose of a map copy object (returned by
- *		vm_map_copyin).
- */
-void
-vm_map_copy_discard(
-	vm_map_copy_t	copy)
-{
-	TR_DECL("vm_map_copy_discard");
-
-/*	tr3("enter: copy 0x%x type %d", copy, copy->type);*/
-free_next_copy:
-	if (copy == VM_MAP_COPY_NULL)
-		return;
-
-	switch (copy->type) {
-	case VM_MAP_COPY_ENTRY_LIST:
-		while (vm_map_copy_first_entry(copy) !=
-					vm_map_copy_to_entry(copy)) {
-			vm_map_entry_t	entry = vm_map_copy_first_entry(copy);
+	assert(entry->vme_start < end);
+	new_entry->vme_start = entry->vme_end = end;
+	VME_OFFSET_SET(new_entry,
+	    VME_OFFSET(new_entry) + (end - entry->vme_start));
+	assert(new_entry->vme_start < new_entry->vme_end);
 
-			vm_map_copy_entry_unlink(copy, entry);
-			vm_object_deallocate(entry->object.vm_object);
-			vm_map_copy_entry_dispose(copy, entry);
-		}
-		break;
-        case VM_MAP_COPY_OBJECT:
-		vm_object_deallocate(copy->cpy_object);
-		break;
-	case VM_MAP_COPY_KERNEL_BUFFER:
+	_vm_map_store_entry_link(map_header, entry, new_entry);
 
-		/*
-		 * The vm_map_copy_t and possibly the data buffer were
-		 * allocated by a single call to kalloc(), i.e. the
-		 * vm_map_copy_t was not allocated out of the zone.
-		 */
-		kfree((vm_offset_t) copy, copy->cpy_kalloc_size);
-		return;
+	if (entry->is_sub_map) {
+		vm_map_reference(VME_SUBMAP(new_entry));
+	} else {
+		vm_object_reference(VME_OBJECT(new_entry));
 	}
-	zfree(vm_map_copy_zone, (vm_offset_t) copy);
 }
 
+
 /*
- *	Routine:	vm_map_copy_copy
+ *	VM_MAP_RANGE_CHECK:	[ internal use only ]
  *
- *	Description:
- *			Move the information in a map copy object to
- *			a new map copy object, leaving the old one
- *			empty.
+ *	Asserts that the starting and ending region
+ *	addresses fall within the valid range of the map.
+ */
+#define VM_MAP_RANGE_CHECK(map, start, end)     \
+	MACRO_BEGIN                             \
+	if (start < vm_map_min(map))            \
+	        start = vm_map_min(map);        \
+	if (end > vm_map_max(map))              \
+	        end = vm_map_max(map);          \
+	if (start > end)                        \
+	        start = end;                    \
+	MACRO_END
+
+/*
+ *	vm_map_range_check:	[ internal use only ]
  *
- *			This is used by kernel routines that need
- *			to look at out-of-line data (in copyin form)
- *			before deciding whether to return SUCCESS.
- *			If the routine returns FAILURE, the original
- *			copy object will be deallocated; therefore,
- *			these routines must make a copy of the copy
- *			object and leave the original empty so that
- *			deallocation will not fail.
+ *	Check that the region defined by the specified start and
+ *	end addresses is wholly contained within a single map
+ *	entry or set of adjacent map entries of the specified map,
+ *	i.e. the specified region contains no unmapped space.
+ *	If any or all of the region is unmapped, FALSE is returned.
+ *	Otherwise, TRUE is returned and if the output argument 'entry'
+ *	is not NULL it points to the map entry containing the start
+ *	of the region.
+ *
+ *	The map is locked for reading on entry and is left locked.
  */
-vm_map_copy_t
-vm_map_copy_copy(
-	vm_map_copy_t	copy)
+static boolean_t
+vm_map_range_check(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_map_entry_t          *entry)
 {
-	vm_map_copy_t	new_copy;
-
-	if (copy == VM_MAP_COPY_NULL)
-		return VM_MAP_COPY_NULL;
+	vm_map_entry_t          cur;
+	vm_map_offset_t         prev;
 
 	/*
-	 * Allocate a new copy object, and copy the information
-	 * from the old one into it.
+	 *      Basic sanity checks first
 	 */
+	if (start < vm_map_min(map) || end > vm_map_max(map) || start > end) {
+		return FALSE;
+	}
 
-	new_copy = (vm_map_copy_t) zalloc(vm_map_copy_zone);
-	*new_copy = *copy;
-
-	if (copy->type == VM_MAP_COPY_ENTRY_LIST) {
-		/*
-		 * The links in the entry chain must be
-		 * changed to point to the new copy object.
-		 */
-		vm_map_copy_first_entry(copy)->vme_prev
-			= vm_map_copy_to_entry(new_copy);
-		vm_map_copy_last_entry(copy)->vme_next
-			= vm_map_copy_to_entry(new_copy);
+	/*
+	 *      Check first if the region starts within a valid
+	 *	mapping for the map.
+	 */
+	if (!vm_map_lookup_entry(map, start, &cur)) {
+		return FALSE;
 	}
 
 	/*
-	 * Change the old copy object into one that contains
-	 * nothing to be deallocated.
+	 *	Optimize for the case that the region is contained
+	 *	in a single map entry.
 	 */
-	copy->type = VM_MAP_COPY_OBJECT;
-	copy->cpy_object = VM_OBJECT_NULL;
+	if (entry != (vm_map_entry_t *) NULL) {
+		*entry = cur;
+	}
+	if (end <= cur->vme_end) {
+		return TRUE;
+	}
 
 	/*
-	 * Return the new object.
+	 *      If the region is not wholly contained within a
+	 *      single entry, walk the entries looking for holes.
 	 */
-	return new_copy;
+	prev = cur->vme_end;
+	cur = cur->vme_next;
+	while ((cur != vm_map_to_entry(map)) && (prev == cur->vme_start)) {
+		if (end <= cur->vme_end) {
+			return TRUE;
+		}
+		prev = cur->vme_end;
+		cur = cur->vme_next;
+	}
+	return FALSE;
 }
 
+/*
+ *	vm_map_submap:		[ kernel use only ]
+ *
+ *	Mark the given range as handled by a subordinate map.
+ *
+ *	This range must have been created with vm_map_find using
+ *	the vm_submap_object, and no other operations may have been
+ *	performed on this range prior to calling vm_map_submap.
+ *
+ *	Only a limited number of operations can be performed
+ *	within this range after calling vm_map_submap:
+ *		vm_fault
+ *	[Don't try vm_map_copyin!]
+ *
+ *	To remove a submapping, one must first remove the
+ *	range from the superior map, and then destroy the
+ *	submap (if desired).  [Better yet, don't try it.]
+ */
 kern_return_t
-vm_map_overwrite_submap_recurse(
-	vm_map_t	dst_map,
-	vm_offset_t	dst_addr,
-	vm_size_t	dst_size)
+vm_map_submap(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	vm_map_t        submap,
+	vm_map_offset_t offset,
+#ifdef NO_NESTED_PMAP
+	__unused
+#endif  /* NO_NESTED_PMAP */
+	boolean_t       use_pmap)
 {
-	vm_offset_t	dst_end;
-	vm_map_entry_t	tmp_entry;
-	vm_map_entry_t	entry;
-	kern_return_t	result;
-	boolean_t	encountered_sub_map = FALSE;
-
-
-
-	/*
-	 *	Verify that the destination is all writeable
-	 *	initially.  We have to trunc the destination
-	 *	address and round the copy size or we'll end up
-	 *	splitting entries in strange ways.
-	 */
+	vm_map_entry_t          entry;
+	kern_return_t           result = KERN_INVALID_ARGUMENT;
+	vm_object_t             object;
 
-	dst_end = round_page(dst_addr + dst_size);
+	vm_map_lock(map);
 
-start_pass_1:
-	vm_map_lock(dst_map);
-	if (!vm_map_lookup_entry(dst_map, dst_addr, &tmp_entry)) {
-		vm_map_unlock(dst_map);
-		return(KERN_INVALID_ADDRESS);
+	if (!vm_map_lookup_entry(map, start, &entry)) {
+		entry = entry->vme_next;
 	}
 
-	vm_map_clip_start(dst_map, tmp_entry, trunc_page(dst_addr));
-
-	for (entry = tmp_entry;;) {
-		vm_map_entry_t	next;
+	if (entry == vm_map_to_entry(map) ||
+	    entry->is_sub_map) {
+		vm_map_unlock(map);
+		return KERN_INVALID_ARGUMENT;
+	}
 
-		next = entry->vme_next;
-		while(entry->is_sub_map) {
-			vm_offset_t	sub_start;
-			vm_offset_t	sub_end;
-			vm_offset_t	local_end;
+	vm_map_clip_start(map, entry, start);
+	vm_map_clip_end(map, entry, end);
 
-			if (entry->in_transition) {
-                        /*
-                         * Say that we are waiting, and wait for entry.
-                         */
-                        	entry->needs_wakeup = TRUE;
-                        	vm_map_entry_wait(dst_map, THREAD_UNINT);
+	if ((entry->vme_start == start) && (entry->vme_end == end) &&
+	    (!entry->is_sub_map) &&
+	    ((object = VME_OBJECT(entry)) == vm_submap_object) &&
+	    (object->resident_page_count == 0) &&
+	    (object->copy == VM_OBJECT_NULL) &&
+	    (object->shadow == VM_OBJECT_NULL) &&
+	    (!object->pager_created)) {
+		VME_OFFSET_SET(entry, (vm_object_offset_t)offset);
+		VME_OBJECT_SET(entry, VM_OBJECT_NULL);
+		vm_object_deallocate(object);
+		entry->is_sub_map = TRUE;
+		entry->use_pmap = FALSE;
+		VME_SUBMAP_SET(entry, submap);
+		vm_map_reference(submap);
+		if (submap->mapped_in_other_pmaps == FALSE &&
+		    vm_map_pmap(submap) != PMAP_NULL &&
+		    vm_map_pmap(submap) != vm_map_pmap(map)) {
+			/*
+			 * This submap is being mapped in a map
+			 * that uses a different pmap.
+			 * Set its "mapped_in_other_pmaps" flag
+			 * to indicate that we now need to
+			 * remove mappings from all pmaps rather
+			 * than just the submap's pmap.
+			 */
+			submap->mapped_in_other_pmaps = TRUE;
+		}
 
-				goto start_pass_1;
+#ifndef NO_NESTED_PMAP
+		if (use_pmap) {
+			/* nest if platform code will allow */
+			if (submap->pmap == NULL) {
+				ledger_t ledger = map->pmap->ledger;
+				submap->pmap = pmap_create_options(ledger,
+				    (vm_map_size_t) 0, 0);
+				if (submap->pmap == PMAP_NULL) {
+					vm_map_unlock(map);
+					return KERN_NO_SPACE;
+				}
+#if     defined(__arm__) || defined(__arm64__)
+				pmap_set_nested(submap->pmap);
+#endif
 			}
+			result = pmap_nest(map->pmap,
+			    (VME_SUBMAP(entry))->pmap,
+			    (addr64_t)start,
+			    (addr64_t)start,
+			    (uint64_t)(end - start));
+			if (result) {
+				panic("vm_map_submap: pmap_nest failed, rc = %08X\n", result);
+			}
+			entry->use_pmap = TRUE;
+		}
+#else   /* NO_NESTED_PMAP */
+		pmap_remove(map->pmap, (addr64_t)start, (addr64_t)end);
+#endif  /* NO_NESTED_PMAP */
+		result = KERN_SUCCESS;
+	}
+	vm_map_unlock(map);
 
-			encountered_sub_map = TRUE;
-			sub_start = entry->offset;
+	return result;
+}
 
-			if(entry->vme_end < dst_end)
-				sub_end = entry->vme_end;
-			else 
-				sub_end = dst_end;
-			sub_end -= entry->vme_start;
-			sub_end += entry->offset;
-			local_end = entry->vme_end;
-			vm_map_unlock(dst_map);
-			
-			result = vm_map_overwrite_submap_recurse(
-					entry->object.sub_map,
-					sub_start,
-					sub_end - sub_start);
+/*
+ *	vm_map_protect:
+ *
+ *	Sets the protection of the specified address
+ *	region in the target map.  If "set_max" is
+ *	specified, the maximum protection is to be set;
+ *	otherwise, only the current protection is affected.
+ */
+kern_return_t
+vm_map_protect(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	vm_prot_t       new_prot,
+	boolean_t       set_max)
+{
+	vm_map_entry_t                  current;
+	vm_map_offset_t                 prev;
+	vm_map_entry_t                  entry;
+	vm_prot_t                       new_max;
+	int                             pmap_options = 0;
+	kern_return_t                   kr;
+
+	if (new_prot & VM_PROT_COPY) {
+		vm_map_offset_t         new_start;
+		vm_prot_t               cur_prot, max_prot;
+		vm_map_kernel_flags_t   kflags;
+
+		/* LP64todo - see below */
+		if (start >= map->max_offset) {
+			return KERN_INVALID_ADDRESS;
+		}
 
-			if(result != KERN_SUCCESS)
-				return result;
-			if (dst_end <= entry->vme_end)
-				return KERN_SUCCESS;
-			vm_map_lock(dst_map);
-			if(!vm_map_lookup_entry(dst_map, local_end, 
-						&tmp_entry)) {
-				vm_map_unlock(dst_map);
-				return(KERN_INVALID_ADDRESS);
-			}
-			entry = tmp_entry;
-			next = entry->vme_next;
+#if VM_PROTECT_WX_FAIL
+		if ((new_prot & VM_PROT_EXECUTE) &&
+		    map != kernel_map &&
+		    cs_process_enforcement(NULL)) {
+			DTRACE_VM3(cs_wx,
+			    uint64_t, (uint64_t) start,
+			    uint64_t, (uint64_t) end,
+			    vm_prot_t, new_prot);
+			printf("CODE SIGNING: %d[%s] %s can't have both write and exec at the same time\n",
+			    proc_selfpid(),
+			    (current_task()->bsd_info
+			    ? proc_name_address(current_task()->bsd_info)
+			    : "?"),
+			    __FUNCTION__);
+			return KERN_PROTECTION_FAILURE;
 		}
+#endif /* VM_PROTECT_WX_FAIL */
 
-		if ( ! (entry->protection & VM_PROT_WRITE)) {
-			vm_map_unlock(dst_map);
-			return(KERN_PROTECTION_FAILURE);
+		/*
+		 * Let vm_map_remap_extract() know that it will need to:
+		 * + make a copy of the mapping
+		 * + add VM_PROT_WRITE to the max protections
+		 * + remove any protections that are no longer allowed from the
+		 *   max protections (to avoid any WRITE/EXECUTE conflict, for
+		 *   example).
+		 * Note that "max_prot" is an IN/OUT parameter only for this
+		 * specific (VM_PROT_COPY) case.  It's usually an OUT parameter
+		 * only.
+		 */
+		max_prot = new_prot & VM_PROT_ALL;
+		kflags = VM_MAP_KERNEL_FLAGS_NONE;
+		kflags.vmkf_remap_prot_copy = TRUE;
+		kflags.vmkf_overwrite_immutable = TRUE;
+		new_start = start;
+		kr = vm_map_remap(map,
+		    &new_start,
+		    end - start,
+		    0,               /* mask */
+		    VM_FLAGS_FIXED | VM_FLAGS_OVERWRITE,
+		    kflags,
+		    0,
+		    map,
+		    start,
+		    TRUE,               /* copy-on-write remapping! */
+		    &cur_prot,
+		    &max_prot,
+		    VM_INHERIT_DEFAULT);
+		if (kr != KERN_SUCCESS) {
+			return kr;
 		}
+		new_prot &= ~VM_PROT_COPY;
+	}
+
+	vm_map_lock(map);
+
+	/* LP64todo - remove this check when vm_map_commpage64()
+	 * no longer has to stuff in a map_entry for the commpage
+	 * above the map's max_offset.
+	 */
+	if (start >= map->max_offset) {
+		vm_map_unlock(map);
+		return KERN_INVALID_ADDRESS;
+	}
 
+	while (1) {
 		/*
-		 *	If the entry is in transition, we must wait
-		 *	for it to exit that state.  Anything could happen
-		 *	when we unlock the map, so start over.
+		 *      Lookup the entry.  If it doesn't start in a valid
+		 *	entry, return an error.
 		 */
-                if (entry->in_transition) {
+		if (!vm_map_lookup_entry(map, start, &entry)) {
+			vm_map_unlock(map);
+			return KERN_INVALID_ADDRESS;
+		}
 
-                        /*
-                         * Say that we are waiting, and wait for entry.
-                         */
-                        entry->needs_wakeup = TRUE;
-                        vm_map_entry_wait(dst_map, THREAD_UNINT);
+		if (entry->superpage_size && (start & (SUPERPAGE_SIZE - 1))) { /* extend request to whole entry */
+			start = SUPERPAGE_ROUND_DOWN(start);
+			continue;
+		}
+		break;
+	}
+	if (entry->superpage_size) {
+		end = SUPERPAGE_ROUND_UP(end);
+	}
 
-			goto start_pass_1;
+	/*
+	 *	Make a first pass to check for protection and address
+	 *	violations.
+	 */
+
+	current = entry;
+	prev = current->vme_start;
+	while ((current != vm_map_to_entry(map)) &&
+	    (current->vme_start < end)) {
+		/*
+		 * If there is a hole, return an error.
+		 */
+		if (current->vme_start != prev) {
+			vm_map_unlock(map);
+			return KERN_INVALID_ADDRESS;
 		}
 
-/*
- *		our range is contained completely within this map entry
- */
-		if (dst_end <= entry->vme_end) {
-			vm_map_unlock(dst_map);
-			return KERN_SUCCESS;
+		new_max = current->max_protection;
+		if ((new_prot & new_max) != new_prot) {
+			vm_map_unlock(map);
+			return KERN_PROTECTION_FAILURE;
 		}
-/*
- *		check that range specified is contiguous region
- */
-		if ((next == vm_map_to_entry(dst_map)) ||
-		    (next->vme_start != entry->vme_end)) {
-			vm_map_unlock(dst_map);
-			return(KERN_INVALID_ADDRESS);
+
+		if ((new_prot & VM_PROT_WRITE) &&
+		    (new_prot & VM_PROT_EXECUTE) &&
+#if !CONFIG_EMBEDDED
+		    map != kernel_map &&
+		    cs_process_enforcement(NULL) &&
+#endif /* !CONFIG_EMBEDDED */
+		    !(current->used_for_jit)) {
+			DTRACE_VM3(cs_wx,
+			    uint64_t, (uint64_t) current->vme_start,
+			    uint64_t, (uint64_t) current->vme_end,
+			    vm_prot_t, new_prot);
+			printf("CODE SIGNING: %d[%s] %s can't have both write and exec at the same time\n",
+			    proc_selfpid(),
+			    (current_task()->bsd_info
+			    ? proc_name_address(current_task()->bsd_info)
+			    : "?"),
+			    __FUNCTION__);
+			new_prot &= ~VM_PROT_EXECUTE;
+#if VM_PROTECT_WX_FAIL
+			vm_map_unlock(map);
+			return KERN_PROTECTION_FAILURE;
+#endif /* VM_PROTECT_WX_FAIL */
 		}
 
 		/*
-		 *	Check for permanent objects in the destination.
+		 * If the task has requested executable lockdown,
+		 * deny both:
+		 * - adding executable protections OR
+		 * - adding write protections to an existing executable mapping.
 		 */
-		if ((entry->object.vm_object != VM_OBJECT_NULL) &&
-			   ((!entry->object.vm_object->internal) ||
-			   (entry->object.vm_object->true_share))) {
-			if(encountered_sub_map) {
-				vm_map_unlock(dst_map);
-				return(KERN_FAILURE);
+		if (map->map_disallow_new_exec == TRUE) {
+			if ((new_prot & VM_PROT_EXECUTE) ||
+			    ((current->protection & VM_PROT_EXECUTE) && (new_prot & VM_PROT_WRITE))) {
+				vm_map_unlock(map);
+				return KERN_PROTECTION_FAILURE;
 			}
 		}
 
-
-		entry = next;
-	}/* for */
-	vm_map_unlock(dst_map);
-	return(KERN_SUCCESS);
+		prev = current->vme_end;
+		current = current->vme_next;
+	}
+
+#if __arm64__
+	if (end > prev &&
+	    end == vm_map_round_page(prev, VM_MAP_PAGE_MASK(map))) {
+		vm_map_entry_t prev_entry;
+
+		prev_entry = current->vme_prev;
+		if (prev_entry != vm_map_to_entry(map) &&
+		    !prev_entry->map_aligned &&
+		    (vm_map_round_page(prev_entry->vme_end,
+		    VM_MAP_PAGE_MASK(map))
+		    == end)) {
+			/*
+			 * The last entry in our range is not "map-aligned"
+			 * but it would have reached all the way to "end"
+			 * if it had been map-aligned, so this is not really
+			 * a hole in the range and we can proceed.
+			 */
+			prev = end;
+		}
+	}
+#endif /* __arm64__ */
+
+	if (end > prev) {
+		vm_map_unlock(map);
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/*
+	 *	Go back and fix up protections.
+	 *	Clip to start here if the range starts within
+	 *	the entry.
+	 */
+
+	current = entry;
+	if (current != vm_map_to_entry(map)) {
+		/* clip and unnest if necessary */
+		vm_map_clip_start(map, current, start);
+	}
+
+	while ((current != vm_map_to_entry(map)) &&
+	    (current->vme_start < end)) {
+		vm_prot_t       old_prot;
+
+		vm_map_clip_end(map, current, end);
+
+		if (current->is_sub_map) {
+			/* clipping did unnest if needed */
+			assert(!current->use_pmap);
+		}
+
+		old_prot = current->protection;
+
+		if (set_max) {
+			current->max_protection = new_prot;
+			current->protection = new_prot & old_prot;
+		} else {
+			current->protection = new_prot;
+		}
+
+		/*
+		 *	Update physical map if necessary.
+		 *	If the request is to turn off write protection,
+		 *	we won't do it for real (in pmap). This is because
+		 *	it would cause copy-on-write to fail.  We've already
+		 *	set the new protection in the map, so if a
+		 *	write-protect fault occurred, it will be fixed up
+		 *	properly, COW or not.
+		 */
+		if (current->protection != old_prot) {
+			/* Look one level in: we support nested pmaps */
+			/* from mapped submaps which are direct entries */
+			/* in our map */
+
+			vm_prot_t prot;
+
+			prot = current->protection;
+			if (current->is_sub_map || (VME_OBJECT(current) == NULL) || (VME_OBJECT(current) != compressor_object)) {
+				prot &= ~VM_PROT_WRITE;
+			} else {
+				assert(!VME_OBJECT(current)->code_signed);
+				assert(VME_OBJECT(current)->copy_strategy == MEMORY_OBJECT_COPY_NONE);
+			}
+
+			if (override_nx(map, VME_ALIAS(current)) && prot) {
+				prot |= VM_PROT_EXECUTE;
+			}
+
+#if CONFIG_EMBEDDED && (DEVELOPMENT || DEBUG)
+			if (!(old_prot & VM_PROT_EXECUTE) &&
+			    (prot & VM_PROT_EXECUTE) &&
+			    panic_on_unsigned_execute &&
+			    (proc_selfcsflags() & CS_KILL)) {
+				panic("vm_map_protect(%p,0x%llx,0x%llx) old=0x%x new=0x%x - <rdar://23770418> code-signing bypass?\n", map, (uint64_t)current->vme_start, (uint64_t)current->vme_end, old_prot, prot);
+			}
+#endif /* CONFIG_EMBEDDED && (DEVELOPMENT || DEBUG) */
+
+			if (pmap_has_prot_policy(prot)) {
+				if (current->wired_count) {
+					panic("vm_map_protect(%p,0x%llx,0x%llx) new=0x%x wired=%x\n",
+					    map, (uint64_t)current->vme_start, (uint64_t)current->vme_end, prot, current->wired_count);
+				}
+
+				/* If the pmap layer cares about this
+				 * protection type, force a fault for
+				 * each page so that vm_fault will
+				 * repopulate the page with the full
+				 * set of protections.
+				 */
+				/*
+				 * TODO: We don't seem to need this,
+				 * but this is due to an internal
+				 * implementation detail of
+				 * pmap_protect.  Do we want to rely
+				 * on this?
+				 */
+				prot = VM_PROT_NONE;
+			}
+
+			if (current->is_sub_map && current->use_pmap) {
+				pmap_protect(VME_SUBMAP(current)->pmap,
+				    current->vme_start,
+				    current->vme_end,
+				    prot);
+			} else {
+				if (prot & VM_PROT_WRITE) {
+					if (VME_OBJECT(current) == compressor_object) {
+						/*
+						 * For write requests on the
+						 * compressor, we will ask the
+						 * pmap layer to prevent us from
+						 * taking a write fault when we
+						 * attempt to access the mapping
+						 * next.
+						 */
+						pmap_options |= PMAP_OPTIONS_PROTECT_IMMEDIATE;
+					}
+				}
+
+				pmap_protect_options(map->pmap,
+				    current->vme_start,
+				    current->vme_end,
+				    prot,
+				    pmap_options,
+				    NULL);
+			}
+		}
+		current = current->vme_next;
+	}
+
+	current = entry;
+	while ((current != vm_map_to_entry(map)) &&
+	    (current->vme_start <= end)) {
+		vm_map_simplify_entry(map, current);
+		current = current->vme_next;
+	}
+
+	vm_map_unlock(map);
+	return KERN_SUCCESS;
 }
 
 /*
- *	Routine:	vm_map_copy_overwrite
- *
- *	Description:
- *		Copy the memory described by the map copy
- *		object (copy; returned by vm_map_copyin) onto
- *		the specified destination region (dst_map, dst_addr).
- *		The destination must be writeable.
- *
- *		Unlike vm_map_copyout, this routine actually
- *		writes over previously-mapped memory.  If the
- *		previous mapping was to a permanent (user-supplied)
- *		memory object, it is preserved.
- *
- *		The attributes (protection and inheritance) of the
- *		destination region are preserved.
- *
- *		If successful, consumes the copy object.
- *		Otherwise, the caller is responsible for it.
- *
- *	Implementation notes:
- *		To overwrite aligned temporary virtual memory, it is
- *		sufficient to remove the previous mapping and insert
- *		the new copy.  This replacement is done either on
- *		the whole region (if no permanent virtual memory
- *		objects are embedded in the destination region) or
- *		in individual map entries.
- *
- *		To overwrite permanent virtual memory , it is necessary
- *		to copy each page, as the external memory management
- *		interface currently does not provide any optimizations.
- *
- *		Unaligned memory also has to be copied.  It is possible
- *		to use 'vm_trickery' to copy the aligned data.  This is
- *		not done but not hard to implement.
- *
- *		Once a page of permanent memory has been overwritten,
- *		it is impossible to interrupt this function; otherwise,
- *		the call would be neither atomic nor location-independent.
- *		The kernel-state portion of a user thread must be
- *		interruptible.
+ *	vm_map_inherit:
  *
- *		It may be expensive to forward all requests that might
- *		overwrite permanent memory (vm_write, vm_copy) to
- *		uninterruptible kernel threads.  This routine may be
- *		called by interruptible threads; however, success is
- *		not guaranteed -- if the request cannot be performed
- *		atomically and interruptibly, an error indication is
- *		returned.
+ *	Sets the inheritance of the specified address
+ *	range in the target map.  Inheritance
+ *	affects how the map will be shared with
+ *	child maps at the time of vm_map_fork.
  */
-
 kern_return_t
-vm_map_copy_overwrite_nested(
-	vm_map_t	dst_map,
-	vm_offset_t	dst_addr,
-	vm_map_copy_t	copy,
-	boolean_t	interruptible,
-	pmap_t		pmap)
+vm_map_inherit(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	vm_inherit_t    new_inheritance)
 {
-	vm_offset_t	dst_end;
-	vm_map_entry_t	tmp_entry;
-	vm_map_entry_t	entry;
-	kern_return_t	kr;
-	boolean_t	aligned = TRUE;
-	boolean_t	contains_permanent_objects = FALSE;
-	boolean_t	encountered_sub_map = FALSE;
-	vm_offset_t	base_addr;
-	vm_size_t	copy_size;
-	vm_size_t	total_size;
+	vm_map_entry_t  entry;
+	vm_map_entry_t  temp_entry;
 
+	vm_map_lock(map);
 
-	/*
-	 *	Check for null copy object.
-	 */
+	VM_MAP_RANGE_CHECK(map, start, end);
 
-	if (copy == VM_MAP_COPY_NULL)
-		return(KERN_SUCCESS);
+	if (vm_map_lookup_entry(map, start, &temp_entry)) {
+		entry = temp_entry;
+	} else {
+		temp_entry = temp_entry->vme_next;
+		entry = temp_entry;
+	}
 
-	/*
-	 *	Check for special kernel buffer allocated
-	 *	by new_ipc_kmsg_copyin.
-	 */
+	/* first check entire range for submaps which can't support the */
+	/* given inheritance. */
+	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
+		if (entry->is_sub_map) {
+			if (new_inheritance == VM_INHERIT_COPY) {
+				vm_map_unlock(map);
+				return KERN_INVALID_ARGUMENT;
+			}
+		}
 
-	if (copy->type == VM_MAP_COPY_KERNEL_BUFFER) {
-		return(vm_map_copyout_kernel_buffer(
-						dst_map, &dst_addr, 
-					    	copy, TRUE));
+		entry = entry->vme_next;
 	}
 
-	/*
-	 *      Only works for entry lists at the moment.  Will
-	 *	support page lists later.
-	 */
+	entry = temp_entry;
+	if (entry != vm_map_to_entry(map)) {
+		/* clip and unnest if necessary */
+		vm_map_clip_start(map, entry, start);
+	}
 
-	assert(copy->type == VM_MAP_COPY_ENTRY_LIST);
+	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
+		vm_map_clip_end(map, entry, end);
+		if (entry->is_sub_map) {
+			/* clip did unnest if needed */
+			assert(!entry->use_pmap);
+		}
 
-	if (copy->size == 0) {
-		vm_map_copy_discard(copy);
-		return(KERN_SUCCESS);
+		entry->inheritance = new_inheritance;
+
+		entry = entry->vme_next;
 	}
 
-	/*
-	 *	Verify that the destination is all writeable
-	 *	initially.  We have to trunc the destination
-	 *	address and round the copy size or we'll end up
-	 *	splitting entries in strange ways.
-	 */
+	vm_map_unlock(map);
+	return KERN_SUCCESS;
+}
 
-	if (!page_aligned(copy->size) ||
-		!page_aligned (copy->offset) ||
-		!page_aligned (dst_addr))
-	{
-		aligned = FALSE;
-		dst_end = round_page(dst_addr + copy->size);
-	} else {
-		dst_end = dst_addr + copy->size;
-	}
+/*
+ * Update the accounting for the amount of wired memory in this map.  If the user has
+ * exceeded the defined limits, then we fail.  Wiring on behalf of the kernel never fails.
+ */
 
-start_pass_1:
-	vm_map_lock(dst_map);
-	if (!vm_map_lookup_entry(dst_map, dst_addr, &tmp_entry)) {
-		vm_map_unlock(dst_map);
-		return(KERN_INVALID_ADDRESS);
-	}
-	vm_map_clip_start(dst_map, tmp_entry, trunc_page(dst_addr));
-	for (entry = tmp_entry;;) {
-		vm_map_entry_t	next = entry->vme_next;
+static kern_return_t
+add_wire_counts(
+	vm_map_t        map,
+	vm_map_entry_t  entry,
+	boolean_t       user_wire)
+{
+	vm_map_size_t   size;
 
-		while(entry->is_sub_map) {
-			vm_offset_t	sub_start;
-			vm_offset_t	sub_end;
-			vm_offset_t	local_end;
+	if (user_wire) {
+		unsigned int total_wire_count =  vm_page_wire_count + vm_lopage_free_count;
 
-                	if (entry->in_transition) {
+		/*
+		 * We're wiring memory at the request of the user.  Check if this is the first time the user is wiring
+		 * this map entry.
+		 */
 
-                        /*
-                         * Say that we are waiting, and wait for entry.
-                         */
-                        	entry->needs_wakeup = TRUE;
-                        	vm_map_entry_wait(dst_map, THREAD_UNINT);
+		if (entry->user_wired_count == 0) {
+			size = entry->vme_end - entry->vme_start;
 
-				goto start_pass_1;
+			/*
+			 * Since this is the first time the user is wiring this map entry, check to see if we're
+			 * exceeding the user wire limits.  There is a per map limit which is the smaller of either
+			 * the process's rlimit or the global vm_per_task_user_wire_limit which caps this value.  There is also
+			 * a system-wide limit on the amount of memory all users can wire.  If the user is over either
+			 * limit, then we fail.
+			 */
+
+			if (size + map->user_wire_size > MIN(map->user_wire_limit, vm_per_task_user_wire_limit) ||
+			    size + ptoa_64(total_wire_count) > vm_global_user_wire_limit) {
+				return KERN_RESOURCE_SHORTAGE;
 			}
 
-			local_end = entry->vme_end;
-		        if (!(entry->needs_copy)) {
-				/* if needs_copy we are a COW submap */
-				/* in such a case we just replace so */
-				/* there is no need for the follow-  */
-				/* ing check.                        */
-				encountered_sub_map = TRUE;
-				sub_start = entry->offset;
+			/*
+			 * The first time the user wires an entry, we also increment the wired_count and add this to
+			 * the total that has been wired in the map.
+			 */
 
-				if(entry->vme_end < dst_end)
-					sub_end = entry->vme_end;
-				else 
-					sub_end = dst_end;
-				sub_end -= entry->vme_start;
-				sub_end += entry->offset;
-				vm_map_unlock(dst_map);
-			
-				kr = vm_map_overwrite_submap_recurse(
-					entry->object.sub_map,
-					sub_start,
-					sub_end - sub_start);
-				if(kr != KERN_SUCCESS)
-					return kr;
-				vm_map_lock(dst_map);
+			if (entry->wired_count >= MAX_WIRE_COUNT) {
+				return KERN_FAILURE;
 			}
 
-			if (dst_end <= entry->vme_end)
-				goto start_overwrite;
-			if(!vm_map_lookup_entry(dst_map, local_end, 
-						&entry)) {
-				vm_map_unlock(dst_map);
-				return(KERN_INVALID_ADDRESS);
-			}
-			next = entry->vme_next;
+			entry->wired_count++;
+			map->user_wire_size += size;
 		}
 
-		if ( ! (entry->protection & VM_PROT_WRITE)) {
-			vm_map_unlock(dst_map);
-			return(KERN_PROTECTION_FAILURE);
+		if (entry->user_wired_count >= MAX_WIRE_COUNT) {
+			return KERN_FAILURE;
 		}
 
+		entry->user_wired_count++;
+	} else {
 		/*
-		 *	If the entry is in transition, we must wait
-		 *	for it to exit that state.  Anything could happen
-		 *	when we unlock the map, so start over.
+		 * The kernel's wiring the memory.  Just bump the count and continue.
 		 */
-                if (entry->in_transition) {
 
-                        /*
-                         * Say that we are waiting, and wait for entry.
-                         */
-                        entry->needs_wakeup = TRUE;
-                        vm_map_entry_wait(dst_map, THREAD_UNINT);
-
-			goto start_pass_1;
+		if (entry->wired_count >= MAX_WIRE_COUNT) {
+			panic("vm_map_wire: too many wirings");
 		}
 
+		entry->wired_count++;
+	}
+
+	return KERN_SUCCESS;
+}
+
 /*
- *		our range is contained completely within this map entry
- */
-		if (dst_end <= entry->vme_end)
-			break;
-/*
- *		check that range specified is contiguous region
+ * Update the memory wiring accounting now that the given map entry is being unwired.
  */
-		if ((next == vm_map_to_entry(dst_map)) ||
-		    (next->vme_start != entry->vme_end)) {
-			vm_map_unlock(dst_map);
-			return(KERN_INVALID_ADDRESS);
-		}
-
 
+static void
+subtract_wire_counts(
+	vm_map_t        map,
+	vm_map_entry_t  entry,
+	boolean_t       user_wire)
+{
+	if (user_wire) {
 		/*
-		 *	Check for permanent objects in the destination.
+		 * We're unwiring memory at the request of the user.  See if we're removing the last user wire reference.
 		 */
-		if ((entry->object.vm_object != VM_OBJECT_NULL) &&
-			   ((!entry->object.vm_object->internal) ||
-			   (entry->object.vm_object->true_share))) {
-			contains_permanent_objects = TRUE;
-		}
 
-		entry = next;
-	}/* for */
+		if (entry->user_wired_count == 1) {
+			/*
+			 * We're removing the last user wire reference.  Decrement the wired_count and the total
+			 * user wired memory for this map.
+			 */
 
-start_overwrite:
-	/*
-	 *	If there are permanent objects in the destination, then
-	 *	the copy cannot be interrupted.
-	 */
+			assert(entry->wired_count >= 1);
+			entry->wired_count--;
+			map->user_wire_size -= entry->vme_end - entry->vme_start;
+		}
 
-	if (interruptible && contains_permanent_objects) {
-		vm_map_unlock(dst_map);
-		return(KERN_FAILURE);	/* XXX */
+		assert(entry->user_wired_count >= 1);
+		entry->user_wired_count--;
+	} else {
+		/*
+		 * The kernel is unwiring the memory.   Just update the count.
+		 */
+
+		assert(entry->wired_count >= 1);
+		entry->wired_count--;
 	}
+}
 
-	/*
- 	 *
-	 *	Make a second pass, overwriting the data
-	 *	At the beginning of each loop iteration,
-	 *	the next entry to be overwritten is "tmp_entry"
-	 *	(initially, the value returned from the lookup above),
-	 *	and the starting address expected in that entry
-	 *	is "start".
-	 */
+int cs_executable_wire = 0;
 
-	total_size = copy->size;
-	if(encountered_sub_map) {
-		copy_size = 0;
-		/* re-calculate tmp_entry since we've had the map */
-		/* unlocked */
-		if (!vm_map_lookup_entry( dst_map, dst_addr, &tmp_entry)) {
-			vm_map_unlock(dst_map);
-			return(KERN_INVALID_ADDRESS);
+/*
+ *	vm_map_wire:
+ *
+ *	Sets the pageability of the specified address range in the
+ *	target map as wired.  Regions specified as not pageable require
+ *	locked-down physical memory and physical page maps.  The
+ *	access_type variable indicates types of accesses that must not
+ *	generate page faults.  This is checked against protection of
+ *	memory being locked-down.
+ *
+ *	The map must not be locked, but a reference must remain to the
+ *	map throughout the call.
+ */
+static kern_return_t
+vm_map_wire_nested(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_prot_t               caller_prot,
+	vm_tag_t                tag,
+	boolean_t               user_wire,
+	pmap_t                  map_pmap,
+	vm_map_offset_t         pmap_addr,
+	ppnum_t                 *physpage_p)
+{
+	vm_map_entry_t          entry;
+	vm_prot_t               access_type;
+	struct vm_map_entry     *first_entry, tmp_entry;
+	vm_map_t                real_map;
+	vm_map_offset_t         s, e;
+	kern_return_t           rc;
+	boolean_t               need_wakeup;
+	boolean_t               main_map = FALSE;
+	wait_interrupt_t        interruptible_state;
+	thread_t                cur_thread;
+	unsigned int            last_timestamp;
+	vm_map_size_t           size;
+	boolean_t               wire_and_extract;
+
+	access_type = (caller_prot & VM_PROT_ALL);
+
+	wire_and_extract = FALSE;
+	if (physpage_p != NULL) {
+		/*
+		 * The caller wants the physical page number of the
+		 * wired page.  We return only one physical page number
+		 * so this works for only one page at a time.
+		 */
+		if ((end - start) != PAGE_SIZE) {
+			return KERN_INVALID_ARGUMENT;
 		}
+		wire_and_extract = TRUE;
+		*physpage_p = 0;
+	}
+
+	vm_map_lock(map);
+	if (map_pmap == NULL) {
+		main_map = TRUE;
+	}
+	last_timestamp = map->timestamp;
+
+	VM_MAP_RANGE_CHECK(map, start, end);
+	assert(page_aligned(start));
+	assert(page_aligned(end));
+	assert(VM_MAP_PAGE_ALIGNED(start, VM_MAP_PAGE_MASK(map)));
+	assert(VM_MAP_PAGE_ALIGNED(end, VM_MAP_PAGE_MASK(map)));
+	if (start == end) {
+		/* We wired what the caller asked for, zero pages */
+		vm_map_unlock(map);
+		return KERN_SUCCESS;
+	}
+
+	need_wakeup = FALSE;
+	cur_thread = current_thread();
+
+	s = start;
+	rc = KERN_SUCCESS;
+
+	if (vm_map_lookup_entry(map, s, &first_entry)) {
+		entry = first_entry;
+		/*
+		 * vm_map_clip_start will be done later.
+		 * We don't want to unnest any nested submaps here !
+		 */
 	} else {
-		copy_size = copy->size;
+		/* Start address is not in map */
+		rc = KERN_INVALID_ADDRESS;
+		goto done;
 	}
-	
-	base_addr = dst_addr;
-	while(TRUE) {
-		/* deconstruct the copy object and do in parts */
-		/* only in sub_map, interruptable case */
-		vm_map_entry_t	copy_entry;
-		vm_map_entry_t	previous_prev;
-		vm_map_entry_t	next_copy;
-		int		nentries;
-		int		remaining_entries;
-		int		new_offset;
-	
-		for (entry = tmp_entry; copy_size == 0;) {
-			vm_map_entry_t	next;
 
-			next = entry->vme_next;
+	while ((entry != vm_map_to_entry(map)) && (s < end)) {
+		/*
+		 * At this point, we have wired from "start" to "s".
+		 * We still need to wire from "s" to "end".
+		 *
+		 * "entry" hasn't been clipped, so it could start before "s"
+		 * and/or end after "end".
+		 */
 
-			/* tmp_entry and base address are moved along */
-			/* each time we encounter a sub-map.  Otherwise */
-			/* entry can outpase tmp_entry, and the copy_size */
-			/* may reflect the distance between them */
-			/* if the current entry is found to be in transition */
-			/* we will start over at the beginning or the last */
-			/* encounter of a submap as dictated by base_addr */
-			/* we will zero copy_size accordingly. */
-			if (entry->in_transition) {
-                       		/*
-                       		 * Say that we are waiting, and wait for entry.
-                       		 */
-                       		entry->needs_wakeup = TRUE;
-                       		vm_map_entry_wait(dst_map, THREAD_UNINT);
+		/* "e" is how far we want to wire in this entry */
+		e = entry->vme_end;
+		if (e > end) {
+			e = end;
+		}
 
-				vm_map_lock(dst_map);
-				if(!vm_map_lookup_entry(dst_map, base_addr, 
-								&tmp_entry)) {
-					vm_map_unlock(dst_map);
-					return(KERN_INVALID_ADDRESS);
-				}
-				copy_size = 0;
-				entry = tmp_entry;
-				continue;
+		/*
+		 * If another thread is wiring/unwiring this entry then
+		 * block after informing other thread to wake us up.
+		 */
+		if (entry->in_transition) {
+			wait_result_t wait_result;
+
+			/*
+			 * We have not clipped the entry.  Make sure that
+			 * the start address is in range so that the lookup
+			 * below will succeed.
+			 * "s" is the current starting point: we've already
+			 * wired from "start" to "s" and we still have
+			 * to wire from "s" to "end".
+			 */
+
+			entry->needs_wakeup = TRUE;
+
+			/*
+			 * wake up anybody waiting on entries that we have
+			 * already wired.
+			 */
+			if (need_wakeup) {
+				vm_map_entry_wakeup(map);
+				need_wakeup = FALSE;
+			}
+			/*
+			 * User wiring is interruptible
+			 */
+			wait_result = vm_map_entry_wait(map,
+			    (user_wire) ? THREAD_ABORTSAFE :
+			    THREAD_UNINT);
+			if (user_wire && wait_result == THREAD_INTERRUPTED) {
+				/*
+				 * undo the wirings we have done so far
+				 * We do not clear the needs_wakeup flag,
+				 * because we cannot tell if we were the
+				 * only one waiting.
+				 */
+				rc = KERN_FAILURE;
+				goto done;
 			}
-			if(entry->is_sub_map) {
-				vm_offset_t	sub_start;
-				vm_offset_t	sub_end;
-				vm_offset_t	local_end;
 
-		        	if (entry->needs_copy) {
-					/* if this is a COW submap */
-					/* just back the range with a */
-					/* anonymous entry */
-					if(entry->vme_end < dst_end)
-						sub_end = entry->vme_end;
-					else 
-						sub_end = dst_end;
-					if(entry->vme_start < base_addr)
-						sub_start = base_addr;
-					else 
-						sub_start = entry->vme_start;
-					vm_map_clip_end(
-						dst_map, entry, sub_end);
-					vm_map_clip_start(
-						dst_map, entry, sub_start);
-					entry->is_sub_map = FALSE;
-					vm_map_deallocate(
-						entry->object.sub_map);
-					entry->object.sub_map = NULL;
-					entry->is_shared = FALSE;
-					entry->needs_copy = FALSE;
-					entry->offset = 0;
-					entry->protection = VM_PROT_ALL;
-					entry->max_protection = VM_PROT_ALL;
-					entry->wired_count = 0;
-					entry->user_wired_count = 0;
-					if(entry->inheritance 
-							== VM_INHERIT_SHARE) 
-					   entry->inheritance = VM_INHERIT_COPY;
-					continue;
-				}
-				/* first take care of any non-sub_map */
-				/* entries to send */
-				if(base_addr < entry->vme_start) {
-					/* stuff to send */
-					copy_size = 
-						entry->vme_start - base_addr;
-					break;
-				}
-				sub_start = entry->offset;
+			/*
+			 * Cannot avoid a lookup here.  Reset the timestamp.
+			 */
+			last_timestamp = map->timestamp;
 
-				if(entry->vme_end < dst_end)
-					sub_end = entry->vme_end;
-				else 
-					sub_end = dst_end;
-				sub_end -= entry->vme_start;
-				sub_end += entry->offset;
-				local_end = entry->vme_end;
-				vm_map_unlock(dst_map);
-				copy_size = sub_end - sub_start;
+			/*
+			 * The entry could have been clipped, look it up again.
+			 * The worst that can happen is that it may not exist anymore.
+			 */
+			if (!vm_map_lookup_entry(map, s, &first_entry)) {
+				/*
+				 * User: undo everything up to the previous
+				 * entry.  Let vm_map_unwire worry about
+				 * checking the validity of the range.
+				 */
+				rc = KERN_FAILURE;
+				goto done;
+			}
+			entry = first_entry;
+			continue;
+		}
 
-				/* adjust the copy object */
-				if (total_size > copy_size) {
-					vm_size_t	local_size = 0;
-					vm_size_t	entry_size;
-
-				   nentries = 1;
-				   new_offset = copy->offset;
-				   copy_entry = vm_map_copy_first_entry(copy);
-				   while(copy_entry != 
-					         vm_map_copy_to_entry(copy)){
-				       entry_size = copy_entry->vme_end - 
-						      copy_entry->vme_start;
-				       if((local_size < copy_size) &&
-				       		((local_size + entry_size) 
-					         >= copy_size)) {
-				          vm_map_copy_clip_end(copy, 
-					         copy_entry, 
-					         copy_entry->vme_start +
-					         (copy_size - local_size));
-				          entry_size = copy_entry->vme_end - 
-				  		         copy_entry->vme_start;
-					  local_size += entry_size;
-					  new_offset += entry_size;
-				       }
-				       if(local_size >= copy_size) {
-				          next_copy = copy_entry->vme_next;
-					  copy_entry->vme_next = 
-					            vm_map_copy_to_entry(copy);
-				          previous_prev = 
-						   copy->cpy_hdr.links.prev;
-					  copy->cpy_hdr.links.prev = copy_entry;
-				          copy->size = copy_size;
-					  remaining_entries = 
-						        copy->cpy_hdr.nentries;
-					  remaining_entries -= nentries;
-					  copy->cpy_hdr.nentries = nentries;
-				          break;
-				       } else {
-				          local_size += entry_size;
-					  new_offset += entry_size;
-					  nentries++;
-				       }
-				       copy_entry = copy_entry->vme_next;
-				   }
-				}
-			
-				if((entry->use_pmap) && (pmap == NULL)) {
-					kr = vm_map_copy_overwrite_nested(
-						entry->object.sub_map,
-						sub_start,
-						copy,
-						interruptible, 
-						entry->object.sub_map->pmap);
-				} else if (pmap != NULL) {
-					kr = vm_map_copy_overwrite_nested(
-						entry->object.sub_map,
-						sub_start,
-						copy,
-						interruptible, pmap);
+		if (entry->is_sub_map) {
+			vm_map_offset_t sub_start;
+			vm_map_offset_t sub_end;
+			vm_map_offset_t local_start;
+			vm_map_offset_t local_end;
+			pmap_t          pmap;
+
+			if (wire_and_extract) {
+				/*
+				 * Wiring would result in copy-on-write
+				 * which would not be compatible with
+				 * the sharing we have with the original
+				 * provider of this memory.
+				 */
+				rc = KERN_INVALID_ARGUMENT;
+				goto done;
+			}
+
+			vm_map_clip_start(map, entry, s);
+			vm_map_clip_end(map, entry, end);
+
+			sub_start = VME_OFFSET(entry);
+			sub_end = entry->vme_end;
+			sub_end += VME_OFFSET(entry) - entry->vme_start;
+
+			local_end = entry->vme_end;
+			if (map_pmap == NULL) {
+				vm_object_t             object;
+				vm_object_offset_t      offset;
+				vm_prot_t               prot;
+				boolean_t               wired;
+				vm_map_entry_t          local_entry;
+				vm_map_version_t         version;
+				vm_map_t                lookup_map;
+
+				if (entry->use_pmap) {
+					pmap = VME_SUBMAP(entry)->pmap;
+					/* ppc implementation requires that */
+					/* submaps pmap address ranges line */
+					/* up with parent map */
+#ifdef notdef
+					pmap_addr = sub_start;
+#endif
+					pmap_addr = s;
 				} else {
-					kr = vm_map_copy_overwrite_nested(
-						entry->object.sub_map,
-						sub_start,
-						copy,
-						interruptible,
-						dst_map->pmap);
-				}
-				if(kr != KERN_SUCCESS) {
-					if(next_copy != NULL) {
-					   copy->cpy_hdr.nentries += 
-							   remaining_entries;
-				           copy->cpy_hdr.links.prev->vme_next = 
-							   next_copy;
-				           copy->cpy_hdr.links.prev 
-							   = previous_prev;
-					   copy->size = total_size;
+					pmap = map->pmap;
+					pmap_addr = s;
+				}
+
+				if (entry->wired_count) {
+					if ((rc = add_wire_counts(map, entry, user_wire)) != KERN_SUCCESS) {
+						goto done;
 					}
-					return kr;
+
+					/*
+					 * The map was not unlocked:
+					 * no need to goto re-lookup.
+					 * Just go directly to next entry.
+					 */
+					entry = entry->vme_next;
+					s = entry->vme_start;
+					continue;
 				}
-				if (dst_end <= local_end) {
-					return(KERN_SUCCESS);
+
+				/* call vm_map_lookup_locked to */
+				/* cause any needs copy to be   */
+				/* evaluated */
+				local_start = entry->vme_start;
+				lookup_map = map;
+				vm_map_lock_write_to_read(map);
+				if (vm_map_lookup_locked(
+					    &lookup_map, local_start,
+					    access_type | VM_PROT_COPY,
+					    OBJECT_LOCK_EXCLUSIVE,
+					    &version, &object,
+					    &offset, &prot, &wired,
+					    NULL,
+					    &real_map)) {
+					vm_map_unlock_read(lookup_map);
+					assert(map_pmap == NULL);
+					vm_map_unwire(map, start,
+					    s, user_wire);
+					return KERN_FAILURE;
 				}
-				/* otherwise copy no longer exists, it was */
-				/* destroyed after successful copy_overwrite */
-			        copy = (vm_map_copy_t) 
-						zalloc(vm_map_copy_zone);
-				vm_map_copy_first_entry(copy) =
-				   vm_map_copy_last_entry(copy) =
-			           vm_map_copy_to_entry(copy);
-				copy->type = VM_MAP_COPY_ENTRY_LIST;
-				copy->offset = new_offset;
+				vm_object_unlock(object);
+				if (real_map != lookup_map) {
+					vm_map_unlock(real_map);
+				}
+				vm_map_unlock_read(lookup_map);
+				vm_map_lock(map);
 
-				total_size -= copy_size;
-				copy_size = 0;
-				/* put back remainder of copy in container */
-				if(next_copy != NULL) {
-				   copy->cpy_hdr.nentries = remaining_entries;
-				   copy->cpy_hdr.links.next = next_copy;
-			           copy->cpy_hdr.links.prev = previous_prev;
-				   copy->size = total_size;
-				   next_copy->vme_prev = 
-					         vm_map_copy_to_entry(copy);
-				   next_copy = NULL;
+				/* we unlocked, so must re-lookup */
+				if (!vm_map_lookup_entry(map,
+				    local_start,
+				    &local_entry)) {
+					rc = KERN_FAILURE;
+					goto done;
 				}
-				base_addr = local_end;
-				vm_map_lock(dst_map);
-				if(!vm_map_lookup_entry(dst_map, 
-						local_end, &tmp_entry)) {
-					vm_map_unlock(dst_map);
-					return(KERN_INVALID_ADDRESS);
+
+				/*
+				 * entry could have been "simplified",
+				 * so re-clip
+				 */
+				entry = local_entry;
+				assert(s == local_start);
+				vm_map_clip_start(map, entry, s);
+				vm_map_clip_end(map, entry, end);
+				/* re-compute "e" */
+				e = entry->vme_end;
+				if (e > end) {
+					e = end;
 				}
-				entry = tmp_entry;
-				continue;
-			} 
-			if (dst_end <= entry->vme_end) {
-				copy_size = dst_end - base_addr;
-				break;
+
+				/* did we have a change of type? */
+				if (!entry->is_sub_map) {
+					last_timestamp = map->timestamp;
+					continue;
+				}
+			} else {
+				local_start = entry->vme_start;
+				pmap = map_pmap;
 			}
 
-			if ((next == vm_map_to_entry(dst_map)) ||
-				    (next->vme_start != entry->vme_end)) {
-				vm_map_unlock(dst_map);
-				return(KERN_INVALID_ADDRESS);
+			if ((rc = add_wire_counts(map, entry, user_wire)) != KERN_SUCCESS) {
+				goto done;
 			}
 
-			entry = next;
-		}/* for */
+			entry->in_transition = TRUE;
 
-		next_copy = NULL;
-		nentries = 1;
+			vm_map_unlock(map);
+			rc = vm_map_wire_nested(VME_SUBMAP(entry),
+			    sub_start, sub_end,
+			    caller_prot, tag,
+			    user_wire, pmap, pmap_addr,
+			    NULL);
+			vm_map_lock(map);
 
-		/* adjust the copy object */
-		if (total_size > copy_size) {
-			vm_size_t	local_size = 0;
-			vm_size_t	entry_size;
+			/*
+			 * Find the entry again.  It could have been clipped
+			 * after we unlocked the map.
+			 */
+			if (!vm_map_lookup_entry(map, local_start,
+			    &first_entry)) {
+				panic("vm_map_wire: re-lookup failed");
+			}
+			entry = first_entry;
 
-			new_offset = copy->offset;
-			copy_entry = vm_map_copy_first_entry(copy);
-			while(copy_entry != vm_map_copy_to_entry(copy)) {
-				entry_size = copy_entry->vme_end - 
-						copy_entry->vme_start;
-				if((local_size < copy_size) &&
-						((local_size + entry_size) 
-						>= copy_size)) {
-					vm_map_copy_clip_end(copy, copy_entry, 
-						copy_entry->vme_start +
-						(copy_size - local_size));
-					entry_size = copy_entry->vme_end - 
-				  		   copy_entry->vme_start;
-					local_size += entry_size;
-					new_offset += entry_size;
+			assert(local_start == s);
+			/* re-compute "e" */
+			e = entry->vme_end;
+			if (e > end) {
+				e = end;
+			}
+
+			last_timestamp = map->timestamp;
+			while ((entry != vm_map_to_entry(map)) &&
+			    (entry->vme_start < e)) {
+				assert(entry->in_transition);
+				entry->in_transition = FALSE;
+				if (entry->needs_wakeup) {
+					entry->needs_wakeup = FALSE;
+					need_wakeup = TRUE;
 				}
-				if(local_size >= copy_size) {
-					next_copy = copy_entry->vme_next;
-					copy_entry->vme_next = 
-						vm_map_copy_to_entry(copy);
-					previous_prev = 
-						copy->cpy_hdr.links.prev;
-					copy->cpy_hdr.links.prev = copy_entry;
-					copy->size = copy_size;
-					remaining_entries = 
-						copy->cpy_hdr.nentries;
-					remaining_entries -= nentries;
-					copy->cpy_hdr.nentries = nentries;
-					break;
-				} else {
-					local_size += entry_size;
-					new_offset += entry_size;
-					nentries++;
+				if (rc != KERN_SUCCESS) {/* from vm_*_wire */
+					subtract_wire_counts(map, entry, user_wire);
 				}
-				copy_entry = copy_entry->vme_next;
+				entry = entry->vme_next;
+			}
+			if (rc != KERN_SUCCESS) {       /* from vm_*_wire */
+				goto done;
 			}
-		}
-
-		if (aligned) {
-			pmap_t	local_pmap;
 
-			if(pmap)
-				local_pmap = pmap;
-			else
-				local_pmap = dst_map->pmap;
+			/* no need to relookup again */
+			s = entry->vme_start;
+			continue;
+		}
 
-			if ((kr =  vm_map_copy_overwrite_aligned( 
-				dst_map, tmp_entry, copy,
-				base_addr, local_pmap)) != KERN_SUCCESS) {
-				if(next_copy != NULL) {
-					copy->cpy_hdr.nentries += 
-							   remaining_entries;
-				        copy->cpy_hdr.links.prev->vme_next = 
-							   next_copy;
-			       		copy->cpy_hdr.links.prev = 
-							previous_prev;
-					copy->size += copy_size;
-				}
-				return kr;
-			}
-			vm_map_unlock(dst_map);
-		} else {
 		/*
-		 * Performance gain:
-		 *
-		 * if the copy and dst address are misaligned but the same
-		 * offset within the page we can copy_not_aligned the
-		 * misaligned parts and copy aligned the rest.  If they are
-		 * aligned but len is unaligned we simply need to copy
-		 * the end bit unaligned.  We'll need to split the misaligned
-		 * bits of the region in this case !
-		 */
-		/* ALWAYS UNLOCKS THE dst_map MAP */
-			if ((kr =  vm_map_copy_overwrite_unaligned( dst_map,
-				tmp_entry, copy, base_addr)) != KERN_SUCCESS) {
-				if(next_copy != NULL) {
-					copy->cpy_hdr.nentries +=
-							     remaining_entries;
-			       		copy->cpy_hdr.links.prev->vme_next = 
-							     next_copy;
-			       		copy->cpy_hdr.links.prev = 
-						previous_prev;
-					copy->size += copy_size;
+		 * If this entry is already wired then increment
+		 * the appropriate wire reference count.
+		 */
+		if (entry->wired_count) {
+			if ((entry->protection & access_type) != access_type) {
+				/* found a protection problem */
+
+				/*
+				 * XXX FBDP
+				 * We should always return an error
+				 * in this case but since we didn't
+				 * enforce it before, let's do
+				 * it only for the new "wire_and_extract"
+				 * code path for now...
+				 */
+				if (wire_and_extract) {
+					rc = KERN_PROTECTION_FAILURE;
+					goto done;
 				}
-				return kr;
 			}
-		}
-		total_size -= copy_size;
-		if(total_size == 0)
-			break;
-		base_addr += copy_size;
-		copy_size = 0;
-		copy->offset = new_offset;
-		if(next_copy != NULL) {
-			copy->cpy_hdr.nentries = remaining_entries;
-			copy->cpy_hdr.links.next = next_copy;
-			copy->cpy_hdr.links.prev = previous_prev;
-			next_copy->vme_prev = vm_map_copy_to_entry(copy);
-			copy->size = total_size;
-		}
-		vm_map_lock(dst_map);
-		while(TRUE) {
-			if (!vm_map_lookup_entry(dst_map, 
-						base_addr, &tmp_entry)) {
-				vm_map_unlock(dst_map);
-				return(KERN_INVALID_ADDRESS);
+
+			/*
+			 * entry is already wired down, get our reference
+			 * after clipping to our range.
+			 */
+			vm_map_clip_start(map, entry, s);
+			vm_map_clip_end(map, entry, end);
+
+			if ((rc = add_wire_counts(map, entry, user_wire)) != KERN_SUCCESS) {
+				goto done;
 			}
-                	if (tmp_entry->in_transition) {
-                       		entry->needs_wakeup = TRUE;
-                       		vm_map_entry_wait(dst_map, THREAD_UNINT);
-			} else {
-				break;
+
+			if (wire_and_extract) {
+				vm_object_t             object;
+				vm_object_offset_t      offset;
+				vm_page_t               m;
+
+				/*
+				 * We don't have to "wire" the page again
+				 * but we still have to "extract" its
+				 * physical page number, after some sanity
+				 * checks.
+				 */
+				assert((entry->vme_end - entry->vme_start)
+				    == PAGE_SIZE);
+				assert(!entry->needs_copy);
+				assert(!entry->is_sub_map);
+				assert(VME_OBJECT(entry));
+				if (((entry->vme_end - entry->vme_start)
+				    != PAGE_SIZE) ||
+				    entry->needs_copy ||
+				    entry->is_sub_map ||
+				    VME_OBJECT(entry) == VM_OBJECT_NULL) {
+					rc = KERN_INVALID_ARGUMENT;
+					goto done;
+				}
+
+				object = VME_OBJECT(entry);
+				offset = VME_OFFSET(entry);
+				/* need exclusive lock to update m->dirty */
+				if (entry->protection & VM_PROT_WRITE) {
+					vm_object_lock(object);
+				} else {
+					vm_object_lock_shared(object);
+				}
+				m = vm_page_lookup(object, offset);
+				assert(m != VM_PAGE_NULL);
+				assert(VM_PAGE_WIRED(m));
+				if (m != VM_PAGE_NULL && VM_PAGE_WIRED(m)) {
+					*physpage_p = VM_PAGE_GET_PHYS_PAGE(m);
+					if (entry->protection & VM_PROT_WRITE) {
+						vm_object_lock_assert_exclusive(
+							object);
+						m->vmp_dirty = TRUE;
+					}
+				} else {
+					/* not already wired !? */
+					*physpage_p = 0;
+				}
+				vm_object_unlock(object);
 			}
+
+			/* map was not unlocked: no need to relookup */
+			entry = entry->vme_next;
+			s = entry->vme_start;
+			continue;
 		}
-		vm_map_clip_start(dst_map, tmp_entry, trunc_page(base_addr));
 
-		entry = tmp_entry;
-	} /* while */
+		/*
+		 * Unwired entry or wire request transmitted via submap
+		 */
 
-	/*
-	 *	Throw away the vm_map_copy object
-	 */
-	vm_map_copy_discard(copy);
+		/*
+		 * Wiring would copy the pages to the shadow object.
+		 * The shadow object would not be code-signed so
+		 * attempting to execute code from these copied pages
+		 * would trigger a code-signing violation.
+		 */
 
-	return(KERN_SUCCESS);
-}/* vm_map_copy_overwrite */
+		if ((entry->protection & VM_PROT_EXECUTE)
+#if !CONFIG_EMBEDDED
+		    &&
+		    map != kernel_map &&
+		    cs_process_enforcement(NULL)
+#endif /* !CONFIG_EMBEDDED */
+		    ) {
+#if MACH_ASSERT
+			printf("pid %d[%s] wiring executable range from "
+			    "0x%llx to 0x%llx: rejected to preserve "
+			    "code-signing\n",
+			    proc_selfpid(),
+			    (current_task()->bsd_info
+			    ? proc_name_address(current_task()->bsd_info)
+			    : "?"),
+			    (uint64_t) entry->vme_start,
+			    (uint64_t) entry->vme_end);
+#endif /* MACH_ASSERT */
+			DTRACE_VM2(cs_executable_wire,
+			    uint64_t, (uint64_t)entry->vme_start,
+			    uint64_t, (uint64_t)entry->vme_end);
+			cs_executable_wire++;
+			rc = KERN_PROTECTION_FAILURE;
+			goto done;
+		}
 
-kern_return_t
-vm_map_copy_overwrite(
-	vm_map_t	dst_map,
-	vm_offset_t	dst_addr,
-	vm_map_copy_t	copy,
-	boolean_t	interruptible)
-{
-	return vm_map_copy_overwrite_nested(
-			dst_map, dst_addr, copy, interruptible, (pmap_t) NULL);
-}
+		/*
+		 * Perform actions of vm_map_lookup that need the write
+		 * lock on the map: create a shadow object for a
+		 * copy-on-write region, or an object for a zero-fill
+		 * region.
+		 */
+		size = entry->vme_end - entry->vme_start;
+		/*
+		 * If wiring a copy-on-write page, we need to copy it now
+		 * even if we're only (currently) requesting read access.
+		 * This is aggressive, but once it's wired we can't move it.
+		 */
+		if (entry->needs_copy) {
+			if (wire_and_extract) {
+				/*
+				 * We're supposed to share with the original
+				 * provider so should not be "needs_copy"
+				 */
+				rc = KERN_INVALID_ARGUMENT;
+				goto done;
+			}
 
+			VME_OBJECT_SHADOW(entry, size);
+			entry->needs_copy = FALSE;
+		} else if (VME_OBJECT(entry) == VM_OBJECT_NULL) {
+			if (wire_and_extract) {
+				/*
+				 * We're supposed to share with the original
+				 * provider so should already have an object.
+				 */
+				rc = KERN_INVALID_ARGUMENT;
+				goto done;
+			}
+			VME_OBJECT_SET(entry, vm_object_allocate(size));
+			VME_OFFSET_SET(entry, (vm_object_offset_t)0);
+			assert(entry->use_pmap);
+		}
 
-/*
- *	Routine: vm_map_copy_overwrite_unaligned
- *
- *	Decription:
- *	Physically copy unaligned data
- *
- *	Implementation:
- *	Unaligned parts of pages have to be physically copied.  We use
- *	a modified form of vm_fault_copy (which understands none-aligned
- *	page offsets and sizes) to do the copy.  We attempt to copy as
- *	much memory in one go as possibly, however vm_fault_copy copies
- *	within 1 memory object so we have to find the smaller of "amount left"
- *	"source object data size" and "target object data size".  With
- *	unaligned data we don't need to split regions, therefore the source
- *	(copy) object should be one map entry, the target range may be split
- *	over multiple map entries however.  In any event we are pessimistic
- *	about these assumptions.
- *
- *	Assumptions:
- *	dst_map is locked on entry and is return locked on success,
- *	unlocked on error.
- */
+		vm_map_clip_start(map, entry, s);
+		vm_map_clip_end(map, entry, end);
 
-kern_return_t
-vm_map_copy_overwrite_unaligned(
-	vm_map_t	dst_map,
-	vm_map_entry_t	entry,
-	vm_map_copy_t	copy,
-	vm_offset_t	start)
-{
-	vm_map_entry_t		copy_entry = vm_map_copy_first_entry(copy);
-	vm_map_version_t	version;
-	vm_object_t		dst_object;
-	vm_object_offset_t	dst_offset;
-	vm_object_offset_t	src_offset;
-	vm_object_offset_t	entry_offset;
-	vm_offset_t		entry_end;
-	vm_size_t		src_size,
-				dst_size,
-				copy_size,
-				amount_left;
-	kern_return_t		kr = KERN_SUCCESS;
+		/* re-compute "e" */
+		e = entry->vme_end;
+		if (e > end) {
+			e = end;
+		}
 
-	vm_map_lock_write_to_read(dst_map);
+		/*
+		 * Check for holes and protection mismatch.
+		 * Holes: Next entry should be contiguous unless this
+		 *	  is the end of the region.
+		 * Protection: Access requested must be allowed, unless
+		 *	wiring is by protection class
+		 */
+		if ((entry->vme_end < end) &&
+		    ((entry->vme_next == vm_map_to_entry(map)) ||
+		    (entry->vme_next->vme_start > entry->vme_end))) {
+			/* found a hole */
+			rc = KERN_INVALID_ADDRESS;
+			goto done;
+		}
+		if ((entry->protection & access_type) != access_type) {
+			/* found a protection problem */
+			rc = KERN_PROTECTION_FAILURE;
+			goto done;
+		}
 
-	src_offset = copy->offset - trunc_page_64(copy->offset);
-	amount_left = copy->size;
-/*
- *	unaligned so we never clipped this entry, we need the offset into
- *	the vm_object not just the data.
- */	
-	while (amount_left > 0) {
+		assert(entry->wired_count == 0 && entry->user_wired_count == 0);
 
-		if (entry == vm_map_to_entry(dst_map)) {
-			vm_map_unlock_read(dst_map);
-			return KERN_INVALID_ADDRESS;
+		if ((rc = add_wire_counts(map, entry, user_wire)) != KERN_SUCCESS) {
+			goto done;
 		}
 
-		/* "start" must be within the current map entry */
-		assert ((start>=entry->vme_start) && (start<entry->vme_end));
+		entry->in_transition = TRUE;
 
-		dst_offset = start - entry->vme_start;
+		/*
+		 * This entry might get split once we unlock the map.
+		 * In vm_fault_wire(), we need the current range as
+		 * defined by this entry.  In order for this to work
+		 * along with a simultaneous clip operation, we make a
+		 * temporary copy of this entry and use that for the
+		 * wiring.  Note that the underlying objects do not
+		 * change during a clip.
+		 */
+		tmp_entry = *entry;
 
-		dst_size = entry->vme_end - start;
+		/*
+		 * The in_transition state guarantees that the entry
+		 * (or entries for this range, if split occurred) will be
+		 * there when the map lock is acquired for the second time.
+		 */
+		vm_map_unlock(map);
 
-		src_size = copy_entry->vme_end -
-			(copy_entry->vme_start + src_offset);
+		if (!user_wire && cur_thread != THREAD_NULL) {
+			interruptible_state = thread_interrupt_level(THREAD_UNINT);
+		} else {
+			interruptible_state = THREAD_UNINT;
+		}
 
-		if (dst_size < src_size) {
-/*
- *			we can only copy dst_size bytes before
- *			we have to get the next destination entry
- */
-			copy_size = dst_size;
+		if (map_pmap) {
+			rc = vm_fault_wire(map,
+			    &tmp_entry, caller_prot, tag, map_pmap, pmap_addr,
+			    physpage_p);
 		} else {
-/*
- *			we can only copy src_size bytes before
- *			we have to get the next source copy entry
- */
-			copy_size = src_size;
+			rc = vm_fault_wire(map,
+			    &tmp_entry, caller_prot, tag, map->pmap,
+			    tmp_entry.vme_start,
+			    physpage_p);
 		}
 
-		if (copy_size > amount_left) {
-			copy_size = amount_left;
+		if (!user_wire && cur_thread != THREAD_NULL) {
+			thread_interrupt_level(interruptible_state);
 		}
-/*
- *		Entry needs copy, create a shadow shadow object for
- *		Copy on write region.
- */
-		if (entry->needs_copy &&
-			 ((entry->protection & VM_PROT_WRITE) != 0))
-		{
-			if (vm_map_lock_read_to_write(dst_map)) {
-				vm_map_lock_read(dst_map);
-				goto RetryLookup;
+
+		vm_map_lock(map);
+
+		if (last_timestamp + 1 != map->timestamp) {
+			/*
+			 * Find the entry again.  It could have been clipped
+			 * after we unlocked the map.
+			 */
+			if (!vm_map_lookup_entry(map, tmp_entry.vme_start,
+			    &first_entry)) {
+				panic("vm_map_wire: re-lookup failed");
 			}
-			vm_object_shadow(&entry->object.vm_object,
-					&entry->offset,
-					(vm_size_t)(entry->vme_end
-						- entry->vme_start));
-			entry->needs_copy = FALSE;
-			vm_map_lock_write_to_read(dst_map);
+
+			entry = first_entry;
 		}
-		dst_object = entry->object.vm_object;
-/*
- *		unlike with the virtual (aligned) copy we're going
- *		to fault on it therefore we need a target object.
- */
-                if (dst_object == VM_OBJECT_NULL) {
-			if (vm_map_lock_read_to_write(dst_map)) {
-				vm_map_lock_read(dst_map);
-				goto RetryLookup;
+
+		last_timestamp = map->timestamp;
+
+		while ((entry != vm_map_to_entry(map)) &&
+		    (entry->vme_start < tmp_entry.vme_end)) {
+			assert(entry->in_transition);
+			entry->in_transition = FALSE;
+			if (entry->needs_wakeup) {
+				entry->needs_wakeup = FALSE;
+				need_wakeup = TRUE;
 			}
-			dst_object = vm_object_allocate((vm_size_t)
-					entry->vme_end - entry->vme_start);
-			entry->object.vm_object = dst_object;
-			entry->offset = 0;
-			vm_map_lock_write_to_read(dst_map);
+			if (rc != KERN_SUCCESS) {       /* from vm_*_wire */
+				subtract_wire_counts(map, entry, user_wire);
+			}
+			entry = entry->vme_next;
 		}
-/*
- *		Take an object reference and unlock map. The "entry" may
- *		disappear or change when the map is unlocked.
- */
-		vm_object_reference(dst_object);
-		version.main_timestamp = dst_map->timestamp;
-		entry_offset = entry->offset;
-		entry_end = entry->vme_end;
-		vm_map_unlock_read(dst_map);
-/*
- *		Copy as much as possible in one pass
- */
-		kr = vm_fault_copy(
-			copy_entry->object.vm_object,
-			copy_entry->offset + src_offset,
-			&copy_size,
-			dst_object,
-			entry_offset + dst_offset,
-			dst_map,
-			&version,
-			THREAD_UNINT );
-
-		start += copy_size;
-		src_offset += copy_size;
-		amount_left -= copy_size;
-/*
- *		Release the object reference
- */
-		vm_object_deallocate(dst_object);
-/*
- *		If a hard error occurred, return it now
- */
-		if (kr != KERN_SUCCESS)
-			return kr;
 
-		if ((copy_entry->vme_start + src_offset) == copy_entry->vme_end
-			|| amount_left == 0)
-		{
-/*
- *			all done with this copy entry, dispose.
- */
-			vm_map_copy_entry_unlink(copy, copy_entry);
-			vm_object_deallocate(copy_entry->object.vm_object);
-			vm_map_copy_entry_dispose(copy, copy_entry);
+		if (rc != KERN_SUCCESS) {               /* from vm_*_wire */
+			goto done;
+		}
 
-			if ((copy_entry = vm_map_copy_first_entry(copy))
-				== vm_map_copy_to_entry(copy) && amount_left) {
-/*
- *				not finished copying but run out of source
- */
-				return KERN_INVALID_ADDRESS;
-			}
-			src_offset = 0;
+		if ((entry != vm_map_to_entry(map)) && /* we still have entries in the map */
+		    (tmp_entry.vme_end != end) &&    /* AND, we are not at the end of the requested range */
+		    (entry->vme_start != tmp_entry.vme_end)) { /* AND, the next entry is not contiguous. */
+			/* found a "new" hole */
+			s = tmp_entry.vme_end;
+			rc = KERN_INVALID_ADDRESS;
+			goto done;
 		}
 
-		if (amount_left == 0)
-			return KERN_SUCCESS;
+		s = entry->vme_start;
+	} /* end while loop through map entries */
 
-		vm_map_lock_read(dst_map);
-		if (version.main_timestamp == dst_map->timestamp) {
-			if (start == entry_end) {
-/*
- *				destination region is split.  Use the version
- *				information to avoid a lookup in the normal
- *				case.
- */
-				entry = entry->vme_next;
-/*
- *				should be contiguous. Fail if we encounter
- *				a hole in the destination.
- */
-				if (start != entry->vme_start) {
-					vm_map_unlock_read(dst_map);
-					return KERN_INVALID_ADDRESS ;
-				}
-			}
-		} else {
-/*
- *			Map version check failed.
- *			we must lookup the entry because somebody
- *			might have changed the map behind our backs.
- */
-RetryLookup:
-			if (!vm_map_lookup_entry(dst_map, start, &entry))
-			{
-				vm_map_unlock_read(dst_map);
-				return KERN_INVALID_ADDRESS ;
-			}
-		}
-	}/* while */
+done:
+	if (rc == KERN_SUCCESS) {
+		/* repair any damage we may have made to the VM map */
+		vm_map_simplify_range(map, start, end);
+	}
 
-	/* NOTREACHED ?? */
-	vm_map_unlock_read(dst_map);
+	vm_map_unlock(map);
 
-	return KERN_SUCCESS;
-}/* vm_map_copy_overwrite_unaligned */
+	/*
+	 * wake up anybody waiting on entries we wired.
+	 */
+	if (need_wakeup) {
+		vm_map_entry_wakeup(map);
+	}
 
-/*
- *	Routine:	vm_map_copy_overwrite_aligned
- *
- *	Description:
- *	Does all the vm_trickery possible for whole pages.
- *
- *	Implementation:
- *
- *	If there are no permanent objects in the destination,
- *	and the source and destination map entry zones match,
- *	and the destination map entry is not shared,
- *	then the map entries can be deleted and replaced
- *	with those from the copy.  The following code is the
- *	basic idea of what to do, but there are lots of annoying
- *	little details about getting protection and inheritance
- *	right.  Should add protection, inheritance, and sharing checks
- *	to the above pass and make sure that no wiring is involved.
- */
+	if (rc != KERN_SUCCESS) {
+		/* undo what has been wired so far */
+		vm_map_unwire_nested(map, start, s, user_wire,
+		    map_pmap, pmap_addr);
+		if (physpage_p) {
+			*physpage_p = 0;
+		}
+	}
+
+	return rc;
+}
 
 kern_return_t
-vm_map_copy_overwrite_aligned(
-	vm_map_t	dst_map,
-	vm_map_entry_t	tmp_entry,
-	vm_map_copy_t	copy,
-	vm_offset_t	start,
-	pmap_t		pmap)
-{
-	vm_object_t	object;
-	vm_map_entry_t	copy_entry;
-	vm_size_t	copy_size;
-	vm_size_t	size;
-	vm_map_entry_t	entry;
-		
-	while ((copy_entry = vm_map_copy_first_entry(copy))
-		!= vm_map_copy_to_entry(copy))
-	{
-		copy_size = (copy_entry->vme_end - copy_entry->vme_start);
-		
-		entry = tmp_entry;
-		if (entry == vm_map_to_entry(dst_map)) {
-			vm_map_unlock(dst_map);
-			return KERN_INVALID_ADDRESS;
-		}
-		size = (entry->vme_end - entry->vme_start);
-		/*
-		 *	Make sure that no holes popped up in the
-		 *	address map, and that the protection is
-		 *	still valid, in case the map was unlocked
-		 *	earlier.
-		 */
+vm_map_wire_external(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_prot_t               caller_prot,
+	boolean_t               user_wire)
+{
+	kern_return_t   kret;
 
-		if ((entry->vme_start != start) || ((entry->is_sub_map)
-				&& !entry->needs_copy)) {
-			vm_map_unlock(dst_map);
-			return(KERN_INVALID_ADDRESS);
-		}
-		assert(entry != vm_map_to_entry(dst_map));
+	kret = vm_map_wire_nested(map, start, end, caller_prot, vm_tag_bt(),
+	    user_wire, (pmap_t)NULL, 0, NULL);
+	return kret;
+}
 
-		/*
-		 *	Check protection again
-		 */
+kern_return_t
+vm_map_wire_kernel(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_prot_t               caller_prot,
+	vm_tag_t                tag,
+	boolean_t               user_wire)
+{
+	kern_return_t   kret;
 
-		if ( ! (entry->protection & VM_PROT_WRITE)) {
-			vm_map_unlock(dst_map);
-			return(KERN_PROTECTION_FAILURE);
-		}
+	kret = vm_map_wire_nested(map, start, end, caller_prot, tag,
+	    user_wire, (pmap_t)NULL, 0, NULL);
+	return kret;
+}
 
-		/*
-		 *	Adjust to source size first
-		 */
+kern_return_t
+vm_map_wire_and_extract_external(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_prot_t       caller_prot,
+	boolean_t       user_wire,
+	ppnum_t         *physpage_p)
+{
+	kern_return_t   kret;
+
+	kret = vm_map_wire_nested(map,
+	    start,
+	    start + VM_MAP_PAGE_SIZE(map),
+	    caller_prot,
+	    vm_tag_bt(),
+	    user_wire,
+	    (pmap_t)NULL,
+	    0,
+	    physpage_p);
+	if (kret != KERN_SUCCESS &&
+	    physpage_p != NULL) {
+		*physpage_p = 0;
+	}
+	return kret;
+}
 
-		if (copy_size < size) {
-			vm_map_clip_end(dst_map, entry, entry->vme_start + copy_size);
-			size = copy_size;
-		}
+kern_return_t
+vm_map_wire_and_extract_kernel(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_prot_t       caller_prot,
+	vm_tag_t        tag,
+	boolean_t       user_wire,
+	ppnum_t         *physpage_p)
+{
+	kern_return_t   kret;
+
+	kret = vm_map_wire_nested(map,
+	    start,
+	    start + VM_MAP_PAGE_SIZE(map),
+	    caller_prot,
+	    tag,
+	    user_wire,
+	    (pmap_t)NULL,
+	    0,
+	    physpage_p);
+	if (kret != KERN_SUCCESS &&
+	    physpage_p != NULL) {
+		*physpage_p = 0;
+	}
+	return kret;
+}
 
-		/*
-		 *	Adjust to destination size
-		 */
+/*
+ *	vm_map_unwire:
+ *
+ *	Sets the pageability of the specified address range in the target
+ *	as pageable.  Regions specified must have been wired previously.
+ *
+ *	The map must not be locked, but a reference must remain to the map
+ *	throughout the call.
+ *
+ *	Kernel will panic on failures.  User unwire ignores holes and
+ *	unwired and in-transition entries to avoid losing memory by leaving
+ *	it unwired.
+ */
+static kern_return_t
+vm_map_unwire_nested(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	boolean_t               user_wire,
+	pmap_t                  map_pmap,
+	vm_map_offset_t         pmap_addr)
+{
+	vm_map_entry_t          entry;
+	struct vm_map_entry     *first_entry, tmp_entry;
+	boolean_t               need_wakeup;
+	boolean_t               main_map = FALSE;
+	unsigned int            last_timestamp;
 
-		if (size < copy_size) {
-			vm_map_copy_clip_end(copy, copy_entry,
-				copy_entry->vme_start + size);
-			copy_size = size;
-		}
+	vm_map_lock(map);
+	if (map_pmap == NULL) {
+		main_map = TRUE;
+	}
+	last_timestamp = map->timestamp;
 
-		assert((entry->vme_end - entry->vme_start) == size);
-		assert((tmp_entry->vme_end - tmp_entry->vme_start) == size);
-		assert((copy_entry->vme_end - copy_entry->vme_start) == size);
+	VM_MAP_RANGE_CHECK(map, start, end);
+	assert(page_aligned(start));
+	assert(page_aligned(end));
+	assert(VM_MAP_PAGE_ALIGNED(start, VM_MAP_PAGE_MASK(map)));
+	assert(VM_MAP_PAGE_ALIGNED(end, VM_MAP_PAGE_MASK(map)));
+
+	if (start == end) {
+		/* We unwired what the caller asked for: zero pages */
+		vm_map_unlock(map);
+		return KERN_SUCCESS;
+	}
 
+	if (vm_map_lookup_entry(map, start, &first_entry)) {
+		entry = first_entry;
 		/*
-		 *	If the destination contains temporary unshared memory,
-		 *	we can perform the copy by throwing it away and
-		 *	installing the source data.
+		 * vm_map_clip_start will be done later.
+		 * We don't want to unnest any nested sub maps here !
 		 */
+	} else {
+		if (!user_wire) {
+			panic("vm_map_unwire: start not found");
+		}
+		/*	Start address is not in map. */
+		vm_map_unlock(map);
+		return KERN_INVALID_ADDRESS;
+	}
 
-		object = entry->object.vm_object;
-		if ((!entry->is_shared && 
-		    ((object == VM_OBJECT_NULL) || 
-		    (object->internal && !object->true_share))) ||
-		    entry->needs_copy) {
-			vm_object_t	old_object = entry->object.vm_object;
-			vm_object_offset_t	old_offset = entry->offset;
-			vm_object_offset_t	offset;
+	if (entry->superpage_size) {
+		/* superpages are always wired */
+		vm_map_unlock(map);
+		return KERN_INVALID_ADDRESS;
+	}
 
+	need_wakeup = FALSE;
+	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
+		if (entry->in_transition) {
 			/*
-			 * Ensure that the source and destination aren't
-			 * identical
+			 * 1)
+			 * Another thread is wiring down this entry. Note
+			 * that if it were not for the other thread, we would
+			 * be unwiring an unwired entry.  This is not
+			 * permitted.  If we wait, we will be unwiring memory
+			 * we did not wire.
+			 *
+			 * 2)
+			 * Another thread is unwiring this entry.  We did not
+			 * have a reference to it, because if we did, this
+			 * entry will not be getting unwired now.
 			 */
-			if (old_object == copy_entry->object.vm_object &&
-			    old_offset == copy_entry->offset) {
-				vm_map_copy_entry_unlink(copy, copy_entry);
-				vm_map_copy_entry_dispose(copy, copy_entry);
+			if (!user_wire) {
+				/*
+				 * XXX FBDP
+				 * This could happen:  there could be some
+				 * overlapping vslock/vsunlock operations
+				 * going on.
+				 * We should probably just wait and retry,
+				 * but then we have to be careful that this
+				 * entry could get "simplified" after
+				 * "in_transition" gets unset and before
+				 * we re-lookup the entry, so we would
+				 * have to re-clip the entry to avoid
+				 * re-unwiring what we have already unwired...
+				 * See vm_map_wire_nested().
+				 *
+				 * Or we could just ignore "in_transition"
+				 * here and proceed to decrement the wired
+				 * count(s) on this entry.  That should be fine
+				 * as long as "wired_count" doesn't drop all
+				 * the way to 0 (and we should panic if THAT
+				 * happens).
+				 */
+				panic("vm_map_unwire: in_transition entry");
+			}
 
-				if (old_object != VM_OBJECT_NULL)
-					vm_object_deallocate(old_object);
+			entry = entry->vme_next;
+			continue;
+		}
 
-				start = tmp_entry->vme_end;
-				tmp_entry = tmp_entry->vme_next;
-				continue;
-			}
+		if (entry->is_sub_map) {
+			vm_map_offset_t sub_start;
+			vm_map_offset_t sub_end;
+			vm_map_offset_t local_end;
+			pmap_t          pmap;
 
-			if (old_object != VM_OBJECT_NULL) {
-				if(entry->is_sub_map) {
-				   if(entry->use_pmap) {
-#ifndef i386
-				      pmap_unnest(dst_map->pmap, 
-					entry->vme_start,
-					entry->vme_end - entry->vme_start);
-#endif
-				   } else {
-				      vm_map_submap_pmap_clean(
-					dst_map, entry->vme_start, 
-					entry->vme_end,
-					entry->object.sub_map,
-					entry->offset);
-				   }
-				   vm_map_deallocate(
-						entry->object.sub_map);
-				} else {
-					vm_object_pmap_protect(
-						old_object,
-						old_offset,
-						size,
-						pmap,
-						tmp_entry->vme_start,
-						VM_PROT_NONE);
+			vm_map_clip_start(map, entry, start);
+			vm_map_clip_end(map, entry, end);
 
-					vm_object_deallocate(old_object);
+			sub_start = VME_OFFSET(entry);
+			sub_end = entry->vme_end - entry->vme_start;
+			sub_end += VME_OFFSET(entry);
+			local_end = entry->vme_end;
+			if (map_pmap == NULL) {
+				if (entry->use_pmap) {
+					pmap = VME_SUBMAP(entry)->pmap;
+					pmap_addr = sub_start;
+				} else {
+					pmap = map->pmap;
+					pmap_addr = start;
+				}
+				if (entry->wired_count == 0 ||
+				    (user_wire && entry->user_wired_count == 0)) {
+					if (!user_wire) {
+						panic("vm_map_unwire: entry is unwired");
+					}
+					entry = entry->vme_next;
+					continue;
 				}
-			}
 
-			entry->is_sub_map = FALSE;
-			entry->object = copy_entry->object;
-			object = entry->object.vm_object;
-			entry->needs_copy = copy_entry->needs_copy;
-			entry->wired_count = 0;
-			entry->user_wired_count = 0;
-			offset = entry->offset = copy_entry->offset;
+				/*
+				 * Check for holes
+				 * Holes: Next entry should be contiguous unless
+				 * this is the end of the region.
+				 */
+				if (((entry->vme_end < end) &&
+				    ((entry->vme_next == vm_map_to_entry(map)) ||
+				    (entry->vme_next->vme_start
+				    > entry->vme_end)))) {
+					if (!user_wire) {
+						panic("vm_map_unwire: non-contiguous region");
+					}
+/*
+ *                                       entry = entry->vme_next;
+ *                                       continue;
+ */
+				}
 
-			vm_map_copy_entry_unlink(copy, copy_entry);
-			vm_map_copy_entry_dispose(copy, copy_entry);
-#if BAD_OPTIMIZATION
-			/*
-			 * if we turn this optimization back on
-			 * we need to revisit our use of pmap mappings
-			 * large copies will cause us to run out and panic
-			 * this optimization only saved on average 2 us per page if ALL
-			 * the pages in the source were currently mapped
-			 * and ALL the pages in the dest were touched, if there were fewer
-			 * than 2/3 of the pages touched, this optimization actually cost more cycles
-			 */
+				subtract_wire_counts(map, entry, user_wire);
 
-			/*
-			 * Try to aggressively enter physical mappings
-			 * (but avoid uninstantiated objects)
-			 */
-			if (object != VM_OBJECT_NULL) {
-			    vm_offset_t	va = entry->vme_start;
+				if (entry->wired_count != 0) {
+					entry = entry->vme_next;
+					continue;
+				}
 
-			    while (va < entry->vme_end) {
-				register vm_page_t	m;
-				vm_prot_t		prot;
+				entry->in_transition = TRUE;
+				tmp_entry = *entry;/* see comment in vm_map_wire() */
 
 				/*
-				 * Look for the page in the top object
+				 * We can unlock the map now. The in_transition state
+				 * guarantees existence of the entry.
 				 */
-				prot = entry->protection;
-				vm_object_lock(object);
-				vm_object_paging_begin(object);
-
-				if ((m = vm_page_lookup(object,offset)) !=
-				    VM_PAGE_NULL && !m->busy && 
-				    !m->fictitious &&
-				    (!m->unusual || (!m->error &&
-					!m->restart && !m->absent &&
-					 (prot & m->page_lock) == 0))) {
-					
-					m->busy = TRUE;
-					vm_object_unlock(object);
-					
-					/* 
-					 * Honor COW obligations
+				vm_map_unlock(map);
+				vm_map_unwire_nested(VME_SUBMAP(entry),
+				    sub_start, sub_end, user_wire, pmap, pmap_addr);
+				vm_map_lock(map);
+
+				if (last_timestamp + 1 != map->timestamp) {
+					/*
+					 * Find the entry again.  It could have been
+					 * clipped or deleted after we unlocked the map.
 					 */
-					if (entry->needs_copy)
-						prot &= ~VM_PROT_WRITE;
-					/* It is our policy to require */
-					/* explicit sync from anyone   */
-					/* writing code and then       */
-					/* a pc to execute it.         */
-					/* No isync here */
-
-					PMAP_ENTER(pmap, va, m,
-						   prot, FALSE);
-		
-					vm_object_lock(object);
-					vm_page_lock_queues();
-					if (!m->active && !m->inactive)
-						vm_page_activate(m);
-					vm_page_unlock_queues();
-					 PAGE_WAKEUP_DONE(m);
+					if (!vm_map_lookup_entry(map,
+					    tmp_entry.vme_start,
+					    &first_entry)) {
+						if (!user_wire) {
+							panic("vm_map_unwire: re-lookup failed");
+						}
+						entry = first_entry->vme_next;
+					} else {
+						entry = first_entry;
+					}
 				}
-				vm_object_paging_end(object);
-				vm_object_unlock(object);
-
-				offset += PAGE_SIZE_64;
-				va += PAGE_SIZE;
-			    } /* end while (va < entry->vme_end) */
-			} /* end if (object) */
-#endif
-			/*
-			 *	Set up for the next iteration.  The map
-			 *	has not been unlocked, so the next
-			 *	address should be at the end of this
-			 *	entry, and the next map entry should be
-			 *	the one following it.
-			 */
+				last_timestamp = map->timestamp;
 
-			start = tmp_entry->vme_end;
-			tmp_entry = tmp_entry->vme_next;
-		} else {
-			vm_map_version_t	version;
-			vm_object_t		dst_object = entry->object.vm_object;
-			vm_object_offset_t	dst_offset = entry->offset;
-			kern_return_t		r;
+				/*
+				 * clear transition bit for all constituent entries
+				 * that were in the original entry (saved in
+				 * tmp_entry).  Also check for waiters.
+				 */
+				while ((entry != vm_map_to_entry(map)) &&
+				    (entry->vme_start < tmp_entry.vme_end)) {
+					assert(entry->in_transition);
+					entry->in_transition = FALSE;
+					if (entry->needs_wakeup) {
+						entry->needs_wakeup = FALSE;
+						need_wakeup = TRUE;
+					}
+					entry = entry->vme_next;
+				}
+				continue;
+			} else {
+				vm_map_unlock(map);
+				vm_map_unwire_nested(VME_SUBMAP(entry),
+				    sub_start, sub_end, user_wire, map_pmap,
+				    pmap_addr);
+				vm_map_lock(map);
 
-			/*
-			 *	Take an object reference, and record
-			 *	the map version information so that the
-			 *	map can be safely unlocked.
-			 */
+				if (last_timestamp + 1 != map->timestamp) {
+					/*
+					 * Find the entry again.  It could have been
+					 * clipped or deleted after we unlocked the map.
+					 */
+					if (!vm_map_lookup_entry(map,
+					    tmp_entry.vme_start,
+					    &first_entry)) {
+						if (!user_wire) {
+							panic("vm_map_unwire: re-lookup failed");
+						}
+						entry = first_entry->vme_next;
+					} else {
+						entry = first_entry;
+					}
+				}
+				last_timestamp = map->timestamp;
+			}
+		}
 
-			vm_object_reference(dst_object);
 
-			version.main_timestamp = dst_map->timestamp;
+		if ((entry->wired_count == 0) ||
+		    (user_wire && entry->user_wired_count == 0)) {
+			if (!user_wire) {
+				panic("vm_map_unwire: entry is unwired");
+			}
 
-			vm_map_unlock(dst_map);
+			entry = entry->vme_next;
+			continue;
+		}
 
-			/*
-			 *	Copy as much as possible in one pass
-			 */
+		assert(entry->wired_count > 0 &&
+		    (!user_wire || entry->user_wired_count > 0));
 
-			copy_size = size;
-			r = vm_fault_copy(
-					copy_entry->object.vm_object,
-					copy_entry->offset,
-					&copy_size,
-					dst_object,
-					dst_offset,
-					dst_map,
-					&version,
-					THREAD_UNINT );
+		vm_map_clip_start(map, entry, start);
+		vm_map_clip_end(map, entry, end);
 
-			/*
-			 *	Release the object reference
-			 */
+		/*
+		 * Check for holes
+		 * Holes: Next entry should be contiguous unless
+		 *	  this is the end of the region.
+		 */
+		if (((entry->vme_end < end) &&
+		    ((entry->vme_next == vm_map_to_entry(map)) ||
+		    (entry->vme_next->vme_start > entry->vme_end)))) {
+			if (!user_wire) {
+				panic("vm_map_unwire: non-contiguous region");
+			}
+			entry = entry->vme_next;
+			continue;
+		}
 
-			vm_object_deallocate(dst_object);
+		subtract_wire_counts(map, entry, user_wire);
 
-			/*
-			 *	If a hard error occurred, return it now
-			 */
+		if (entry->wired_count != 0) {
+			entry = entry->vme_next;
+			continue;
+		}
 
-			if (r != KERN_SUCCESS)
-				return(r);
+		if (entry->zero_wired_pages) {
+			entry->zero_wired_pages = FALSE;
+		}
 
-			if (copy_size != 0) {
-				/*
-				 *	Dispose of the copied region
-				 */
+		entry->in_transition = TRUE;
+		tmp_entry = *entry;     /* see comment in vm_map_wire() */
 
-				vm_map_copy_clip_end(copy, copy_entry,
-					copy_entry->vme_start + copy_size);
-				vm_map_copy_entry_unlink(copy, copy_entry);
-				vm_object_deallocate(copy_entry->object.vm_object);
-				vm_map_copy_entry_dispose(copy, copy_entry);
-			}
+		/*
+		 * We can unlock the map now. The in_transition state
+		 * guarantees existence of the entry.
+		 */
+		vm_map_unlock(map);
+		if (map_pmap) {
+			vm_fault_unwire(map,
+			    &tmp_entry, FALSE, map_pmap, pmap_addr);
+		} else {
+			vm_fault_unwire(map,
+			    &tmp_entry, FALSE, map->pmap,
+			    tmp_entry.vme_start);
+		}
+		vm_map_lock(map);
 
+		if (last_timestamp + 1 != map->timestamp) {
 			/*
-			 *	Pick up in the destination map where we left off.
-			 *
-			 *	Use the version information to avoid a lookup
-			 *	in the normal case.
+			 * Find the entry again.  It could have been clipped
+			 * or deleted after we unlocked the map.
 			 */
-
-			start += copy_size;
-			vm_map_lock(dst_map);
-			if ((version.main_timestamp + 1) == dst_map->timestamp) {
-				/* We can safely use saved tmp_entry value */
-
-				vm_map_clip_end(dst_map, tmp_entry, start);
-				tmp_entry = tmp_entry->vme_next;
+			if (!vm_map_lookup_entry(map, tmp_entry.vme_start,
+			    &first_entry)) {
+				if (!user_wire) {
+					panic("vm_map_unwire: re-lookup failed");
+				}
+				entry = first_entry->vme_next;
 			} else {
-				/* Must do lookup of tmp_entry */
+				entry = first_entry;
+			}
+		}
+		last_timestamp = map->timestamp;
 
-				if (!vm_map_lookup_entry(dst_map, start, &tmp_entry)) {
-					vm_map_unlock(dst_map);
-					return(KERN_INVALID_ADDRESS);
-				}
-				vm_map_clip_start(dst_map, tmp_entry, start);
+		/*
+		 * clear transition bit for all constituent entries that
+		 * were in the original entry (saved in tmp_entry).  Also
+		 * check for waiters.
+		 */
+		while ((entry != vm_map_to_entry(map)) &&
+		    (entry->vme_start < tmp_entry.vme_end)) {
+			assert(entry->in_transition);
+			entry->in_transition = FALSE;
+			if (entry->needs_wakeup) {
+				entry->needs_wakeup = FALSE;
+				need_wakeup = TRUE;
 			}
+			entry = entry->vme_next;
 		}
-	}/* while */
+	}
+
+	/*
+	 * We might have fragmented the address space when we wired this
+	 * range of addresses.  Attempt to re-coalesce these VM map entries
+	 * with their neighbors now that they're no longer wired.
+	 * Under some circumstances, address space fragmentation can
+	 * prevent VM object shadow chain collapsing, which can cause
+	 * swap space leaks.
+	 */
+	vm_map_simplify_range(map, start, end);
+
+	vm_map_unlock(map);
+	/*
+	 * wake up anybody waiting on entries that we have unwired.
+	 */
+	if (need_wakeup) {
+		vm_map_entry_wakeup(map);
+	}
+	return KERN_SUCCESS;
+}
+
+kern_return_t
+vm_map_unwire(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	boolean_t               user_wire)
+{
+	return vm_map_unwire_nested(map, start, end,
+	           user_wire, (pmap_t)NULL, 0);
+}
 
-	return(KERN_SUCCESS);
-}/* vm_map_copy_overwrite_aligned */
 
 /*
- *	Routine:	vm_map_copyin_kernel_buffer
- *
- *	Description:
- *		Copy in data to a kernel buffer from space in the
- *		source map. The original space may be otpionally
- *		deallocated.
+ *	vm_map_entry_delete:	[ internal use only ]
  *
- *		If successful, returns a new copy object.
+ *	Deallocate the given entry from the target map.
  */
-kern_return_t
-vm_map_copyin_kernel_buffer(
-	vm_map_t	src_map,
-	vm_offset_t	src_addr,
-	vm_size_t	len,
-	boolean_t	src_destroy,
-	vm_map_copy_t	*copy_result)
+static void
+vm_map_entry_delete(
+	vm_map_t        map,
+	vm_map_entry_t  entry)
 {
-	boolean_t flags;
-	vm_map_copy_t copy;
-	vm_size_t kalloc_size = sizeof(struct vm_map_copy) + len;
+	vm_map_offset_t s, e;
+	vm_object_t     object;
+	vm_map_t        submap;
 
-	copy = (vm_map_copy_t) kalloc(kalloc_size);
-	if (copy == VM_MAP_COPY_NULL) {
-		return KERN_RESOURCE_SHORTAGE;
+	s = entry->vme_start;
+	e = entry->vme_end;
+	assert(page_aligned(s));
+	assert(page_aligned(e));
+	if (entry->map_aligned == TRUE) {
+		assert(VM_MAP_PAGE_ALIGNED(s, VM_MAP_PAGE_MASK(map)));
+		assert(VM_MAP_PAGE_ALIGNED(e, VM_MAP_PAGE_MASK(map)));
 	}
-	copy->type = VM_MAP_COPY_KERNEL_BUFFER;
-	copy->size = len;
-	copy->offset = 0;
-	copy->cpy_kdata = (vm_offset_t) (copy + 1);
-	copy->cpy_kalloc_size = kalloc_size;
+	assert(entry->wired_count == 0);
+	assert(entry->user_wired_count == 0);
+	assert(!entry->permanent);
 
-	if (src_map == kernel_map) {
-		bcopy((char *)src_addr, (char *)copy->cpy_kdata, len);
-		flags = VM_MAP_REMOVE_KUNWIRE | VM_MAP_REMOVE_WAIT_FOR_KWIRE |
-		        VM_MAP_REMOVE_INTERRUPTIBLE;
+	if (entry->is_sub_map) {
+		object = NULL;
+		submap = VME_SUBMAP(entry);
 	} else {
-		kern_return_t kr;
-		kr = copyinmap(src_map, src_addr, copy->cpy_kdata, len);
-		if (kr != KERN_SUCCESS) {
-			kfree((vm_offset_t)copy, kalloc_size);
-			return kr;
-		}
-		flags = VM_MAP_REMOVE_WAIT_FOR_KWIRE |
-		        VM_MAP_REMOVE_INTERRUPTIBLE;
+		submap = NULL;
+		object = VME_OBJECT(entry);
 	}
-	if (src_destroy) {
-		(void) vm_map_remove(src_map, trunc_page(src_addr), 
-				     round_page(src_addr + len),
-				     flags);
+
+	vm_map_store_entry_unlink(map, entry);
+	map->size -= e - s;
+
+	vm_map_entry_dispose(map, entry);
+
+	vm_map_unlock(map);
+	/*
+	 *	Deallocate the object only after removing all
+	 *	pmap entries pointing to its pages.
+	 */
+	if (submap) {
+		vm_map_deallocate(submap);
+	} else {
+		vm_object_deallocate(object);
 	}
-	*copy_result = copy;
-	return KERN_SUCCESS;
 }
 
-/*
- *	Routine:	vm_map_copyout_kernel_buffer
- *
- *	Description:
- *		Copy out data from a kernel buffer into space in the
- *		destination map. The space may be otpionally dynamically
- *		allocated.
- *
- *		If successful, consumes the copy object.
- *		Otherwise, the caller is responsible for it.
- */
-kern_return_t
-vm_map_copyout_kernel_buffer(
-	vm_map_t	map,
-	vm_offset_t	*addr,	/* IN/OUT */
-	vm_map_copy_t	copy,
-	boolean_t	overwrite)
+void
+vm_map_submap_pmap_clean(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	vm_map_t        sub_map,
+	vm_map_offset_t offset)
 {
-	kern_return_t kr = KERN_SUCCESS;
-	thread_act_t thr_act = current_act();
-
-	if (!overwrite) {
+	vm_map_offset_t submap_start;
+	vm_map_offset_t submap_end;
+	vm_map_size_t   remove_size;
+	vm_map_entry_t  entry;
 
-		/*
-		 * Allocate space in the target map for the data
-		 */
-		*addr = 0;
-		kr = vm_map_enter(map, 
-				  addr, 
-				  round_page(copy->size),
-				  (vm_offset_t) 0, 
-				  TRUE,
-				  VM_OBJECT_NULL, 
-				  (vm_object_offset_t) 0, 
-				  FALSE,
-				  VM_PROT_DEFAULT, 
-				  VM_PROT_ALL,
-				  VM_INHERIT_DEFAULT);
-		if (kr != KERN_SUCCESS)
-			return(kr);
-	}
+	submap_end = offset + (end - start);
+	submap_start = offset;
 
-	/*
-	 * Copyout the data from the kernel buffer to the target map.
-	 */	
-	if (thr_act->map == map) {
-	
-		/*
-		 * If the target map is the current map, just do
-		 * the copy.
-		 */
-		if (copyout((char *)copy->cpy_kdata, (char *)*addr,
-				copy->size)) {
-			return(KERN_INVALID_ADDRESS);
+	vm_map_lock_read(sub_map);
+	if (vm_map_lookup_entry(sub_map, offset, &entry)) {
+		remove_size = (entry->vme_end - entry->vme_start);
+		if (offset > entry->vme_start) {
+			remove_size -= offset - entry->vme_start;
 		}
-	}
-	else {
-		vm_map_t oldmap;
 
-		/*
-		 * If the target map is another map, assume the
-		 * target's address space identity for the duration
-		 * of the copy.
-		 */
-		vm_map_reference(map);
-		oldmap = vm_map_switch(map);
 
-		if (copyout((char *)copy->cpy_kdata, (char *)*addr,
-				copy->size)) {
-			return(KERN_INVALID_ADDRESS);
+		if (submap_end < entry->vme_end) {
+			remove_size -=
+			    entry->vme_end - submap_end;
+		}
+		if (entry->is_sub_map) {
+			vm_map_submap_pmap_clean(
+				sub_map,
+				start,
+				start + remove_size,
+				VME_SUBMAP(entry),
+				VME_OFFSET(entry));
+		} else {
+			if (map->mapped_in_other_pmaps &&
+			    os_ref_get_count(&map->map_refcnt) != 0 &&
+			    VME_OBJECT(entry) != NULL) {
+				vm_object_pmap_protect_options(
+					VME_OBJECT(entry),
+					(VME_OFFSET(entry) +
+					offset -
+					entry->vme_start),
+					remove_size,
+					PMAP_NULL,
+					entry->vme_start,
+					VM_PROT_NONE,
+					PMAP_OPTIONS_REMOVE);
+			} else {
+				pmap_remove(map->pmap,
+				    (addr64_t)start,
+				    (addr64_t)(start + remove_size));
+			}
 		}
-	
-		(void) vm_map_switch(oldmap);
-		vm_map_deallocate(map);
 	}
 
-	kfree((vm_offset_t)copy, copy->cpy_kalloc_size);
+	entry = entry->vme_next;
 
-	return(kr);
+	while ((entry != vm_map_to_entry(sub_map))
+	    && (entry->vme_start < submap_end)) {
+		remove_size = (entry->vme_end - entry->vme_start);
+		if (submap_end < entry->vme_end) {
+			remove_size -= entry->vme_end - submap_end;
+		}
+		if (entry->is_sub_map) {
+			vm_map_submap_pmap_clean(
+				sub_map,
+				(start + entry->vme_start) - offset,
+				((start + entry->vme_start) - offset) + remove_size,
+				VME_SUBMAP(entry),
+				VME_OFFSET(entry));
+		} else {
+			if (map->mapped_in_other_pmaps &&
+			    os_ref_get_count(&map->map_refcnt) != 0 &&
+			    VME_OBJECT(entry) != NULL) {
+				vm_object_pmap_protect_options(
+					VME_OBJECT(entry),
+					VME_OFFSET(entry),
+					remove_size,
+					PMAP_NULL,
+					entry->vme_start,
+					VM_PROT_NONE,
+					PMAP_OPTIONS_REMOVE);
+			} else {
+				pmap_remove(map->pmap,
+				    (addr64_t)((start + entry->vme_start)
+				    - offset),
+				    (addr64_t)(((start + entry->vme_start)
+				    - offset) + remove_size));
+			}
+		}
+		entry = entry->vme_next;
+	}
+	vm_map_unlock_read(sub_map);
+	return;
 }
-		
-/*
- *	Macro:		vm_map_copy_insert
- *	
- *	Description:
- *		Link a copy chain ("copy") into a map at the
- *		specified location (after "where").
- *	Side effects:
- *		The copy chain is destroyed.
- *	Warning:
- *		The arguments are evaluated multiple times.
- */
-#define	vm_map_copy_insert(map, where, copy)				\
-MACRO_BEGIN								\
-	vm_map_t VMCI_map;						\
-	vm_map_entry_t VMCI_where;					\
-	vm_map_copy_t VMCI_copy;					\
-	VMCI_map = (map);						\
-	VMCI_where = (where);						\
-	VMCI_copy = (copy);						\
-	((VMCI_where->vme_next)->vme_prev = vm_map_copy_last_entry(VMCI_copy))\
-		->vme_next = (VMCI_where->vme_next);			\
-	((VMCI_where)->vme_next = vm_map_copy_first_entry(VMCI_copy))	\
-		->vme_prev = VMCI_where;				\
-	VMCI_map->hdr.nentries += VMCI_copy->cpy_hdr.nentries;		\
-	UPDATE_FIRST_FREE(VMCI_map, VMCI_map->first_free);		\
-	zfree(vm_map_copy_zone, (vm_offset_t) VMCI_copy);		\
-MACRO_END
 
 /*
- *	Routine:	vm_map_copyout
- *
- *	Description:
- *		Copy out a copy chain ("copy") into newly-allocated
- *		space in the destination map.
+ *     virt_memory_guard_ast:
  *
- *		If successful, consumes the copy object.
- *		Otherwise, the caller is responsible for it.
+ *     Handle the AST callout for a virtual memory guard.
+ *	   Raise an EXC_GUARD exception and terminate the task
+ *     if configured to do so.
  */
-kern_return_t
-vm_map_copyout(
-	register vm_map_t	dst_map,
-	vm_offset_t		*dst_addr,	/* OUT */
-	register vm_map_copy_t	copy)
+void
+virt_memory_guard_ast(
+	thread_t thread,
+	mach_exception_data_type_t code,
+	mach_exception_data_type_t subcode)
 {
-	vm_size_t		size;
-	vm_size_t		adjustment;
-	vm_offset_t		start;
-	vm_object_offset_t	vm_copy_start;
-	vm_map_entry_t		last;
-	register
-	vm_map_entry_t		entry;
+	task_t task = thread->task;
+	assert(task != kernel_task);
+	assert(task == current_task());
+	uint32_t behavior;
 
-	/*
-	 *	Check for null copy object.
-	 */
+	behavior = task->task_exc_guard;
 
-	if (copy == VM_MAP_COPY_NULL) {
-		*dst_addr = 0;
-		return(KERN_SUCCESS);
+	/* Is delivery enabled */
+	if ((behavior & TASK_EXC_GUARD_VM_DELIVER) == 0) {
+		return;
 	}
 
-	/*
-	 *	Check for special copy object, created
-	 *	by vm_map_copyin_object.
-	 */
-
-	if (copy->type == VM_MAP_COPY_OBJECT) {
-		vm_object_t 		object = copy->cpy_object;
-		kern_return_t 		kr;
-		vm_object_offset_t	offset;
+	/* If only once, make sure we're that once */
+	while (behavior & TASK_EXC_GUARD_VM_ONCE) {
+		uint32_t new_behavior = behavior & ~TASK_EXC_GUARD_VM_DELIVER;
 
-		offset = trunc_page_64(copy->offset);
-		size = round_page(copy->size + 
-				(vm_size_t)(copy->offset - offset));
-		*dst_addr = 0;
-		kr = vm_map_enter(dst_map, dst_addr, size,
-				  (vm_offset_t) 0, TRUE,
-				  object, offset, FALSE,
-				  VM_PROT_DEFAULT, VM_PROT_ALL,
-				  VM_INHERIT_DEFAULT);
-		if (kr != KERN_SUCCESS)
-			return(kr);
-		/* Account for non-pagealigned copy object */
-		*dst_addr += (vm_offset_t)(copy->offset - offset);
-		zfree(vm_map_copy_zone, (vm_offset_t) copy);
-		return(KERN_SUCCESS);
+		if (OSCompareAndSwap(behavior, new_behavior, &task->task_exc_guard)) {
+			break;
+		}
+		behavior = task->task_exc_guard;
+		if ((behavior & TASK_EXC_GUARD_VM_DELIVER) == 0) {
+			return;
+		}
 	}
 
-	/*
-	 *	Check for special kernel buffer allocated
-	 *	by new_ipc_kmsg_copyin.
-	 */
-
-	if (copy->type == VM_MAP_COPY_KERNEL_BUFFER) {
-		return(vm_map_copyout_kernel_buffer(dst_map, dst_addr, 
-						    copy, FALSE));
+	/* Raise exception via corpse fork or synchronously */
+	if ((task->task_exc_guard & TASK_EXC_GUARD_VM_CORPSE) &&
+	    (task->task_exc_guard & TASK_EXC_GUARD_VM_FATAL) == 0) {
+		task_violated_guard(code, subcode, NULL);
+	} else {
+		task_exception_notify(EXC_GUARD, code, subcode);
 	}
 
-	/*
-	 *	Find space for the data
-	 */
-
-	vm_copy_start = trunc_page_64(copy->offset);
-	size =	round_page((vm_size_t)copy->offset + copy->size) 
-							- vm_copy_start;
-
- StartAgain: ;
-
-	vm_map_lock(dst_map);
-	assert(first_free_is_valid(dst_map));
-	start = ((last = dst_map->first_free) == vm_map_to_entry(dst_map)) ?
-		vm_map_min(dst_map) : last->vme_end;
-
-	while (TRUE) {
-		vm_map_entry_t	next = last->vme_next;
-		vm_offset_t	end = start + size;
+	/* Terminate the task if desired */
+	if (task->task_exc_guard & TASK_EXC_GUARD_VM_FATAL) {
+		task_bsdtask_kill(current_task());
+	}
+}
 
-		if ((end > dst_map->max_offset) || (end < start)) {
-			if (dst_map->wait_for_space) {
-				if (size <= (dst_map->max_offset - dst_map->min_offset)) {
-					assert_wait((event_t) dst_map,
-						    THREAD_INTERRUPTIBLE);
-					vm_map_unlock(dst_map);
-					thread_block((void (*)(void))0);
-					goto StartAgain;
-				}
-			}
-			vm_map_unlock(dst_map);
-			return(KERN_NO_SPACE);
-		}
+/*
+ *     vm_map_guard_exception:
+ *
+ *     Generate a GUARD_TYPE_VIRTUAL_MEMORY EXC_GUARD exception.
+ *
+ *     Right now, we do this when a deallocation of a user address
+ *     range was requested and we find nothing mapped there, or a
+ *     gap in the mapping. We report the address of the first gap found.
+ */
+static void
+vm_map_guard_exception(
+	vm_map_offset_t gap_start,
+	unsigned reason)
+{
+	mach_exception_code_t code = 0;
+	unsigned int guard_type = GUARD_TYPE_VIRT_MEMORY;
+	unsigned int target = 0; /* should we pass in pid associated with map? */
+	mach_exception_data_type_t subcode = (uint64_t)gap_start;
+	boolean_t fatal = FALSE;
 
-		if ((next == vm_map_to_entry(dst_map)) ||
-		    (next->vme_start >= end))
-			break;
+	task_t task = current_task();
 
-		last = next;
-		start = last->vme_end;
+	/* Can't deliver exceptions to kernel task */
+	if (task == kernel_task) {
+		return;
 	}
 
-	/*
-	 *	Since we're going to just drop the map
-	 *	entries from the copy into the destination
-	 *	map, they must come from the same pool.
-	 */
-
-	if (copy->cpy_hdr.entries_pageable != dst_map->hdr.entries_pageable) {
-	    /*
-	     * Mismatches occur when dealing with the default
-	     * pager.
-	     */
-	    zone_t		old_zone;
-	    vm_map_entry_t	next, new;
-
-	    /*
-	     * Find the zone that the copies were allocated from
-	     */
-	    old_zone = (copy->cpy_hdr.entries_pageable)
-			? vm_map_entry_zone
-			: vm_map_kentry_zone;
-	    entry = vm_map_copy_first_entry(copy);
+	EXC_GUARD_ENCODE_TYPE(code, guard_type);
+	EXC_GUARD_ENCODE_FLAVOR(code, reason);
+	EXC_GUARD_ENCODE_TARGET(code, target);
 
-	    /*
-	     * Reinitialize the copy so that vm_map_copy_entry_link
-	     * will work.
-	     */
-	    copy->cpy_hdr.nentries = 0;
-	    copy->cpy_hdr.entries_pageable = dst_map->hdr.entries_pageable;
-	    vm_map_copy_first_entry(copy) =
-	     vm_map_copy_last_entry(copy) =
-		vm_map_copy_to_entry(copy);
+	if (task->task_exc_guard & TASK_EXC_GUARD_VM_FATAL) {
+		fatal = TRUE;
+	}
+	thread_guard_violation(current_thread(), code, subcode, fatal);
+}
 
-	    /*
-	     * Copy each entry.
-	     */
-	    while (entry != vm_map_copy_to_entry(copy)) {
-		new = vm_map_copy_entry_create(copy);
-		vm_map_entry_copy_full(new, entry);
-		new->use_pmap = FALSE;	/* clr address space specifics */
-		vm_map_copy_entry_link(copy,
-				vm_map_copy_last_entry(copy),
-				new);
-		next = entry->vme_next;
-		zfree(old_zone, (vm_offset_t) entry);
-		entry = next;
-	    }
+/*
+ *	vm_map_delete:	[ internal use only ]
+ *
+ *	Deallocates the given address range from the target map.
+ *	Removes all user wirings. Unwires one kernel wiring if
+ *	VM_MAP_REMOVE_KUNWIRE is set.  Waits for kernel wirings to go
+ *	away if VM_MAP_REMOVE_WAIT_FOR_KWIRE is set.  Sleeps
+ *	interruptibly if VM_MAP_REMOVE_INTERRUPTIBLE is set.
+ *
+ *	This routine is called with map locked and leaves map locked.
+ */
+static kern_return_t
+vm_map_delete(
+	vm_map_t                map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	int                     flags,
+	vm_map_t                zap_map)
+{
+	vm_map_entry_t          entry, next;
+	struct   vm_map_entry   *first_entry, tmp_entry;
+	vm_map_offset_t         s;
+	vm_object_t             object;
+	boolean_t               need_wakeup;
+	unsigned int            last_timestamp = ~0; /* unlikely value */
+	int                     interruptible;
+	vm_map_offset_t         gap_start;
+	__unused vm_map_offset_t save_start = start;
+	__unused vm_map_offset_t save_end = end;
+	const vm_map_offset_t   FIND_GAP = 1;   /* a not page aligned value */
+	const vm_map_offset_t   GAPS_OK = 2;    /* a different not page aligned value */
+
+	if (map != kernel_map && !(flags & VM_MAP_REMOVE_GAPS_OK)) {
+		gap_start = FIND_GAP;
+	} else {
+		gap_start = GAPS_OK;
 	}
 
+	interruptible = (flags & VM_MAP_REMOVE_INTERRUPTIBLE) ?
+	    THREAD_ABORTSAFE : THREAD_UNINT;
+
 	/*
-	 *	Adjust the addresses in the copy chain, and
-	 *	reset the region attributes.
+	 * All our DMA I/O operations in IOKit are currently done by
+	 * wiring through the map entries of the task requesting the I/O.
+	 * Because of this, we must always wait for kernel wirings
+	 * to go away on the entries before deleting them.
+	 *
+	 * Any caller who wants to actually remove a kernel wiring
+	 * should explicitly set the VM_MAP_REMOVE_KUNWIRE flag to
+	 * properly remove one wiring instead of blasting through
+	 * them all.
 	 */
+	flags |= VM_MAP_REMOVE_WAIT_FOR_KWIRE;
 
-	adjustment = start - vm_copy_start;
-	for (entry = vm_map_copy_first_entry(copy);
-	     entry != vm_map_copy_to_entry(copy);
-	     entry = entry->vme_next) {
-		entry->vme_start += adjustment;
-		entry->vme_end += adjustment;
-
-		entry->inheritance = VM_INHERIT_DEFAULT;
-		entry->protection = VM_PROT_DEFAULT;
-		entry->max_protection = VM_PROT_ALL;
-		entry->behavior = VM_BEHAVIOR_DEFAULT;
-
+	while (1) {
 		/*
-		 * If the entry is now wired,
-		 * map the pages into the destination map.
+		 *	Find the start of the region, and clip it
 		 */
-		if (entry->wired_count != 0) {
-		    register vm_offset_t va;
-		    vm_object_offset_t	 offset;
-		    register vm_object_t object;
-
-		    object = entry->object.vm_object;
-		    offset = entry->offset;
-		    va = entry->vme_start;
-
-		    pmap_pageable(dst_map->pmap,
-				  entry->vme_start,
-				  entry->vme_end,
-				  TRUE);
-
-		    while (va < entry->vme_end) {
-			register vm_page_t	m;
-
-			/*
-			 * Look up the page in the object.
-			 * Assert that the page will be found in the
-			 * top object:
-			 * either
-			 *	the object was newly created by
-			 *	vm_object_copy_slowly, and has
-			 *	copies of all of the pages from
-			 *	the source object
-			 * or
-			 *	the object was moved from the old
-			 *	map entry; because the old map
-			 *	entry was wired, all of the pages
-			 *	were in the top-level object.
-			 *	(XXX not true if we wire pages for
-			 *	 reading)
-			 */
-			vm_object_lock(object);
-			vm_object_paging_begin(object);
-
-			m = vm_page_lookup(object, offset);
-			if (m == VM_PAGE_NULL || m->wire_count == 0 ||
-			    m->absent)
-			    panic("vm_map_copyout: wiring 0x%x", m);
-
-			m->busy = TRUE;
-			vm_object_unlock(object);
-
-			PMAP_ENTER(dst_map->pmap, va, m,
-				   entry->protection, TRUE);
-
-			vm_object_lock(object);
-			PAGE_WAKEUP_DONE(m);
-			/* the page is wired, so we don't have to activate */
-			vm_object_paging_end(object);
-			vm_object_unlock(object);
-
-			offset += PAGE_SIZE_64;
-			va += PAGE_SIZE;
-		    }
-		}
-		else if (size <= vm_map_aggressive_enter_max) {
-
-			register vm_offset_t	va;
-			vm_object_offset_t	offset;
-			register vm_object_t	object;
-			vm_prot_t		prot;
+		if (vm_map_lookup_entry(map, start, &first_entry)) {
+			entry = first_entry;
+			if (map == kalloc_map &&
+			    (entry->vme_start != start ||
+			    entry->vme_end != end)) {
+				panic("vm_map_delete(%p,0x%llx,0x%llx): "
+				    "mismatched entry %p [0x%llx:0x%llx]\n",
+				    map,
+				    (uint64_t)start,
+				    (uint64_t)end,
+				    entry,
+				    (uint64_t)entry->vme_start,
+				    (uint64_t)entry->vme_end);
+			}
 
-			object = entry->object.vm_object;
-			if (object != VM_OBJECT_NULL) {
+			/*
+			 * If in a superpage, extend the range to include the start of the mapping.
+			 */
+			if (entry->superpage_size && (start & ~SUPERPAGE_MASK)) {
+				start = SUPERPAGE_ROUND_DOWN(start);
+				continue;
+			}
 
-				offset = entry->offset;
-				va = entry->vme_start;
-				while (va < entry->vme_end) {
-					register vm_page_t	m;
-				    
+			if (start == entry->vme_start) {
+				/*
+				 * No need to clip.  We don't want to cause
+				 * any unnecessary unnesting in this case...
+				 */
+			} else {
+				if ((flags & VM_MAP_REMOVE_NO_MAP_ALIGN) &&
+				    entry->map_aligned &&
+				    !VM_MAP_PAGE_ALIGNED(
+					    start,
+					    VM_MAP_PAGE_MASK(map))) {
 					/*
-					 * Look up the page in the object.
-					 * Assert that the page will be found
-					 * in the top object if at all...
+					 * The entry will no longer be
+					 * map-aligned after clipping
+					 * and the caller said it's OK.
 					 */
-					vm_object_lock(object);
-					vm_object_paging_begin(object);
-
-					if (((m = vm_page_lookup(object,
-								 offset))
-					     != VM_PAGE_NULL) &&
-					    !m->busy && !m->fictitious &&
-					    !m->absent && !m->error) {
-						m->busy = TRUE;
-						vm_object_unlock(object);
-
-						/* honor cow obligations */
-						prot = entry->protection;
-						if (entry->needs_copy)
-							prot &= ~VM_PROT_WRITE;
-
-						PMAP_ENTER(dst_map->pmap, va, 
-							   m, prot, FALSE);
-
-						vm_object_lock(object);
-						vm_page_lock_queues();
-						if (!m->active && !m->inactive)
-							vm_page_activate(m);
-						vm_page_unlock_queues();
-						PAGE_WAKEUP_DONE(m);
-					}
-					vm_object_paging_end(object);
-					vm_object_unlock(object);
-
-					offset += PAGE_SIZE_64;
-					va += PAGE_SIZE;
+					entry->map_aligned = FALSE;
 				}
+				if (map == kalloc_map) {
+					panic("vm_map_delete(%p,0x%llx,0x%llx):"
+					    " clipping %p at 0x%llx\n",
+					    map,
+					    (uint64_t)start,
+					    (uint64_t)end,
+					    entry,
+					    (uint64_t)start);
+				}
+				vm_map_clip_start(map, entry, start);
+			}
+
+			/*
+			 *	Fix the lookup hint now, rather than each
+			 *	time through the loop.
+			 */
+			SAVE_HINT_MAP_WRITE(map, entry->vme_prev);
+		} else {
+			if (map->pmap == kernel_pmap &&
+			    os_ref_get_count(&map->map_refcnt) != 0) {
+				panic("vm_map_delete(%p,0x%llx,0x%llx): "
+				    "no map entry at 0x%llx\n",
+				    map,
+				    (uint64_t)start,
+				    (uint64_t)end,
+				    (uint64_t)start);
+			}
+			entry = first_entry->vme_next;
+			if (gap_start == FIND_GAP) {
+				gap_start = start;
 			}
 		}
+		break;
+	}
+	if (entry->superpage_size) {
+		end = SUPERPAGE_ROUND_UP(end);
 	}
 
+	need_wakeup = FALSE;
 	/*
-	 *	Correct the page alignment for the result
+	 *	Step through all entries in this region
 	 */
+	s = entry->vme_start;
+	while ((entry != vm_map_to_entry(map)) && (s < end)) {
+		/*
+		 * At this point, we have deleted all the memory entries
+		 * between "start" and "s".  We still need to delete
+		 * all memory entries between "s" and "end".
+		 * While we were blocked and the map was unlocked, some
+		 * new memory entries could have been re-allocated between
+		 * "start" and "s" and we don't want to mess with those.
+		 * Some of those entries could even have been re-assembled
+		 * with an entry after "s" (in vm_map_simplify_entry()), so
+		 * we may have to vm_map_clip_start() again.
+		 */
 
-	*dst_addr = start + (copy->offset - vm_copy_start);
+		if (entry->vme_start >= s) {
+			/*
+			 * This entry starts on or after "s"
+			 * so no need to clip its start.
+			 */
+		} else {
+			/*
+			 * This entry has been re-assembled by a
+			 * vm_map_simplify_entry().  We need to
+			 * re-clip its start.
+			 */
+			if ((flags & VM_MAP_REMOVE_NO_MAP_ALIGN) &&
+			    entry->map_aligned &&
+			    !VM_MAP_PAGE_ALIGNED(s,
+			    VM_MAP_PAGE_MASK(map))) {
+				/*
+				 * The entry will no longer be map-aligned
+				 * after clipping and the caller said it's OK.
+				 */
+				entry->map_aligned = FALSE;
+			}
+			if (map == kalloc_map) {
+				panic("vm_map_delete(%p,0x%llx,0x%llx): "
+				    "clipping %p at 0x%llx\n",
+				    map,
+				    (uint64_t)start,
+				    (uint64_t)end,
+				    entry,
+				    (uint64_t)s);
+			}
+			vm_map_clip_start(map, entry, s);
+		}
+		if (entry->vme_end <= end) {
+			/*
+			 * This entry is going away completely, so no need
+			 * to clip and possibly cause an unnecessary unnesting.
+			 */
+		} else {
+			if ((flags & VM_MAP_REMOVE_NO_MAP_ALIGN) &&
+			    entry->map_aligned &&
+			    !VM_MAP_PAGE_ALIGNED(end,
+			    VM_MAP_PAGE_MASK(map))) {
+				/*
+				 * The entry will no longer be map-aligned
+				 * after clipping and the caller said it's OK.
+				 */
+				entry->map_aligned = FALSE;
+			}
+			if (map == kalloc_map) {
+				panic("vm_map_delete(%p,0x%llx,0x%llx): "
+				    "clipping %p at 0x%llx\n",
+				    map,
+				    (uint64_t)start,
+				    (uint64_t)end,
+				    entry,
+				    (uint64_t)end);
+			}
+			vm_map_clip_end(map, entry, end);
+		}
 
-	/*
-	 *	Update the hints and the map size
-	 */
+		if (entry->permanent) {
+			if (map->pmap == kernel_pmap) {
+				panic("%s(%p,0x%llx,0x%llx): "
+				    "attempt to remove permanent "
+				    "VM map entry "
+				    "%p [0x%llx:0x%llx]\n",
+				    __FUNCTION__,
+				    map,
+				    (uint64_t) start,
+				    (uint64_t) end,
+				    entry,
+				    (uint64_t) entry->vme_start,
+				    (uint64_t) entry->vme_end);
+			} else if (flags & VM_MAP_REMOVE_IMMUTABLE) {
+//				printf("FBDP %d[%s] removing permanent entry %p [0x%llx:0x%llx] prot 0x%x/0x%x\n", proc_selfpid(), (current_task()->bsd_info ? proc_name_address(current_task()->bsd_info) : "?"), entry, (uint64_t)entry->vme_start, (uint64_t)entry->vme_end, entry->protection, entry->max_protection);
+				entry->permanent = FALSE;
+#if PMAP_CS
+			} else if ((entry->protection & VM_PROT_EXECUTE) && !pmap_cs_enforced(map->pmap)) {
+				entry->permanent = FALSE;
+
+				printf("%d[%s] %s(0x%llx,0x%llx): "
+				    "pmap_cs disabled, allowing for permanent executable entry [0x%llx:0x%llx] "
+				    "prot 0x%x/0x%x\n",
+				    proc_selfpid(),
+				    (current_task()->bsd_info
+				    ? proc_name_address(current_task()->bsd_info)
+				    : "?"),
+				    __FUNCTION__,
+				    (uint64_t) start,
+				    (uint64_t) end,
+				    (uint64_t)entry->vme_start,
+				    (uint64_t)entry->vme_end,
+				    entry->protection,
+				    entry->max_protection);
+#endif
+			} else {
+				if (vm_map_executable_immutable_verbose) {
+					printf("%d[%s] %s(0x%llx,0x%llx): "
+					    "permanent entry [0x%llx:0x%llx] "
+					    "prot 0x%x/0x%x\n",
+					    proc_selfpid(),
+					    (current_task()->bsd_info
+					    ? proc_name_address(current_task()->bsd_info)
+					    : "?"),
+					    __FUNCTION__,
+					    (uint64_t) start,
+					    (uint64_t) end,
+					    (uint64_t)entry->vme_start,
+					    (uint64_t)entry->vme_end,
+					    entry->protection,
+					    entry->max_protection);
+				}
+				/*
+				 * dtrace -n 'vm_map_delete_permanent { print("start=0x%llx end=0x%llx prot=0x%x/0x%x\n", arg0, arg1, arg2, arg3); stack(); ustack(); }'
+				 */
+				DTRACE_VM5(vm_map_delete_permanent,
+				    vm_map_offset_t, entry->vme_start,
+				    vm_map_offset_t, entry->vme_end,
+				    vm_prot_t, entry->protection,
+				    vm_prot_t, entry->max_protection,
+				    int, VME_ALIAS(entry));
+			}
+		}
 
-	SAVE_HINT(dst_map, vm_map_copy_last_entry(copy));
 
-	dst_map->size += size;
+		if (entry->in_transition) {
+			wait_result_t wait_result;
 
-	/*
-	 *	Link in the copy
-	 */
-
-	vm_map_copy_insert(dst_map, last, copy);
-
-	vm_map_unlock(dst_map);
-
-	/*
-	 * XXX	If wiring_required, call vm_map_pageable
-	 */
-
-	return(KERN_SUCCESS);
-}
-
-boolean_t       vm_map_aggressive_enter;        /* not used yet */
-
-
-/*
- *	Routine:	vm_map_copyin
- *
- *	Description:
- *		Copy the specified region (src_addr, len) from the
- *		source address space (src_map), possibly removing
- *		the region from the source address space (src_destroy).
- *
- *	Returns:
- *		A vm_map_copy_t object (copy_result), suitable for
- *		insertion into another address space (using vm_map_copyout),
- *		copying over another address space region (using
- *		vm_map_copy_overwrite).  If the copy is unused, it
- *		should be destroyed (using vm_map_copy_discard).
- *
- *	In/out conditions:
- *		The source map should not be locked on entry.
- */
+			/*
+			 * Another thread is wiring/unwiring this entry.
+			 * Let the other thread know we are waiting.
+			 */
+			assert(s == entry->vme_start);
+			entry->needs_wakeup = TRUE;
 
-typedef struct submap_map {
-	vm_map_t	parent_map;
-	vm_offset_t	base_start;
-	vm_offset_t	base_end;
-	struct submap_map *next;
-} submap_map_t;
+			/*
+			 * wake up anybody waiting on entries that we have
+			 * already unwired/deleted.
+			 */
+			if (need_wakeup) {
+				vm_map_entry_wakeup(map);
+				need_wakeup = FALSE;
+			}
 
-kern_return_t
-vm_map_copyin_common(
-	vm_map_t	src_map,
-	vm_offset_t	src_addr,
-	vm_size_t	len,
-	boolean_t	src_destroy,
-	boolean_t	src_volatile,
-	vm_map_copy_t	*copy_result,	/* OUT */
-	boolean_t	use_maxprot)
-{
-	extern int	msg_ool_size_small;
-
-	vm_map_entry_t	tmp_entry;	/* Result of last map lookup --
-					 * in multi-level lookup, this
-					 * entry contains the actual
-					 * vm_object/offset.
-					 */
-	register
-	vm_map_entry_t	new_entry = VM_MAP_ENTRY_NULL;	/* Map entry for copy */
+			wait_result = vm_map_entry_wait(map, interruptible);
 
-	vm_offset_t	src_start;	/* Start of current entry --
-					 * where copy is taking place now
-					 */
-	vm_offset_t	src_end;	/* End of entire region to be
-					 * copied */
- 	vm_offset_t	base_start;	/* submap fields to save offsets */
-					/* in original map */
-	vm_offset_t	base_end;
-	vm_map_t	base_map=src_map;
-	vm_map_entry_t	base_entry;
-	boolean_t	map_share=FALSE;
-	submap_map_t	*parent_maps = NULL;
+			if (interruptible &&
+			    wait_result == THREAD_INTERRUPTED) {
+				/*
+				 * We do not clear the needs_wakeup flag,
+				 * since we cannot tell if we were the only one.
+				 */
+				return KERN_ABORTED;
+			}
 
-	register
-	vm_map_copy_t	copy;		/* Resulting copy */
-	vm_offset_t	copy_addr;
+			/*
+			 * The entry could have been clipped or it
+			 * may not exist anymore.  Look it up again.
+			 */
+			if (!vm_map_lookup_entry(map, s, &first_entry)) {
+				/*
+				 * User: use the next entry
+				 */
+				if (gap_start == FIND_GAP) {
+					gap_start = s;
+				}
+				entry = first_entry->vme_next;
+				s = entry->vme_start;
+			} else {
+				entry = first_entry;
+				SAVE_HINT_MAP_WRITE(map, entry->vme_prev);
+			}
+			last_timestamp = map->timestamp;
+			continue;
+		} /* end in_transition */
 
-	/*
-	 *	Check for copies of zero bytes.
-	 */
+		if (entry->wired_count) {
+			boolean_t       user_wire;
 
-	if (len == 0) {
-		*copy_result = VM_MAP_COPY_NULL;
-		return(KERN_SUCCESS);
-	}
+			user_wire = entry->user_wired_count > 0;
 
-	/*
-	 * If the copy is sufficiently small, use a kernel buffer instead
-	 * of making a virtual copy.  The theory being that the cost of
-	 * setting up VM (and taking C-O-W faults) dominates the copy costs
-	 * for small regions.
-	 */
-	if ((len < msg_ool_size_small) && !use_maxprot)
-	  return vm_map_copyin_kernel_buffer(src_map, src_addr, len,
-					     src_destroy, copy_result);
+			/*
+			 *      Remove a kernel wiring if requested
+			 */
+			if (flags & VM_MAP_REMOVE_KUNWIRE) {
+				entry->wired_count--;
+			}
 
-	/*
-	 *	Compute start and end of region
-	 */
+			/*
+			 *	Remove all user wirings for proper accounting
+			 */
+			if (entry->user_wired_count > 0) {
+				while (entry->user_wired_count) {
+					subtract_wire_counts(map, entry, user_wire);
+				}
+			}
 
-	src_start = trunc_page(src_addr);
-	src_end = round_page(src_addr + len);
+			if (entry->wired_count != 0) {
+				assert(map != kernel_map);
+				/*
+				 * Cannot continue.  Typical case is when
+				 * a user thread has physical I/O pending
+				 * on this page.  Either wait for the
+				 * kernel wiring to go away or return an
+				 * error.
+				 */
+				if (flags & VM_MAP_REMOVE_WAIT_FOR_KWIRE) {
+					wait_result_t wait_result;
 
-	XPR(XPR_VM_MAP, "vm_map_copyin_common map 0x%x addr 0x%x len 0x%x dest %d\n", (natural_t)src_map, src_addr, len, src_destroy, 0);
+					assert(s == entry->vme_start);
+					entry->needs_wakeup = TRUE;
+					wait_result = vm_map_entry_wait(map,
+					    interruptible);
 
-	/*
-	 *	Check that the end address doesn't overflow
-	 */
+					if (interruptible &&
+					    wait_result == THREAD_INTERRUPTED) {
+						/*
+						 * We do not clear the
+						 * needs_wakeup flag, since we
+						 * cannot tell if we were the
+						 * only one.
+						 */
+						return KERN_ABORTED;
+					}
 
-	if (src_end <= src_start)
-		if ((src_end < src_start) || (src_start != 0))
-			return(KERN_INVALID_ADDRESS);
+					/*
+					 * The entry could have been clipped or
+					 * it may not exist anymore.  Look it
+					 * up again.
+					 */
+					if (!vm_map_lookup_entry(map, s,
+					    &first_entry)) {
+						assert(map != kernel_map);
+						/*
+						 * User: use the next entry
+						 */
+						if (gap_start == FIND_GAP) {
+							gap_start = s;
+						}
+						entry = first_entry->vme_next;
+						s = entry->vme_start;
+					} else {
+						entry = first_entry;
+						SAVE_HINT_MAP_WRITE(map, entry->vme_prev);
+					}
+					last_timestamp = map->timestamp;
+					continue;
+				} else {
+					return KERN_FAILURE;
+				}
+			}
 
-	/*
-	 *	Allocate a header element for the list.
-	 *
-	 *	Use the start and end in the header to 
-	 *	remember the endpoints prior to rounding.
-	 */
+			entry->in_transition = TRUE;
+			/*
+			 * copy current entry.  see comment in vm_map_wire()
+			 */
+			tmp_entry = *entry;
+			assert(s == entry->vme_start);
 
-	copy = (vm_map_copy_t) zalloc(vm_map_copy_zone);
-	vm_map_copy_first_entry(copy) =
-	 vm_map_copy_last_entry(copy) = vm_map_copy_to_entry(copy);
-	copy->type = VM_MAP_COPY_ENTRY_LIST;
-	copy->cpy_hdr.nentries = 0;
-	copy->cpy_hdr.entries_pageable = TRUE;
+			/*
+			 * We can unlock the map now. The in_transition
+			 * state guarantees existence of the entry.
+			 */
+			vm_map_unlock(map);
 
-	copy->offset = src_addr;
-	copy->size = len;
-	
-	new_entry = vm_map_copy_entry_create(copy);
-
-#define	RETURN(x)						\
-	MACRO_BEGIN						\
-	vm_map_unlock(src_map);					\
-	if (new_entry != VM_MAP_ENTRY_NULL)			\
-		vm_map_copy_entry_dispose(copy,new_entry);	\
-	vm_map_copy_discard(copy);				\
-	{							\
-		submap_map_t	*ptr;				\
-								\
-		for(ptr = parent_maps; ptr != NULL; ptr = parent_maps) { \
-			parent_maps=parent_maps->next;		\
-			kfree((vm_offset_t)ptr, sizeof(submap_map_t));	\
-		}						\
-	}							\
-	MACRO_RETURN(x);					\
-	MACRO_END
+			if (tmp_entry.is_sub_map) {
+				vm_map_t sub_map;
+				vm_map_offset_t sub_start, sub_end;
+				pmap_t pmap;
+				vm_map_offset_t pmap_addr;
 
-	/*
-	 *	Find the beginning of the region.
-	 */
 
- 	vm_map_lock(src_map);
+				sub_map = VME_SUBMAP(&tmp_entry);
+				sub_start = VME_OFFSET(&tmp_entry);
+				sub_end = sub_start + (tmp_entry.vme_end -
+				    tmp_entry.vme_start);
+				if (tmp_entry.use_pmap) {
+					pmap = sub_map->pmap;
+					pmap_addr = tmp_entry.vme_start;
+				} else {
+					pmap = map->pmap;
+					pmap_addr = tmp_entry.vme_start;
+				}
+				(void) vm_map_unwire_nested(sub_map,
+				    sub_start, sub_end,
+				    user_wire,
+				    pmap, pmap_addr);
+			} else {
+				if (VME_OBJECT(&tmp_entry) == kernel_object) {
+					pmap_protect_options(
+						map->pmap,
+						tmp_entry.vme_start,
+						tmp_entry.vme_end,
+						VM_PROT_NONE,
+						PMAP_OPTIONS_REMOVE,
+						NULL);
+				}
+				vm_fault_unwire(map, &tmp_entry,
+				    VME_OBJECT(&tmp_entry) == kernel_object,
+				    map->pmap, tmp_entry.vme_start);
+			}
 
-	if (!vm_map_lookup_entry(src_map, src_start, &tmp_entry))
-		RETURN(KERN_INVALID_ADDRESS);
-	if(!tmp_entry->is_sub_map) {
-		vm_map_clip_start(src_map, tmp_entry, src_start);
-	}
-	/* set for later submap fix-up */
-	copy_addr = src_start;
+			vm_map_lock(map);
 
-	/*
-	 *	Go through entries until we get to the end.
-	 */
+			if (last_timestamp + 1 != map->timestamp) {
+				/*
+				 * Find the entry again.  It could have
+				 * been clipped after we unlocked the map.
+				 */
+				if (!vm_map_lookup_entry(map, s, &first_entry)) {
+					assert((map != kernel_map) &&
+					    (!entry->is_sub_map));
+					if (gap_start == FIND_GAP) {
+						gap_start = s;
+					}
+					first_entry = first_entry->vme_next;
+					s = first_entry->vme_start;
+				} else {
+					SAVE_HINT_MAP_WRITE(map, entry->vme_prev);
+				}
+			} else {
+				SAVE_HINT_MAP_WRITE(map, entry->vme_prev);
+				first_entry = entry;
+			}
 
-	while (TRUE) {
-		register
-		vm_map_entry_t	src_entry = tmp_entry;	/* Top-level entry */
-		vm_size_t	src_size;		/* Size of source
-							 * map entry (in both
-							 * maps)
-							 */
+			last_timestamp = map->timestamp;
 
-		register
-		vm_object_t		src_object;	/* Object to copy */
-		vm_object_offset_t	src_offset;
+			entry = first_entry;
+			while ((entry != vm_map_to_entry(map)) &&
+			    (entry->vme_start < tmp_entry.vme_end)) {
+				assert(entry->in_transition);
+				entry->in_transition = FALSE;
+				if (entry->needs_wakeup) {
+					entry->needs_wakeup = FALSE;
+					need_wakeup = TRUE;
+				}
+				entry = entry->vme_next;
+			}
+			/*
+			 * We have unwired the entry(s).  Go back and
+			 * delete them.
+			 */
+			entry = first_entry;
+			continue;
+		}
 
-		boolean_t	src_needs_copy;		/* Should source map
-							 * be made read-only
-							 * for copy-on-write?
-							 */
+		/* entry is unwired */
+		assert(entry->wired_count == 0);
+		assert(entry->user_wired_count == 0);
 
-		boolean_t	new_entry_needs_copy;	/* Will new entry be COW? */
+		assert(s == entry->vme_start);
 
-		boolean_t	was_wired;		/* Was source wired? */
-		vm_map_version_t version;		/* Version before locks
-							 * dropped to make copy
-							 */
-		kern_return_t	result;			/* Return value from
-							 * copy_strategically.
-							 */
-		while(tmp_entry->is_sub_map) {
-			vm_size_t submap_len;
-			submap_map_t *ptr;
+		if (flags & VM_MAP_REMOVE_NO_PMAP_CLEANUP) {
+			/*
+			 * XXX with the VM_MAP_REMOVE_SAVE_ENTRIES flag to
+			 * vm_map_delete(), some map entries might have been
+			 * transferred to a "zap_map", which doesn't have a
+			 * pmap.  The original pmap has already been flushed
+			 * in the vm_map_delete() call targeting the original
+			 * map, but when we get to destroying the "zap_map",
+			 * we don't have any pmap to flush, so let's just skip
+			 * all this.
+			 */
+		} else if (entry->is_sub_map) {
+			if (entry->use_pmap) {
+#ifndef NO_NESTED_PMAP
+				int pmap_flags;
 
-			ptr = (submap_map_t *)kalloc(sizeof(submap_map_t));
-			ptr->next = parent_maps;
-			parent_maps = ptr;
-			ptr->parent_map = src_map;
-			ptr->base_start = src_start;
-			ptr->base_end = src_end;
-			submap_len = tmp_entry->vme_end - src_start;
-			if(submap_len > (src_end-src_start))
-				submap_len = src_end-src_start;
-			ptr->base_start += submap_len;
-	
-			src_start -= tmp_entry->vme_start;
-			src_start += tmp_entry->offset;
-			src_end = src_start + submap_len;
-			src_map = tmp_entry->object.sub_map;
-			vm_map_lock(src_map);
-			vm_map_unlock(ptr->parent_map);
-			if (!vm_map_lookup_entry(
-					src_map, src_start, &tmp_entry))
-				RETURN(KERN_INVALID_ADDRESS);
-			map_share = TRUE;
-			if(!tmp_entry->is_sub_map)
-			   vm_map_clip_start(src_map, tmp_entry, src_start);
-			src_entry = tmp_entry;
+				if (flags & VM_MAP_REMOVE_NO_UNNESTING) {
+					/*
+					 * This is the final cleanup of the
+					 * address space being terminated.
+					 * No new mappings are expected and
+					 * we don't really need to unnest the
+					 * shared region (and lose the "global"
+					 * pmap mappings, if applicable).
+					 *
+					 * Tell the pmap layer that we're
+					 * "clean" wrt nesting.
+					 */
+					pmap_flags = PMAP_UNNEST_CLEAN;
+				} else {
+					/*
+					 * We're unmapping part of the nested
+					 * shared region, so we can't keep the
+					 * nested pmap.
+					 */
+					pmap_flags = 0;
+				}
+				pmap_unnest_options(
+					map->pmap,
+					(addr64_t)entry->vme_start,
+					entry->vme_end - entry->vme_start,
+					pmap_flags);
+#endif  /* NO_NESTED_PMAP */
+				if (map->mapped_in_other_pmaps &&
+				    os_ref_get_count(&map->map_refcnt) != 0) {
+					/* clean up parent map/maps */
+					vm_map_submap_pmap_clean(
+						map, entry->vme_start,
+						entry->vme_end,
+						VME_SUBMAP(entry),
+						VME_OFFSET(entry));
+				}
+			} else {
+				vm_map_submap_pmap_clean(
+					map, entry->vme_start, entry->vme_end,
+					VME_SUBMAP(entry),
+					VME_OFFSET(entry));
+			}
+		} else if (VME_OBJECT(entry) != kernel_object &&
+		    VME_OBJECT(entry) != compressor_object) {
+			object = VME_OBJECT(entry);
+			if (map->mapped_in_other_pmaps &&
+			    os_ref_get_count(&map->map_refcnt) != 0) {
+				vm_object_pmap_protect_options(
+					object, VME_OFFSET(entry),
+					entry->vme_end - entry->vme_start,
+					PMAP_NULL,
+					entry->vme_start,
+					VM_PROT_NONE,
+					PMAP_OPTIONS_REMOVE);
+			} else if ((VME_OBJECT(entry) != VM_OBJECT_NULL) ||
+			    (map->pmap == kernel_pmap)) {
+				/* Remove translations associated
+				 * with this range if the entry has
+				 * an object, or if this is the
+				 * kernel map or a descendant, since
+				 * the platform could potentially
+				 * create "backdoor" mappings invisible
+				 * to the VM. It is expected that
+				 * objectless, non-kernel ranges
+				 * do not have such VM-invisible
+				 * translations.
+				 */
+				pmap_remove_options(map->pmap,
+				    (addr64_t)entry->vme_start,
+				    (addr64_t)entry->vme_end,
+				    PMAP_OPTIONS_REMOVE);
+			}
 		}
-		if ((tmp_entry->object.vm_object != VM_OBJECT_NULL) && 
-		    (tmp_entry->object.vm_object->phys_contiguous)) {
-			/* This is not, cannot be supported for now */
-			/* we need a description of the caching mode */
-			/* reflected in the object before we can     */
-			/* support copyin, and then the support will */
-			/* be for direct copy */
-			RETURN(KERN_PROTECTION_FAILURE);
+
+		if (entry->iokit_acct) {
+			/* alternate accounting */
+			DTRACE_VM4(vm_map_iokit_unmapped_region,
+			    vm_map_t, map,
+			    vm_map_offset_t, entry->vme_start,
+			    vm_map_offset_t, entry->vme_end,
+			    int, VME_ALIAS(entry));
+			vm_map_iokit_unmapped_region(map,
+			    (entry->vme_end -
+			    entry->vme_start));
+			entry->iokit_acct = FALSE;
+			entry->use_pmap = FALSE;
 		}
+
 		/*
-		 *	Create a new address map entry to hold the result. 
-		 *	Fill in the fields from the appropriate source entries.
-		 *	We must unlock the source map to do this if we need
-		 *	to allocate a map entry.
+		 * All pmap mappings for this map entry must have been
+		 * cleared by now.
 		 */
-		if (new_entry == VM_MAP_ENTRY_NULL) {
-		    version.main_timestamp = src_map->timestamp;
-		    vm_map_unlock(src_map);
+#if DEBUG
+		assert(vm_map_pmap_is_empty(map,
+		    entry->vme_start,
+		    entry->vme_end));
+#endif /* DEBUG */
 
-		    new_entry = vm_map_copy_entry_create(copy);
+		next = entry->vme_next;
 
-		    vm_map_lock(src_map);
-		    if ((version.main_timestamp + 1) != src_map->timestamp) {
-			if (!vm_map_lookup_entry(src_map, src_start,
-					&tmp_entry)) {
-				RETURN(KERN_INVALID_ADDRESS);
-			}
-			vm_map_clip_start(src_map, tmp_entry, src_start);
-			continue; /* restart w/ new tmp_entry */
-		    }
+		if (map->pmap == kernel_pmap &&
+		    os_ref_get_count(&map->map_refcnt) != 0 &&
+		    entry->vme_end < end &&
+		    (next == vm_map_to_entry(map) ||
+		    next->vme_start != entry->vme_end)) {
+			panic("vm_map_delete(%p,0x%llx,0x%llx): "
+			    "hole after %p at 0x%llx\n",
+			    map,
+			    (uint64_t)start,
+			    (uint64_t)end,
+			    entry,
+			    (uint64_t)entry->vme_end);
 		}
 
 		/*
-		 *	Verify that the region can be read.
+		 * If the desired range didn't end with "entry", then there is a gap if
+		 * we wrapped around to the start of the map or if "entry" and "next"
+		 * aren't contiguous.
+		 *
+		 * The vm_map_round_page() is needed since an entry can be less than VM_MAP_PAGE_MASK() sized.
+		 * For example, devices which have h/w 4K pages, but entry sizes are all now 16K.
 		 */
-		if (((src_entry->protection & VM_PROT_READ) == VM_PROT_NONE &&
-			!use_maxprot) ||
-		    (src_entry->max_protection & VM_PROT_READ) == 0)
-			RETURN(KERN_PROTECTION_FAILURE);
+		if (gap_start == FIND_GAP &&
+		    vm_map_round_page(entry->vme_end, VM_MAP_PAGE_MASK(map)) < end &&
+		    (next == vm_map_to_entry(map) || entry->vme_end != next->vme_start)) {
+			gap_start = entry->vme_end;
+		}
+		s = next->vme_start;
+		last_timestamp = map->timestamp;
 
-		/*
-		 *	Clip against the endpoints of the entire region.
-		 */
-
-		vm_map_clip_end(src_map, src_entry, src_end);
-
-		src_size = src_entry->vme_end - src_start;
-		src_object = src_entry->object.vm_object;
-		src_offset = src_entry->offset;
-		was_wired = (src_entry->wired_count != 0);
-
-		vm_map_entry_copy(new_entry, src_entry);
-		new_entry->use_pmap = FALSE; /* clr address space specifics */
-
-		/*
-		 *	Attempt non-blocking copy-on-write optimizations.
-		 */
-
-		if (src_destroy && 
-		    (src_object == VM_OBJECT_NULL || 
-		    (src_object->internal && !src_object->true_share
-		    && !map_share))) {
-		    /*
-		     * If we are destroying the source, and the object
-		     * is internal, we can move the object reference
-		     * from the source to the copy.  The copy is
-		     * copy-on-write only if the source is.
-		     * We make another reference to the object, because
-		     * destroying the source entry will deallocate it.
-		     */
-		    vm_object_reference(src_object);
-
-		    /*
-		     * Copy is always unwired.  vm_map_copy_entry
-		     * set its wired count to zero.
-		     */
-
-		    goto CopySuccessful;
+		if (entry->permanent) {
+			/*
+			 * A permanent entry can not be removed, so leave it
+			 * in place but remove all access permissions.
+			 */
+			entry->protection = VM_PROT_NONE;
+			entry->max_protection = VM_PROT_NONE;
+		} else if ((flags & VM_MAP_REMOVE_SAVE_ENTRIES) &&
+		    zap_map != VM_MAP_NULL) {
+			vm_map_size_t entry_size;
+			/*
+			 * The caller wants to save the affected VM map entries
+			 * into the "zap_map".  The caller will take care of
+			 * these entries.
+			 */
+			/* unlink the entry from "map" ... */
+			vm_map_store_entry_unlink(map, entry);
+			/* ... and add it to the end of the "zap_map" */
+			vm_map_store_entry_link(zap_map,
+			    vm_map_last_entry(zap_map),
+			    entry,
+			    VM_MAP_KERNEL_FLAGS_NONE);
+			entry_size = entry->vme_end - entry->vme_start;
+			map->size -= entry_size;
+			zap_map->size += entry_size;
+			/* we didn't unlock the map, so no timestamp increase */
+			last_timestamp--;
+		} else {
+			vm_map_entry_delete(map, entry);
+			/* vm_map_entry_delete unlocks the map */
+			vm_map_lock(map);
 		}
 
+		entry = next;
 
-RestartCopy:
-		XPR(XPR_VM_MAP, "vm_map_copyin_common src_obj 0x%x ent 0x%x obj 0x%x was_wired %d\n",
-		    src_object, new_entry, new_entry->object.vm_object,
-		    was_wired, 0);
-		if (!was_wired &&
-		    vm_object_copy_quickly(
-				&new_entry->object.vm_object,
-				src_offset,
-				src_size,
-				&src_needs_copy,
-				&new_entry_needs_copy)) {
-
-			new_entry->needs_copy = new_entry_needs_copy;
-
+		if (entry == vm_map_to_entry(map)) {
+			break;
+		}
+		if (last_timestamp + 1 != map->timestamp) {
 			/*
-			 *	Handle copy-on-write obligations
+			 * We are responsible for deleting everything
+			 * from the given space. If someone has interfered,
+			 * we pick up where we left off. Back fills should
+			 * be all right for anyone, except map_delete, and
+			 * we have to assume that the task has been fully
+			 * disabled before we get here
 			 */
+			if (!vm_map_lookup_entry(map, s, &entry)) {
+				entry = entry->vme_next;
 
-			if (src_needs_copy && !tmp_entry->needs_copy) {
-				if (tmp_entry->is_shared  || 
-				     tmp_entry->object.vm_object->true_share ||
-				     map_share) {
-					vm_map_unlock(src_map);
-					new_entry->object.vm_object = 
-						vm_object_copy_delayed(
-							src_object,
-							src_offset,	
-							src_size);
-					/* dec ref gained in copy_quickly */
-					vm_object_lock(src_object);
-					src_object->ref_count--;
-					assert(src_object->ref_count > 0);
-					vm_object_res_deallocate(src_object);
-					vm_object_unlock(src_object);
-		    			vm_map_lock(src_map);
-					/* 
-					 * it turns out that we have
-					 * finished our copy. No matter
-					 * what the state of the map
-					 * we will lock it again here
-					 * knowing that if there is
-					 * additional data to copy
-					 * it will be checked at
-					 * the top of the loop
-					 *
-					 * Don't do timestamp check
-					 */
-					
-				} else {
-					vm_object_pmap_protect(
-						src_object,
-						src_offset,
-						src_size,
-			      			(src_entry->is_shared ? 
-							PMAP_NULL
-							: src_map->pmap),
-						src_entry->vme_start,
-						src_entry->protection &
-							~VM_PROT_WRITE);
-
-					tmp_entry->needs_copy = TRUE;
+				/*
+				 * Nothing found for s. If we weren't already done, then there is a gap.
+				 */
+				if (gap_start == FIND_GAP && s < end) {
+					gap_start = s;
 				}
+				s = entry->vme_start;
+			} else {
+				SAVE_HINT_MAP_WRITE(map, entry->vme_prev);
 			}
-
 			/*
-			 *	The map has never been unlocked, so it's safe
-			 *	to move to the next entry rather than doing
-			 *	another lookup.
+			 * Others can not only allocate behind us; entries can
+			 * also be coalesced while we don't hold the map lock.
 			 */
-
-			goto CopySuccessful;
+			if (entry == vm_map_to_entry(map)) {
+				break;
+			}
 		}
+		last_timestamp = map->timestamp;
+	}
 
-		new_entry->needs_copy = FALSE;
+	if (map->wait_for_space) {
+		thread_wakeup((event_t) map);
+	}
+	/*
+	 * wake up anybody waiting on entries that we have already deleted.
+	 */
+	if (need_wakeup) {
+		vm_map_entry_wakeup(map);
+	}
 
-		/*
-		 *	Take an object reference, so that we may
-		 *	release the map lock(s).
-		 */
+	if (gap_start != FIND_GAP && gap_start != GAPS_OK) {
+		DTRACE_VM3(kern_vm_deallocate_gap,
+		    vm_map_offset_t, gap_start,
+		    vm_map_offset_t, save_start,
+		    vm_map_offset_t, save_end);
+		if (!(flags & VM_MAP_REMOVE_GAPS_OK)) {
+			vm_map_guard_exception(gap_start, kGUARD_EXC_DEALLOC_GAP);
+		}
+	}
 
-		assert(src_object != VM_OBJECT_NULL);
-		vm_object_reference(src_object);
+	return KERN_SUCCESS;
+}
 
-		/*
-		 *	Record the timestamp for later verification.
-		 *	Unlock the map.
-		 */
+/*
+ *	vm_map_remove:
+ *
+ *	Remove the given address range from the target map, taking the
+ *	map lock around the vm_map_delete call and dropping it afterwards.
+ */
+kern_return_t
+vm_map_remove(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	boolean_t      flags) /* forwarded unchanged to vm_map_delete, which tests VM_MAP_REMOVE_* bits in it */
+{
+	kern_return_t   result;
 
-		version.main_timestamp = src_map->timestamp;
-		vm_map_unlock(src_map);
+	vm_map_lock(map);
+	VM_MAP_RANGE_CHECK(map, start, end); /* may rewrite start/end; see the zone_map note below */
+	/*
+	 * For the zone_map, the kernel controls the allocation/freeing of memory.
+	 * Any free to the zone_map should be within the bounds of the map and
+	 * should free up memory. If the VM_MAP_RANGE_CHECK() silently converts a
+	 * free to the zone_map into a no-op, there is a problem and we should
+	 * panic.
+	 */
+	if ((map == zone_map) && (start == end)) {
+		panic("Nothing being freed to the zone_map. start = end = %p\n", (void *)start);
+	}
+	result = vm_map_delete(map, start, end, flags, VM_MAP_NULL); /* null zap_map: removed entries are not saved */
+	vm_map_unlock(map);
 
-		/*
-		 *	Perform the copy
-		 */
+	return result;
+}
 
-		if (was_wired) {
-			vm_object_lock(src_object);
-			result = vm_object_copy_slowly(
-					src_object,
-					src_offset,
-					src_size,
-					THREAD_UNINT,
-					&new_entry->object.vm_object);
-			new_entry->offset = 0;
-			new_entry->needs_copy = FALSE;
-		} else {
-			result = vm_object_copy_strategically(src_object,
-				src_offset,
-				src_size,
-				&new_entry->object.vm_object,
-				&new_entry->offset,
-				&new_entry_needs_copy);
+/*
+ *	vm_map_remove_locked:
+ *
+ *	Remove the given address range from the target locked map.
+ *	Same as vm_map_remove, except that the map lock is neither taken nor dropped here.
+ */
+kern_return_t
+vm_map_remove_locked(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	boolean_t       flags) /* forwarded unchanged to vm_map_delete */
+{
+	kern_return_t   result;
 
-			new_entry->needs_copy = new_entry_needs_copy;
-			
-		}
+	VM_MAP_RANGE_CHECK(map, start, end);
+	result = vm_map_delete(map, start, end, flags, VM_MAP_NULL); /* null zap_map: removed entries are not saved */
+	return result;
+}
 
-		if (result != KERN_SUCCESS &&
-		    result != KERN_MEMORY_RESTART_COPY) {
-			vm_map_lock(src_map);
-			RETURN(result);
-		}
 
-		/*
-		 *	Throw away the extra reference
-		 */
+/*
+ *	Routine:	vm_map_copy_allocate
+ *
+ *	Description:
+ *		Allocates a zero-filled map copy object from vm_map_copy_zone with an empty entry list.
+ */
+static vm_map_copy_t
+vm_map_copy_allocate(void)
+{
+	vm_map_copy_t new_copy;
 
-		vm_object_deallocate(src_object);
+	new_copy = zalloc(vm_map_copy_zone);
+	bzero(new_copy, sizeof(*new_copy));
+	new_copy->c_u.hdr.rb_head_store.rbh_root = (void*)(int)SKIP_RB_TREE; /* presumably marks the RB tree as unused for copy objects -- TODO confirm */
+	vm_map_copy_first_entry(new_copy) = vm_map_copy_to_entry(new_copy); /* first == sentinel: the list is empty */
+	vm_map_copy_last_entry(new_copy) = vm_map_copy_to_entry(new_copy);
+	return new_copy;
+}
 
-		/*
-		 *	Verify that the map has not substantially
-		 *	changed while the copy was being made.
-		 */
+/*
+ *	Routine:	vm_map_copy_discard
+ *
+ *	Description:
+ *		Dispose of a map copy object (returned by vm_map_copyin),
+ *		releasing what its type refers to; a null copy is a no-op.
+ */
+void
+vm_map_copy_discard(
+	vm_map_copy_t   copy)
+{
+	if (copy == VM_MAP_COPY_NULL) {
+		return;
+	}
 
-		vm_map_lock(src_map);	/* Increments timestamp once! */
+	switch (copy->type) {
+	case VM_MAP_COPY_ENTRY_LIST:
+		while (vm_map_copy_first_entry(copy) !=
+		    vm_map_copy_to_entry(copy)) { /* until only the sentinel is left */
+			vm_map_entry_t  entry = vm_map_copy_first_entry(copy);
 
-		if ((version.main_timestamp + 1) == src_map->timestamp)
-			goto VerificationSuccessful;
+			vm_map_copy_entry_unlink(copy, entry);
+			if (entry->is_sub_map) {
+				vm_map_deallocate(VME_SUBMAP(entry));
+			} else {
+				vm_object_deallocate(VME_OBJECT(entry));
+			}
+			vm_map_copy_entry_dispose(copy, entry);
+		}
+		break; /* the copy header itself is freed by the zfree() below */
+	case VM_MAP_COPY_OBJECT:
+		vm_object_deallocate(copy->cpy_object);
+		break;
+	case VM_MAP_COPY_KERNEL_BUFFER:
 
 		/*
-		 *	Simple version comparison failed.
-		 *
-		 *	Retry the lookup and verify that the
-		 *	same object/offset are still present.
-		 *
-		 *	[Note: a memory manager that colludes with
-		 *	the calling task can detect that we have
-		 *	cheated.  While the map was unlocked, the
-		 *	mapping could have been changed and restored.]
+		 * The vm_map_copy_t and possibly the data buffer were
+		 * allocated by a single call to kalloc(), i.e. the
+		 * vm_map_copy_t was not allocated out of the zone.
 		 */
-
-		if (!vm_map_lookup_entry(src_map, src_start, &tmp_entry)) {
-			RETURN(KERN_INVALID_ADDRESS);
+		if (copy->size > msg_ool_size_small || copy->offset) { /* sanity check before trusting copy->size in kfree() */
+			panic("Invalid vm_map_copy_t sz:%lld, ofst:%lld",
+			    (long long)copy->size, (long long)copy->offset);
 		}
+		kfree(copy, copy->size + cpy_kdata_hdr_sz);
+		return; /* skip the zfree() below: this copy did not come from the zone */
+	}
+	zfree(vm_map_copy_zone, copy);
+}
 
-		src_entry = tmp_entry;
-		vm_map_clip_start(src_map, src_entry, src_start);
+/*
+ *	Routine:	vm_map_copy_copy
+ *
+ *	Description:
+ *			Move the information in a map copy object to
+ *			a new map copy object, leaving the old one
+ *			empty.
+ *
+ *			This is used by kernel routines that need
+ *			to look at out-of-line data (in copyin form)
+ *			before deciding whether to return SUCCESS.
+ *			If the routine returns FAILURE, the original
+ *			copy object will be deallocated; therefore,
+ *			these routines must make a copy of the copy
+ *			object and leave the original empty so that
+ *			deallocation will not fail.
+ */
+vm_map_copy_t
+vm_map_copy_copy(
+	vm_map_copy_t   copy)
+{
+	vm_map_copy_t   new_copy;
 
-		if ((src_entry->protection & VM_PROT_READ == VM_PROT_NONE &&
-			!use_maxprot) ||
-		    src_entry->max_protection & VM_PROT_READ == 0)
-			goto VerificationFailed;
+	if (copy == VM_MAP_COPY_NULL) {
+		return VM_MAP_COPY_NULL;
+	}
 
-		if (src_entry->vme_end < new_entry->vme_end)
-			src_size = (new_entry->vme_end = src_entry->vme_end) - src_start;
+	/*
+	 * Allocate a new copy object from vm_map_copy_zone and structure-assign
+	 * the old header into it; the entries themselves are not cloned.
+	 */
 
-		if ((src_entry->object.vm_object != src_object) ||
-		    (src_entry->offset != src_offset) ) {
+	new_copy = (vm_map_copy_t) zalloc(vm_map_copy_zone);
+	*new_copy = *copy; /* NOTE(review): copies only sizeof(*copy); confirm VM_MAP_COPY_KERNEL_BUFFER copies never reach here */
 
-			/*
-			 *	Verification failed.
-			 *
-			 *	Start over with this top-level entry.
-			 */
+	if (copy->type == VM_MAP_COPY_ENTRY_LIST) {
+		/*
+		 * The links at both ends of the entry chain must be
+		 * changed to point to the new copy object.
+		 */
+		vm_map_copy_first_entry(copy)->vme_prev
+		        = vm_map_copy_to_entry(new_copy);
+		vm_map_copy_last_entry(copy)->vme_next
+		        = vm_map_copy_to_entry(new_copy);
+	}
 
-		 VerificationFailed: ;
+	/*
+	 * Retype the old copy as an object copy with a null object, so
+	 * that it contains nothing to be deallocated.
+	 */
+	copy->type = VM_MAP_COPY_OBJECT;
+	copy->cpy_object = VM_OBJECT_NULL;
 
-			vm_object_deallocate(new_entry->object.vm_object);
-			tmp_entry = src_entry;
-			continue;
-		}
+	/*
+	 * Return the new copy object.
+	 */
+	return new_copy;
+}
 
-		/*
-		 *	Verification succeeded.
-		 */
+static kern_return_t
+vm_map_overwrite_submap_recurse(
+	vm_map_t        dst_map,
+	vm_map_offset_t dst_addr,
+	vm_map_size_t   dst_size)
+{
+	vm_map_offset_t dst_end;
+	vm_map_entry_t  tmp_entry;
+	vm_map_entry_t  entry;
+	kern_return_t   result;
+	boolean_t       encountered_sub_map = FALSE;
 
-	 VerificationSuccessful: ;
 
-		if (result == KERN_MEMORY_RESTART_COPY)
-			goto RestartCopy;
 
-		/*
-		 *	Copy succeeded.
-		 */
+	/*
+	 *	Check that [dst_addr, dst_addr + dst_size) in dst_map is
+	 *	contiguous and writeable, recursing into submaps.  We trunc
+	 *	the destination address and round the end to page boundaries
+	 *	so the clip below does not split entries in strange ways.
+	 */
 
-	 CopySuccessful: ;
+	dst_end = vm_map_round_page(dst_addr + dst_size,
+	    VM_MAP_PAGE_MASK(dst_map));
+	vm_map_lock(dst_map);
 
-		/*
-		 *	Link in the new copy entry.
-		 */
+start_pass_1:
+	if (!vm_map_lookup_entry(dst_map, dst_addr, &tmp_entry)) {
+		vm_map_unlock(dst_map);
+		return KERN_INVALID_ADDRESS;
+	}
 
-		vm_map_copy_entry_link(copy, vm_map_copy_last_entry(copy),
-				       new_entry);
-		
-		/*
-		 *	Determine whether the entire region
-		 *	has been copied.
-		 */
-		src_start = new_entry->vme_end;
-		new_entry = VM_MAP_ENTRY_NULL;
-		while ((src_start >= src_end) && (src_end != 0)) {
-			if (src_map != base_map) {
-				submap_map_t	*ptr;
-
-				ptr = parent_maps;
-				assert(ptr != NULL);
-				parent_maps = parent_maps->next;
-				vm_map_lock(ptr->parent_map);
-				vm_map_unlock(src_map);
-				src_map = ptr->parent_map;
-				src_start = ptr->base_start;
-				src_end = ptr->base_end;
-				if ((src_end > src_start) &&
-					      !vm_map_lookup_entry(
-					      src_map, src_start, &tmp_entry))
-					RETURN(KERN_INVALID_ADDRESS);
-				kfree((vm_offset_t)ptr, sizeof(submap_map_t));
-				if(parent_maps == NULL)
-					map_share = FALSE;
-				src_entry = tmp_entry->vme_prev;
-			} else
-				break;
+	vm_map_clip_start(dst_map,
+	    tmp_entry,
+	    vm_map_trunc_page(dst_addr,
+	    VM_MAP_PAGE_MASK(dst_map)));
+	if (tmp_entry->is_sub_map) {
+		/* clipping did unnest if needed */
+		assert(!tmp_entry->use_pmap);
+	}
+
+	for (entry = tmp_entry;;) {
+		vm_map_entry_t  next;
+
+		next = entry->vme_next;
+		while (entry->is_sub_map) {
+			vm_map_offset_t sub_start;
+			vm_map_offset_t sub_end;
+			vm_map_offset_t local_end;
+
+			if (entry->in_transition) {
+				/*
+				 * Say that we are waiting, and wait for entry.
+				 */
+				entry->needs_wakeup = TRUE;
+				vm_map_entry_wait(dst_map, THREAD_UNINT);
+
+				goto start_pass_1;
+			}
+
+			encountered_sub_map = TRUE;
+			sub_start = VME_OFFSET(entry); /* range to check, expressed in the submap's address space */
+
+			if (entry->vme_end < dst_end) {
+				sub_end = entry->vme_end;
+			} else {
+				sub_end = dst_end;
+			}
+			sub_end -= entry->vme_start;
+			sub_end += VME_OFFSET(entry);
+			local_end = entry->vme_end; /* saved so the lookup after the recursion does not depend on "entry" */
+			vm_map_unlock(dst_map); /* dst_map stays unlocked across the recursive call */
+
+			result = vm_map_overwrite_submap_recurse(
+				VME_SUBMAP(entry),
+				sub_start,
+				sub_end - sub_start);
+
+			if (result != KERN_SUCCESS) {
+				return result; /* dst_map is already unlocked here */
+			}
+			if (dst_end <= entry->vme_end) { /* NOTE(review): "entry" is read while dst_map is unlocked -- confirm this is safe */
+				return KERN_SUCCESS;
+			}
+			vm_map_lock(dst_map);
+			if (!vm_map_lookup_entry(dst_map, local_end,
+			    &tmp_entry)) {
+				vm_map_unlock(dst_map);
+				return KERN_INVALID_ADDRESS;
+			}
+			entry = tmp_entry;
+			next = entry->vme_next;
+		}
+
+		if (!(entry->protection & VM_PROT_WRITE)) {
+			vm_map_unlock(dst_map);
+			return KERN_PROTECTION_FAILURE;
 		}
-		if ((src_start >= src_end) && (src_end != 0))
-			break;
 
 		/*
-		 *	Verify that there are no gaps in the region
+		 *	If the entry is in transition, we must wait
+		 *	for it to exit that state.  Anything could happen
+		 *	when we unlock the map, so start over.
 		 */
+		if (entry->in_transition) {
+			/*
+			 * Say that we are waiting, and wait for entry.
+			 */
+			entry->needs_wakeup = TRUE;
+			vm_map_entry_wait(dst_map, THREAD_UNINT);
 
-		tmp_entry = src_entry->vme_next;
-		if ((tmp_entry->vme_start != src_start) || 
-				(tmp_entry == vm_map_to_entry(src_map)))
-			RETURN(KERN_INVALID_ADDRESS);
-	}
-
-	/*
-	 * If the source should be destroyed, do it now, since the
-	 * copy was successful. 
-	 */
-	if (src_destroy) {
-		(void) vm_map_delete(src_map,
-				     trunc_page(src_addr),
-				     src_end,
-				     (src_map == kernel_map) ?
-					VM_MAP_REMOVE_KUNWIRE :
-					VM_MAP_NO_FLAGS);
-	}
-
-	vm_map_unlock(src_map);
+			goto start_pass_1;
+		}
 
-	/* Fix-up start and end points in copy.  This is necessary */
-	/* when the various entries in the copy object were picked */
-	/* up from different sub-maps */
+/*
+ *		our range is contained completely within this map entry
+ */
+		if (dst_end <= entry->vme_end) {
+			vm_map_unlock(dst_map);
+			return KERN_SUCCESS;
+		}
+/*
+ *		check that range specified is contiguous region
+ */
+		if ((next == vm_map_to_entry(dst_map)) ||
+		    (next->vme_start != entry->vme_end)) {
+			vm_map_unlock(dst_map);
+			return KERN_INVALID_ADDRESS;
+		}
 
-	tmp_entry = vm_map_copy_first_entry(copy);
-	while (tmp_entry != vm_map_copy_to_entry(copy)) {
-		tmp_entry->vme_end = copy_addr + 
-			(tmp_entry->vme_end - tmp_entry->vme_start);
-		tmp_entry->vme_start = copy_addr;
-		copy_addr += tmp_entry->vme_end - tmp_entry->vme_start;
-		tmp_entry = (struct vm_map_entry *)tmp_entry->vme_next;
-	}
+		/*
+		 *	Permanent objects (non-internal or true_share) fail the check only once a submap has been seen.
+		 */
+		if ((VME_OBJECT(entry) != VM_OBJECT_NULL) &&
+		    ((!VME_OBJECT(entry)->internal) ||
+		    (VME_OBJECT(entry)->true_share))) {
+			if (encountered_sub_map) {
+				vm_map_unlock(dst_map);
+				return KERN_FAILURE;
+			}
+		}
 
-	*copy_result = copy;
-	return(KERN_SUCCESS);
 
-#undef	RETURN
+		entry = next;
+	}/* for */
+	vm_map_unlock(dst_map); /* appears unreachable: the loop above only exits via return or goto */
+	return KERN_SUCCESS;
 }
 
 /*
- *	vm_map_copyin_object:
+ *	Routine:	vm_map_copy_overwrite
  *
- *	Create a copy object from an object.
- *	Our caller donates an object reference.
+ *	Description:
+ *		Copy the memory described by the map copy
+ *		object (copy; returned by vm_map_copyin) onto
+ *		the specified destination region (dst_map, dst_addr).
+ *		The destination must be writeable.
+ *
+ *		Unlike vm_map_copyout, this routine actually
+ *		writes over previously-mapped memory.  If the
+ *		previous mapping was to a permanent (user-supplied)
+ *		memory object, it is preserved.
+ *
+ *		The attributes (protection and inheritance) of the
+ *		destination region are preserved.
+ *
+ *		If successful, consumes the copy object.
+ *		Otherwise, the caller is responsible for it.
+ *
+ *	Implementation notes:
+ *		To overwrite aligned temporary virtual memory, it is
+ *		sufficient to remove the previous mapping and insert
+ *		the new copy.  This replacement is done either on
+ *		the whole region (if no permanent virtual memory
+ *		objects are embedded in the destination region) or
+ *		in individual map entries.
+ *
+ *		To overwrite permanent virtual memory, it is necessary
+ *		to copy each page, as the external memory management
+ *		interface currently does not provide any optimizations.
+ *
+ *		Unaligned memory also has to be copied.  It is possible
+ *		to use 'vm_trickery' to copy the aligned data.  This is
+ *		not done but not hard to implement.
+ *
+ *		Once a page of permanent memory has been overwritten,
+ *		it is impossible to interrupt this function; otherwise,
+ *		the call would be neither atomic nor location-independent.
+ *		The kernel-state portion of a user thread must be
+ *		interruptible.
+ *
+ *		It may be expensive to forward all requests that might
+ *		overwrite permanent memory (vm_write, vm_copy) to
+ *		uninterruptible kernel threads.  This routine may be
+ *		called by interruptible threads; however, success is
+ *		not guaranteed -- if the request cannot be performed
+ *		atomically and interruptibly, an error indication is
+ *		returned.
  */
 
-kern_return_t
-vm_map_copyin_object(
-	vm_object_t		object,
-	vm_object_offset_t	offset,	/* offset of region in object */
-	vm_object_size_t	size,	/* size of region in object */
-	vm_map_copy_t	*copy_result)	/* OUT */
+static kern_return_t
+vm_map_copy_overwrite_nested(
+	vm_map_t                dst_map,
+	vm_map_address_t        dst_addr,
+	vm_map_copy_t           copy,
+	boolean_t               interruptible,
+	pmap_t                  pmap,
+	boolean_t               discard_on_success)
 {
-	vm_map_copy_t	copy;		/* Resulting copy */
+	vm_map_offset_t         dst_end;
+	vm_map_entry_t          tmp_entry;
+	vm_map_entry_t          entry;
+	kern_return_t           kr;
+	boolean_t               aligned = TRUE;
+	boolean_t               contains_permanent_objects = FALSE;
+	boolean_t               encountered_sub_map = FALSE;
+	vm_map_offset_t         base_addr;
+	vm_map_size_t           copy_size;
+	vm_map_size_t           total_size;
+
 
 	/*
-	 *	We drop the object into a special copy object
-	 *	that contains the object directly.
+	 *	Check for null copy object.
 	 */
 
-	copy = (vm_map_copy_t) zalloc(vm_map_copy_zone);
-	copy->type = VM_MAP_COPY_OBJECT;
-	copy->cpy_object = object;
-	copy->cpy_index = 0;
-	copy->offset = offset;
-	copy->size = size;
+	if (copy == VM_MAP_COPY_NULL) {
+		return KERN_SUCCESS;
+	}
 
-	*copy_result = copy;
-	return(KERN_SUCCESS);
-}
+	/*
+	 *	Check for special kernel buffer allocated
+	 *	by new_ipc_kmsg_copyin.
+	 */
 
-void
-vm_map_fork_share(
-	vm_map_t	old_map,
-	vm_map_entry_t	old_entry,
-	vm_map_t	new_map)
-{
-	vm_object_t 	object;
-	vm_map_entry_t 	new_entry;
-	kern_return_t	result;
+	if (copy->type == VM_MAP_COPY_KERNEL_BUFFER) {
+		return vm_map_copyout_kernel_buffer(
+			dst_map, &dst_addr,
+			copy, copy->size, TRUE, discard_on_success);
+	}
 
 	/*
-	 *	New sharing code.  New map entry
-	 *	references original object.  Internal
-	 *	objects use asynchronous copy algorithm for
-	 *	future copies.  First make sure we have
-	 *	the right object.  If we need a shadow,
-	 *	or someone else already has one, then
-	 *	make a new shadow and share it.
+	 *      Only works for entry lists at the moment.  Will
+	 *	support page lists later.
 	 */
-	
-	object = old_entry->object.vm_object;
-	if (old_entry->is_sub_map) {
-		assert(old_entry->wired_count == 0);
-#ifndef i386
-		if(old_entry->use_pmap) {
-			result = pmap_nest(new_map->pmap, 
-				(old_entry->object.sub_map)->pmap, 
-				old_entry->vme_start,
-				old_entry->vme_end - old_entry->vme_start);
-			if(result)
-				panic("vm_map_fork_share: pmap_nest failed!");
+
+	assert(copy->type == VM_MAP_COPY_ENTRY_LIST);
+
+	if (copy->size == 0) {
+		if (discard_on_success) {
+			vm_map_copy_discard(copy);
 		}
-#endif
-	} else if (object == VM_OBJECT_NULL) {
-		object = vm_object_allocate((vm_size_t)(old_entry->vme_end -
-							old_entry->vme_start));
-		old_entry->offset = 0;
-		old_entry->object.vm_object = object;
-		assert(!old_entry->needs_copy);
-	} else if (object->copy_strategy !=
-		 MEMORY_OBJECT_COPY_SYMMETRIC) {
-		
-		/*
-		 *	We are already using an asymmetric
-		 *	copy, and therefore we already have
-		 *	the right object.
-		 */
-		
-		assert(! old_entry->needs_copy);
+		return KERN_SUCCESS;
 	}
-	else if (old_entry->needs_copy ||	/* case 1 */
-		 object->shadowed ||		/* case 2 */
-		 (!object->true_share && 	/* case 3 */
-		 !old_entry->is_shared &&
-		 (object->size >
-		  (vm_size_t)(old_entry->vme_end -
-			      old_entry->vme_start)))) {
-		
-		/*
-		 *	We need to create a shadow.
-		 *	There are three cases here.
-		 *	In the first case, we need to
-		 *	complete a deferred symmetrical
-		 *	copy that we participated in.
-		 *	In the second and third cases,
-		 *	we need to create the shadow so
-		 *	that changes that we make to the
-		 *	object do not interfere with
-		 *	any symmetrical copies which
-		 *	have occured (case 2) or which
-		 *	might occur (case 3).
-		 *
-		 *	The first case is when we had
-		 *	deferred shadow object creation
-		 *	via the entry->needs_copy mechanism.
-		 *	This mechanism only works when
-		 *	only one entry points to the source
-		 *	object, and we are about to create
-		 *	a second entry pointing to the
-		 *	same object. The problem is that
-		 *	there is no way of mapping from
-		 *	an object to the entries pointing
-		 *	to it. (Deferred shadow creation
-		 *	works with one entry because occurs
-		 *	at fault time, and we walk from the
-		 *	entry to the object when handling
-		 *	the fault.)
-		 *
-		 *	The second case is when the object
-		 *	to be shared has already been copied
+
+	/*
+	 *	Verify that the destination is all writeable
+	 *	initially.  We have to trunc the destination
+	 *	address and round the copy size or we'll end up
+	 *	splitting entries in strange ways.
+	 */
+
+	if (!VM_MAP_PAGE_ALIGNED(copy->size,
+	    VM_MAP_PAGE_MASK(dst_map)) ||
+	    !VM_MAP_PAGE_ALIGNED(copy->offset,
+	    VM_MAP_PAGE_MASK(dst_map)) ||
+	    !VM_MAP_PAGE_ALIGNED(dst_addr,
+	    VM_MAP_PAGE_MASK(dst_map))) {
+		aligned = FALSE;
+		dst_end = vm_map_round_page(dst_addr + copy->size,
+		    VM_MAP_PAGE_MASK(dst_map));
+	} else {
+		dst_end = dst_addr + copy->size;
+	}
+
+	vm_map_lock(dst_map);
+
+	/* LP64todo - remove this check when vm_map_commpage64()
+	 * no longer has to stuff in a map_entry for the commpage
+	 * above the map's max_offset.
+	 */
+	if (dst_addr >= dst_map->max_offset) {
+		vm_map_unlock(dst_map);
+		return KERN_INVALID_ADDRESS;
+	}
+
+start_pass_1:
+	if (!vm_map_lookup_entry(dst_map, dst_addr, &tmp_entry)) {
+		vm_map_unlock(dst_map);
+		return KERN_INVALID_ADDRESS;
+	}
+	vm_map_clip_start(dst_map,
+	    tmp_entry,
+	    vm_map_trunc_page(dst_addr,
+	    VM_MAP_PAGE_MASK(dst_map)));
+	for (entry = tmp_entry;;) {
+		vm_map_entry_t  next = entry->vme_next;
+
+		while (entry->is_sub_map) {
+			vm_map_offset_t sub_start;
+			vm_map_offset_t sub_end;
+			vm_map_offset_t local_end;
+
+			if (entry->in_transition) {
+				/*
+				 * Say that we are waiting, and wait for entry.
+				 */
+				entry->needs_wakeup = TRUE;
+				vm_map_entry_wait(dst_map, THREAD_UNINT);
+
+				goto start_pass_1;
+			}
+
+			local_end = entry->vme_end;
+			if (!(entry->needs_copy)) {
+				/* if needs_copy we are a COW submap */
+				/* in such a case we just replace so */
+				/* there is no need for the follow-  */
+				/* ing check.                        */
+				encountered_sub_map = TRUE;
+				sub_start = VME_OFFSET(entry);
+
+				if (entry->vme_end < dst_end) {
+					sub_end = entry->vme_end;
+				} else {
+					sub_end = dst_end;
+				}
+				sub_end -= entry->vme_start;
+				sub_end += VME_OFFSET(entry);
+				vm_map_unlock(dst_map);
+
+				kr = vm_map_overwrite_submap_recurse(
+					VME_SUBMAP(entry),
+					sub_start,
+					sub_end - sub_start);
+				if (kr != KERN_SUCCESS) {
+					return kr;
+				}
+				vm_map_lock(dst_map);
+			}
+
+			if (dst_end <= entry->vme_end) {
+				goto start_overwrite;
+			}
+			if (!vm_map_lookup_entry(dst_map, local_end,
+			    &entry)) {
+				vm_map_unlock(dst_map);
+				return KERN_INVALID_ADDRESS;
+			}
+			next = entry->vme_next;
+		}
+
+		if (!(entry->protection & VM_PROT_WRITE)) {
+			vm_map_unlock(dst_map);
+			return KERN_PROTECTION_FAILURE;
+		}
+
+		/*
+		 *	If the entry is in transition, we must wait
+		 *	for it to exit that state.  Anything could happen
+		 *	when we unlock the map, so start over.
+		 */
+		if (entry->in_transition) {
+			/*
+			 * Say that we are waiting, and wait for entry.
+			 */
+			entry->needs_wakeup = TRUE;
+			vm_map_entry_wait(dst_map, THREAD_UNINT);
+
+			goto start_pass_1;
+		}
+
+/*
+ *		our range is contained completely within this map entry
+ */
+		if (dst_end <= entry->vme_end) {
+			break;
+		}
+/*
+ *		check that range specified is contiguous region
+ */
+		if ((next == vm_map_to_entry(dst_map)) ||
+		    (next->vme_start != entry->vme_end)) {
+			vm_map_unlock(dst_map);
+			return KERN_INVALID_ADDRESS;
+		}
+
+
+		/*
+		 *	Check for permanent objects in the destination.
+		 */
+		if ((VME_OBJECT(entry) != VM_OBJECT_NULL) &&
+		    ((!VME_OBJECT(entry)->internal) ||
+		    (VME_OBJECT(entry)->true_share))) {
+			contains_permanent_objects = TRUE;
+		}
+
+		entry = next;
+	}/* for */
+
+start_overwrite:
+	/*
+	 *	If there are permanent objects in the destination, then
+	 *	the copy cannot be interrupted.
+	 */
+
+	if (interruptible && contains_permanent_objects) {
+		vm_map_unlock(dst_map);
+		return KERN_FAILURE;   /* XXX */
+	}
+
+	/*
+	 *
+	 *	Make a second pass, overwriting the data
+	 *	At the beginning of each loop iteration,
+	 *	the next entry to be overwritten is "tmp_entry"
+	 *	(initially, the value returned from the lookup above),
+	 *	and the starting address expected in that entry
+	 *	is "start".
+	 */
+
+	total_size = copy->size;
+	if (encountered_sub_map) {
+		copy_size = 0;
+		/* re-calculate tmp_entry since we've had the map */
+		/* unlocked */
+		if (!vm_map_lookup_entry( dst_map, dst_addr, &tmp_entry)) {
+			vm_map_unlock(dst_map);
+			return KERN_INVALID_ADDRESS;
+		}
+	} else {
+		copy_size = copy->size;
+	}
+
+	base_addr = dst_addr;
+	while (TRUE) {
+		/* deconstruct the copy object and do in parts */
+		/* only in sub_map, interruptible case */
+		vm_map_entry_t  copy_entry;
+		vm_map_entry_t  previous_prev = VM_MAP_ENTRY_NULL;
+		vm_map_entry_t  next_copy = VM_MAP_ENTRY_NULL;
+		int             nentries;
+		int             remaining_entries = 0;
+		vm_map_offset_t new_offset = 0;
+
+		for (entry = tmp_entry; copy_size == 0;) {
+			vm_map_entry_t  next;
+
+			next = entry->vme_next;
+
+			/* tmp_entry and base address are moved along */
+			/* each time we encounter a sub-map.  Otherwise */
+			/* entry can outpace tmp_entry, and the copy_size */
+			/* may reflect the distance between them */
+			/* if the current entry is found to be in transition */
+			/* we will start over at the beginning or the last */
+			/* encounter of a submap as dictated by base_addr */
+			/* we will zero copy_size accordingly. */
+			if (entry->in_transition) {
+				/*
+				 * Say that we are waiting, and wait for entry.
+				 */
+				entry->needs_wakeup = TRUE;
+				vm_map_entry_wait(dst_map, THREAD_UNINT);
+
+				if (!vm_map_lookup_entry(dst_map, base_addr,
+				    &tmp_entry)) {
+					vm_map_unlock(dst_map);
+					return KERN_INVALID_ADDRESS;
+				}
+				copy_size = 0;
+				entry = tmp_entry;
+				continue;
+			}
+			if (entry->is_sub_map) {
+				vm_map_offset_t sub_start;
+				vm_map_offset_t sub_end;
+				vm_map_offset_t local_end;
+
+				if (entry->needs_copy) {
+					/* if this is a COW submap */
+					/* just back the range with a */
+					/* anonymous entry */
+					if (entry->vme_end < dst_end) {
+						sub_end = entry->vme_end;
+					} else {
+						sub_end = dst_end;
+					}
+					if (entry->vme_start < base_addr) {
+						sub_start = base_addr;
+					} else {
+						sub_start = entry->vme_start;
+					}
+					vm_map_clip_end(
+						dst_map, entry, sub_end);
+					vm_map_clip_start(
+						dst_map, entry, sub_start);
+					assert(!entry->use_pmap);
+					assert(!entry->iokit_acct);
+					entry->use_pmap = TRUE;
+					entry->is_sub_map = FALSE;
+					vm_map_deallocate(
+						VME_SUBMAP(entry));
+					VME_OBJECT_SET(entry, VM_OBJECT_NULL);
+					VME_OFFSET_SET(entry, 0);
+					entry->is_shared = FALSE;
+					entry->needs_copy = FALSE;
+					entry->protection = VM_PROT_DEFAULT;
+					entry->max_protection = VM_PROT_ALL;
+					entry->wired_count = 0;
+					entry->user_wired_count = 0;
+					if (entry->inheritance
+					    == VM_INHERIT_SHARE) {
+						entry->inheritance = VM_INHERIT_COPY;
+					}
+					continue;
+				}
+				/* first take care of any non-sub_map */
+				/* entries to send */
+				if (base_addr < entry->vme_start) {
+					/* stuff to send */
+					copy_size =
+					    entry->vme_start - base_addr;
+					break;
+				}
+				sub_start = VME_OFFSET(entry);
+
+				if (entry->vme_end < dst_end) {
+					sub_end = entry->vme_end;
+				} else {
+					sub_end = dst_end;
+				}
+				sub_end -= entry->vme_start;
+				sub_end += VME_OFFSET(entry);
+				local_end = entry->vme_end;
+				vm_map_unlock(dst_map);
+				copy_size = sub_end - sub_start;
+
+				/* adjust the copy object */
+				if (total_size > copy_size) {
+					vm_map_size_t   local_size = 0;
+					vm_map_size_t   entry_size;
+
+					nentries = 1;
+					new_offset = copy->offset;
+					copy_entry = vm_map_copy_first_entry(copy);
+					while (copy_entry !=
+					    vm_map_copy_to_entry(copy)) {
+						entry_size = copy_entry->vme_end -
+						    copy_entry->vme_start;
+						if ((local_size < copy_size) &&
+						    ((local_size + entry_size)
+						    >= copy_size)) {
+							vm_map_copy_clip_end(copy,
+							    copy_entry,
+							    copy_entry->vme_start +
+							    (copy_size - local_size));
+							entry_size = copy_entry->vme_end -
+							    copy_entry->vme_start;
+							local_size += entry_size;
+							new_offset += entry_size;
+						}
+						if (local_size >= copy_size) {
+							next_copy = copy_entry->vme_next;
+							copy_entry->vme_next =
+							    vm_map_copy_to_entry(copy);
+							previous_prev =
+							    copy->cpy_hdr.links.prev;
+							copy->cpy_hdr.links.prev = copy_entry;
+							copy->size = copy_size;
+							remaining_entries =
+							    copy->cpy_hdr.nentries;
+							remaining_entries -= nentries;
+							copy->cpy_hdr.nentries = nentries;
+							break;
+						} else {
+							local_size += entry_size;
+							new_offset += entry_size;
+							nentries++;
+						}
+						copy_entry = copy_entry->vme_next;
+					}
+				}
+
+				if ((entry->use_pmap) && (pmap == NULL)) {
+					kr = vm_map_copy_overwrite_nested(
+						VME_SUBMAP(entry),
+						sub_start,
+						copy,
+						interruptible,
+						VME_SUBMAP(entry)->pmap,
+						TRUE);
+				} else if (pmap != NULL) {
+					kr = vm_map_copy_overwrite_nested(
+						VME_SUBMAP(entry),
+						sub_start,
+						copy,
+						interruptible, pmap,
+						TRUE);
+				} else {
+					kr = vm_map_copy_overwrite_nested(
+						VME_SUBMAP(entry),
+						sub_start,
+						copy,
+						interruptible,
+						dst_map->pmap,
+						TRUE);
+				}
+				if (kr != KERN_SUCCESS) {
+					if (next_copy != NULL) {
+						copy->cpy_hdr.nentries +=
+						    remaining_entries;
+						copy->cpy_hdr.links.prev->vme_next =
+						    next_copy;
+						copy->cpy_hdr.links.prev
+						        = previous_prev;
+						copy->size = total_size;
+					}
+					return kr;
+				}
+				if (dst_end <= local_end) {
+					return KERN_SUCCESS;
+				}
+				/* otherwise copy no longer exists, it was */
+				/* destroyed after successful copy_overwrite */
+				copy = vm_map_copy_allocate();
+				copy->type = VM_MAP_COPY_ENTRY_LIST;
+				copy->offset = new_offset;
+
+				/*
+				 * XXX FBDP
+				 * this does not seem to deal with
+				 * the VM map store (R&B tree)
+				 */
+
+				total_size -= copy_size;
+				copy_size = 0;
+				/* put back remainder of copy in container */
+				if (next_copy != NULL) {
+					copy->cpy_hdr.nentries = remaining_entries;
+					copy->cpy_hdr.links.next = next_copy;
+					copy->cpy_hdr.links.prev = previous_prev;
+					copy->size = total_size;
+					next_copy->vme_prev =
+					    vm_map_copy_to_entry(copy);
+					next_copy = NULL;
+				}
+				base_addr = local_end;
+				vm_map_lock(dst_map);
+				if (!vm_map_lookup_entry(dst_map,
+				    local_end, &tmp_entry)) {
+					vm_map_unlock(dst_map);
+					return KERN_INVALID_ADDRESS;
+				}
+				entry = tmp_entry;
+				continue;
+			}
+			if (dst_end <= entry->vme_end) {
+				copy_size = dst_end - base_addr;
+				break;
+			}
+
+			if ((next == vm_map_to_entry(dst_map)) ||
+			    (next->vme_start != entry->vme_end)) {
+				vm_map_unlock(dst_map);
+				return KERN_INVALID_ADDRESS;
+			}
+
+			entry = next;
+		}/* for */
+
+		next_copy = NULL;
+		nentries = 1;
+
+		/* adjust the copy object */
+		if (total_size > copy_size) {
+			vm_map_size_t   local_size = 0;
+			vm_map_size_t   entry_size;
+
+			new_offset = copy->offset;
+			copy_entry = vm_map_copy_first_entry(copy);
+			while (copy_entry != vm_map_copy_to_entry(copy)) {
+				entry_size = copy_entry->vme_end -
+				    copy_entry->vme_start;
+				if ((local_size < copy_size) &&
+				    ((local_size + entry_size)
+				    >= copy_size)) {
+					vm_map_copy_clip_end(copy, copy_entry,
+					    copy_entry->vme_start +
+					    (copy_size - local_size));
+					entry_size = copy_entry->vme_end -
+					    copy_entry->vme_start;
+					local_size += entry_size;
+					new_offset += entry_size;
+				}
+				if (local_size >= copy_size) {
+					next_copy = copy_entry->vme_next;
+					copy_entry->vme_next =
+					    vm_map_copy_to_entry(copy);
+					previous_prev =
+					    copy->cpy_hdr.links.prev;
+					copy->cpy_hdr.links.prev = copy_entry;
+					copy->size = copy_size;
+					remaining_entries =
+					    copy->cpy_hdr.nentries;
+					remaining_entries -= nentries;
+					copy->cpy_hdr.nentries = nentries;
+					break;
+				} else {
+					local_size += entry_size;
+					new_offset += entry_size;
+					nentries++;
+				}
+				copy_entry = copy_entry->vme_next;
+			}
+		}
+
+		if (aligned) {
+			pmap_t  local_pmap;
+
+			if (pmap) {
+				local_pmap = pmap;
+			} else {
+				local_pmap = dst_map->pmap;
+			}
+
+			if ((kr =  vm_map_copy_overwrite_aligned(
+				    dst_map, tmp_entry, copy,
+				    base_addr, local_pmap)) != KERN_SUCCESS) {
+				if (next_copy != NULL) {
+					copy->cpy_hdr.nentries +=
+					    remaining_entries;
+					copy->cpy_hdr.links.prev->vme_next =
+					    next_copy;
+					copy->cpy_hdr.links.prev =
+					    previous_prev;
+					copy->size += copy_size;
+				}
+				return kr;
+			}
+			vm_map_unlock(dst_map);
+		} else {
+			/*
+			 * Performance gain:
+			 *
+			 * if the copy and dst address are misaligned but the same
+			 * offset within the page we can copy_not_aligned the
+			 * misaligned parts and copy aligned the rest.  If they are
+			 * aligned but len is unaligned we simply need to copy
+			 * the end bit unaligned.  We'll need to split the misaligned
+			 * bits of the region in this case !
+			 */
+			/* ALWAYS UNLOCKS THE dst_map MAP */
+			kr = vm_map_copy_overwrite_unaligned(
+				dst_map,
+				tmp_entry,
+				copy,
+				base_addr,
+				discard_on_success);
+			if (kr != KERN_SUCCESS) {
+				if (next_copy != NULL) {
+					copy->cpy_hdr.nentries +=
+					    remaining_entries;
+					copy->cpy_hdr.links.prev->vme_next =
+					    next_copy;
+					copy->cpy_hdr.links.prev =
+					    previous_prev;
+					copy->size += copy_size;
+				}
+				return kr;
+			}
+		}
+		total_size -= copy_size;
+		if (total_size == 0) {
+			break;
+		}
+		base_addr += copy_size;
+		copy_size = 0;
+		copy->offset = new_offset;
+		if (next_copy != NULL) {
+			copy->cpy_hdr.nentries = remaining_entries;
+			copy->cpy_hdr.links.next = next_copy;
+			copy->cpy_hdr.links.prev = previous_prev;
+			next_copy->vme_prev = vm_map_copy_to_entry(copy);
+			copy->size = total_size;
+		}
+		vm_map_lock(dst_map);
+		while (TRUE) {
+			if (!vm_map_lookup_entry(dst_map,
+			    base_addr, &tmp_entry)) {
+				vm_map_unlock(dst_map);
+				return KERN_INVALID_ADDRESS;
+			}
+			if (tmp_entry->in_transition) {
+				entry->needs_wakeup = TRUE;
+				vm_map_entry_wait(dst_map, THREAD_UNINT);
+			} else {
+				break;
+			}
+		}
+		vm_map_clip_start(dst_map,
+		    tmp_entry,
+		    vm_map_trunc_page(base_addr,
+		    VM_MAP_PAGE_MASK(dst_map)));
+
+		entry = tmp_entry;
+	} /* while */
+
+	/*
+	 *	Throw away the vm_map_copy object
+	 */
+	if (discard_on_success) {
+		vm_map_copy_discard(copy);
+	}
+
+	return KERN_SUCCESS;
+}/* vm_map_copy_overwrite */
+
+/*
+ *	Routine:	vm_map_copy_overwrite
+ *
+ *	Description:
+ *		Overwrite the range of "dst_map" that starts at "dst_addr"
+ *		with the contents of "copy", by way of
+ *		vm_map_copy_overwrite_nested().
+ *
+ *	Implementation:
+ *		When the request is not interruptible, "copy" is an
+ *		entry-list copy map of at least 3 (effective) pages, source
+ *		and destination share the same offset within a page, and the
+ *		destination range holds no submap, "copy" is split in up to
+ *		three pieces: an unaligned "head" that reaches the first page
+ *		boundary, the middle part, and an unaligned "tail" that
+ *		follows the last page boundary.  Each piece is overwritten
+ *		by its own call to vm_map_copy_overwrite_nested().
+ *		In every other case the whole "copy" is handed over in one
+ *		call (the "blunt_copy" path).
+ *
+ *	Returns:
+ *		The value returned by vm_map_copy_overwrite_nested().
+ *		On the split path: on KERN_SUCCESS the head, middle and tail
+ *		copy maps are all discarded here; on failure the head and
+ *		tail entries are linked back into "copy" and its offset and
+ *		size are restored, so the caller gets the original copy map
+ *		back.
+ */
+kern_return_t
+vm_map_copy_overwrite(
+	vm_map_t        dst_map,
+	vm_map_offset_t dst_addr,
+	vm_map_copy_t   copy,
+	boolean_t       interruptible)
+{
+	vm_map_size_t   head_size, tail_size;
+	vm_map_copy_t   head_copy, tail_copy;
+	vm_map_offset_t head_addr, tail_addr;
+	vm_map_entry_t  entry;
+	kern_return_t   kr;
+	vm_map_offset_t effective_page_mask, effective_page_size;
+
+	head_size = 0;
+	tail_size = 0;
+	head_copy = NULL;
+	tail_copy = NULL;
+	head_addr = 0;
+	tail_addr = 0;
+
+	if (interruptible ||
+	    copy == VM_MAP_COPY_NULL ||
+	    copy->type != VM_MAP_COPY_ENTRY_LIST) {
+		/*
+		 * We can't split the "copy" map if we're interruptible
+		 * or if we don't have a "copy" map...
+		 */
+blunt_copy:
+		return vm_map_copy_overwrite_nested(dst_map,
+		           dst_addr,
+		           copy,
+		           interruptible,
+		           (pmap_t) NULL,
+		           TRUE);
+	}
+
+	/*
+	 * Use the largest of the destination map's page mask, the
+	 * copy map's page mask and the kernel's PAGE_MASK.
+	 */
+	effective_page_mask = MAX(VM_MAP_PAGE_MASK(dst_map), PAGE_MASK);
+	effective_page_mask = MAX(VM_MAP_COPY_PAGE_MASK(copy),
+	    effective_page_mask);
+	effective_page_size = effective_page_mask + 1;
+
+	if (copy->size < 3 * effective_page_size) {
+		/*
+		 * Too small to bother with optimizing...
+		 */
+		goto blunt_copy;
+	}
+
+	if ((dst_addr & effective_page_mask) !=
+	    (copy->offset & effective_page_mask)) {
+		/*
+		 * Incompatible mis-alignment of source and destination...
+		 */
+		goto blunt_copy;
+	}
+
+	/*
+	 * Proper alignment or identical mis-alignment at the beginning.
+	 * Let's try and do a small unaligned copy first (if needed)
+	 * and then an aligned copy for the rest.
+	 */
+	if (!vm_map_page_aligned(dst_addr, effective_page_mask)) {
+		head_addr = dst_addr;
+		head_size = (effective_page_size -
+		    (copy->offset & effective_page_mask));
+		head_size = MIN(head_size, copy->size);
+	}
+	if (!vm_map_page_aligned(copy->offset + copy->size,
+	    effective_page_mask)) {
+		/*
+		 * Mis-alignment at the end.
+		 * Do an aligned copy up to the last page and
+		 * then an unaligned copy for the remaining bytes.
+		 */
+		tail_size = ((copy->offset + copy->size) &
+		    effective_page_mask);
+		tail_size = MIN(tail_size, copy->size);
+		tail_addr = dst_addr + copy->size - tail_size;
+		assert(tail_addr >= head_addr + head_size);
+	}
+	assert(head_size + tail_size <= copy->size);
+
+	if (head_size + tail_size == copy->size) {
+		/*
+		 * It's all unaligned, no optimization possible...
+		 */
+		goto blunt_copy;
+	}
+
+	/*
+	 * Can't optimize if there are any submaps in the
+	 * destination due to the way we free the "copy" map
+	 * progressively in vm_map_copy_overwrite_nested()
+	 * in that case.
+	 */
+	vm_map_lock_read(dst_map);
+	if (!vm_map_lookup_entry(dst_map, dst_addr, &entry)) {
+		vm_map_unlock_read(dst_map);
+		goto blunt_copy;
+	}
+	/*
+	 * "entry" walks the entry list of "dst_map", so the end-of-list
+	 * sentinel must be the destination map's own header.  Comparing
+	 * against the header of "copy" could never match and would let
+	 * the walk run past the end of the destination map's list.
+	 */
+	for (;
+	    (entry != vm_map_to_entry(dst_map) &&
+	    entry->vme_start < dst_addr + copy->size);
+	    entry = entry->vme_next) {
+		if (entry->is_sub_map) {
+			vm_map_unlock_read(dst_map);
+			goto blunt_copy;
+		}
+	}
+	vm_map_unlock_read(dst_map);
+
+	if (head_size) {
+		/*
+		 * Unaligned copy of the first "head_size" bytes, to reach
+		 * a page boundary.
+		 */
+
+		/*
+		 * Extract "head_copy" out of "copy".
+		 */
+		head_copy = vm_map_copy_allocate();
+		head_copy->type = VM_MAP_COPY_ENTRY_LIST;
+		head_copy->cpy_hdr.entries_pageable =
+		    copy->cpy_hdr.entries_pageable;
+		vm_map_store_init(&head_copy->cpy_hdr);
+
+		/*
+		 * Only the first entry of "copy" is moved to "head_copy",
+		 * so the head can't extend past the end of that entry.
+		 */
+		entry = vm_map_copy_first_entry(copy);
+		if (entry->vme_end < copy->offset + head_size) {
+			head_size = entry->vme_end - copy->offset;
+		}
+
+		head_copy->offset = copy->offset;
+		head_copy->size = head_size;
+		copy->offset += head_size;
+		copy->size -= head_size;
+
+		vm_map_copy_clip_end(copy, entry, copy->offset);
+		vm_map_copy_entry_unlink(copy, entry);
+		vm_map_copy_entry_link(head_copy,
+		    vm_map_copy_to_entry(head_copy),
+		    entry);
+
+		/*
+		 * Do the unaligned copy.
+		 */
+		kr = vm_map_copy_overwrite_nested(dst_map,
+		    head_addr,
+		    head_copy,
+		    interruptible,
+		    (pmap_t) NULL,
+		    FALSE);
+		if (kr != KERN_SUCCESS) {
+			goto done;
+		}
+	}
+
+	if (tail_size) {
+		/*
+		 * Extract "tail_copy" out of "copy".
+		 */
+		tail_copy = vm_map_copy_allocate();
+		tail_copy->type = VM_MAP_COPY_ENTRY_LIST;
+		tail_copy->cpy_hdr.entries_pageable =
+		    copy->cpy_hdr.entries_pageable;
+		vm_map_store_init(&tail_copy->cpy_hdr);
+
+		tail_copy->offset = copy->offset + copy->size - tail_size;
+		tail_copy->size = tail_size;
+
+		copy->size -= tail_size;
+
+		/*
+		 * Clip the last entry at the start of the tail, then
+		 * re-fetch the last entry before moving it to "tail_copy".
+		 */
+		entry = vm_map_copy_last_entry(copy);
+		vm_map_copy_clip_start(copy, entry, tail_copy->offset);
+		entry = vm_map_copy_last_entry(copy);
+		vm_map_copy_entry_unlink(copy, entry);
+		vm_map_copy_entry_link(tail_copy,
+		    vm_map_copy_last_entry(tail_copy),
+		    entry);
+	}
+
+	/*
+	 * Copy most (or possibly all) of the data.
+	 */
+	kr = vm_map_copy_overwrite_nested(dst_map,
+	    dst_addr + head_size,
+	    copy,
+	    interruptible,
+	    (pmap_t) NULL,
+	    FALSE);
+	if (kr != KERN_SUCCESS) {
+		goto done;
+	}
+
+	if (tail_size) {
+		kr = vm_map_copy_overwrite_nested(dst_map,
+		    tail_addr,
+		    tail_copy,
+		    interruptible,
+		    (pmap_t) NULL,
+		    FALSE);
+	}
+
+done:
+	assert(copy->type == VM_MAP_COPY_ENTRY_LIST);
+	if (kr == KERN_SUCCESS) {
+		/*
+		 * Discard all the copy maps.
+		 */
+		if (head_copy) {
+			vm_map_copy_discard(head_copy);
+			head_copy = NULL;
+		}
+		vm_map_copy_discard(copy);
+		if (tail_copy) {
+			vm_map_copy_discard(tail_copy);
+			tail_copy = NULL;
+		}
+	} else {
+		/*
+		 * Re-assemble the original copy map.
+		 */
+		if (head_copy) {
+			entry = vm_map_copy_first_entry(head_copy);
+			vm_map_copy_entry_unlink(head_copy, entry);
+			vm_map_copy_entry_link(copy,
+			    vm_map_copy_to_entry(copy),
+			    entry);
+			copy->offset -= head_size;
+			copy->size += head_size;
+			vm_map_copy_discard(head_copy);
+			head_copy = NULL;
+		}
+		if (tail_copy) {
+			entry = vm_map_copy_last_entry(tail_copy);
+			vm_map_copy_entry_unlink(tail_copy, entry);
+			vm_map_copy_entry_link(copy,
+			    vm_map_copy_last_entry(copy),
+			    entry);
+			copy->size += tail_size;
+			vm_map_copy_discard(tail_copy);
+			tail_copy = NULL;
+		}
+	}
+	return kr;
+}
+
+
+/*
+ *	Routine: vm_map_copy_overwrite_unaligned	[internal use only]
+ *
+ *	Description:
+ *	Physically copy unaligned data
+ *
+ *	Implementation:
+ *	Unaligned parts of pages have to be physically copied.  We use
+ *	a modified form of vm_fault_copy (which understands non-aligned
+ *	page offsets and sizes) to do the copy.  We attempt to copy as
+ *	much memory in one go as possible; however, vm_fault_copy copies
+ *	within 1 memory object so we have to find the smallest of "amount left",
+ *	"source object data size" and "target object data size".  With
+ *	unaligned data we don't need to split regions, therefore the source
+ *	(copy) object should be one map entry, the target range may be split
+ *	over multiple map entries however.  In any event we are pessimistic
+ *	about these assumptions.
+ *
+ *	Parameters:
+ *	dst_map			destination map
+ *	entry			destination map entry that contains "start"
+ *	copy			copy map holding the source data
+ *	start			destination address at which to start writing
+ *	discard_on_success	if set, each copy entry is unlinked from
+ *				"copy" and disposed of once it has been
+ *				fully consumed
+ *
+ *	Assumptions:
+ *	dst_map is expected to be write-locked on entry; the lock is
+ *	downgraded to a read lock right away.  Every return taken from
+ *	inside the copy loop, success or error, happens with dst_map
+ *	unlocked.
+ *	NOTE(review): the "return KERN_SUCCESS" that follows the loop is
+ *	only reached when copy->size is 0 on entry, and in that case the
+ *	read lock is still held -- confirm callers never pass an empty copy.
+ */
+
+static kern_return_t
+vm_map_copy_overwrite_unaligned(
+	vm_map_t        dst_map,
+	vm_map_entry_t  entry,
+	vm_map_copy_t   copy,
+	vm_map_offset_t start,
+	boolean_t       discard_on_success)
+{
+	vm_map_entry_t          copy_entry;
+	vm_map_entry_t          copy_entry_next;
+	vm_map_version_t        version;
+	vm_object_t             dst_object;
+	vm_object_offset_t      dst_offset;
+	vm_object_offset_t      src_offset;
+	vm_object_offset_t      entry_offset;
+	vm_map_offset_t         entry_end;
+	vm_map_size_t           src_size,
+	    dst_size,
+	    copy_size,
+	    amount_left;
+	kern_return_t           kr = KERN_SUCCESS;
+
+
+	copy_entry = vm_map_copy_first_entry(copy);
+
+	vm_map_lock_write_to_read(dst_map);
+
+	src_offset = copy->offset - vm_object_trunc_page(copy->offset);
+	amount_left = copy->size;
+/*
+ *	unaligned so we never clipped this entry, we need the offset into
+ *	the vm_object not just the data.
+ */
+	while (amount_left > 0) {
+		if (entry == vm_map_to_entry(dst_map)) {
+			vm_map_unlock_read(dst_map);
+			return KERN_INVALID_ADDRESS;
+		}
+
+		/* "start" must be within the current map entry */
+		assert((start >= entry->vme_start) && (start < entry->vme_end));
+
+		dst_offset = start - entry->vme_start;
+
+		dst_size = entry->vme_end - start;
+
+		src_size = copy_entry->vme_end -
+		    (copy_entry->vme_start + src_offset);
+
+		if (dst_size < src_size) {
+/*
+ *			we can only copy dst_size bytes before
+ *			we have to get the next destination entry
+ */
+			copy_size = dst_size;
+		} else {
+/*
+ *			we can only copy src_size bytes before
+ *			we have to get the next source copy entry
+ */
+			copy_size = src_size;
+		}
+
+		if (copy_size > amount_left) {
+			copy_size = amount_left;
+		}
+/*
+ *		Entry needs copy, create a shadow object for
+ *		Copy on write region.  This modifies the entry, so the
+ *		read lock is upgraded first; if the upgrade fails the
+ *		read lock is re-taken and the entry is looked up again.
+ */
+		if (entry->needs_copy &&
+		    ((entry->protection & VM_PROT_WRITE) != 0)) {
+			if (vm_map_lock_read_to_write(dst_map)) {
+				vm_map_lock_read(dst_map);
+				goto RetryLookup;
+			}
+			VME_OBJECT_SHADOW(entry,
+			    (vm_map_size_t)(entry->vme_end
+			    - entry->vme_start));
+			entry->needs_copy = FALSE;
+			vm_map_lock_write_to_read(dst_map);
+		}
+		dst_object = VME_OBJECT(entry);
+/*
+ *		unlike with the virtual (aligned) copy we're going
+ *		to fault on it therefore we need a target object.
+ *		Installing one modifies the entry, so the same
+ *		upgrade-or-retry sequence as above is used.
+ */
+		if (dst_object == VM_OBJECT_NULL) {
+			if (vm_map_lock_read_to_write(dst_map)) {
+				vm_map_lock_read(dst_map);
+				goto RetryLookup;
+			}
+			dst_object = vm_object_allocate((vm_map_size_t)
+			    entry->vme_end - entry->vme_start);
+			VME_OBJECT_SET(entry, dst_object);
+			VME_OFFSET_SET(entry, 0);
+			assert(entry->use_pmap);
+			vm_map_lock_write_to_read(dst_map);
+		}
+/*
+ *		Take an object reference and unlock map. The "entry" may
+ *		disappear or change when the map is unlocked, so the map
+ *		timestamp, the entry's object offset and the entry's end
+ *		address are saved first for use after the unlock.
+ */
+		vm_object_reference(dst_object);
+		version.main_timestamp = dst_map->timestamp;
+		entry_offset = VME_OFFSET(entry);
+		entry_end = entry->vme_end;
+		vm_map_unlock_read(dst_map);
+/*
+ *		Copy as much as possible in one pass.
+ *		copy_size is passed by pointer; presumably vm_fault_copy()
+ *		updates it to the amount actually copied, which is what
+ *		the bookkeeping right after the call relies on.
+ */
+		kr = vm_fault_copy(
+			VME_OBJECT(copy_entry),
+			VME_OFFSET(copy_entry) + src_offset,
+			&copy_size,
+			dst_object,
+			entry_offset + dst_offset,
+			dst_map,
+			&version,
+			THREAD_UNINT );
+
+		start += copy_size;
+		src_offset += copy_size;
+		amount_left -= copy_size;
+/*
+ *		Release the object reference
+ */
+		vm_object_deallocate(dst_object);
+/*
+ *		If a hard error occurred, return it now
+ *		(the map is not locked at this point).
+ */
+		if (kr != KERN_SUCCESS) {
+			return kr;
+		}
+
+		if ((copy_entry->vme_start + src_offset) == copy_entry->vme_end
+		    || amount_left == 0) {
+/*
+ *			all done with this copy entry, dispose.
+ *			The next entry is fetched before the current one
+ *			may be unlinked and freed.
+ */
+			copy_entry_next = copy_entry->vme_next;
+
+			if (discard_on_success) {
+				vm_map_copy_entry_unlink(copy, copy_entry);
+				assert(!copy_entry->is_sub_map);
+				vm_object_deallocate(VME_OBJECT(copy_entry));
+				vm_map_copy_entry_dispose(copy, copy_entry);
+			}
+
+			if (copy_entry_next == vm_map_copy_to_entry(copy) &&
+			    amount_left) {
+/*
+ *				not finished copying but run out of source
+ */
+				return KERN_INVALID_ADDRESS;
+			}
+
+			copy_entry = copy_entry_next;
+
+			src_offset = 0;
+		}
+
+		if (amount_left == 0) {
+			return KERN_SUCCESS;
+		}
+
+		vm_map_lock_read(dst_map);
+		if (version.main_timestamp == dst_map->timestamp) {
+			if (start == entry_end) {
+/*
+ *				destination region is split.  Use the version
+ *				information to avoid a lookup in the normal
+ *				case.
+ */
+				entry = entry->vme_next;
+/*
+ *				should be contiguous. Fail if we encounter
+ *				a hole in the destination.
+ */
+				if (start != entry->vme_start) {
+					vm_map_unlock_read(dst_map);
+					return KERN_INVALID_ADDRESS;
+				}
+			}
+		} else {
+/*
+ *			Map version check failed.
+ *			we must lookup the entry because somebody
+ *			might have changed the map behind our backs.
+ *			(RetryLookup is also the target of the failed
+ *			lock upgrades above; the read lock is held here.)
+ */
+RetryLookup:
+			if (!vm_map_lookup_entry(dst_map, start, &entry)) {
+				vm_map_unlock_read(dst_map);
+				return KERN_INVALID_ADDRESS;
+			}
+		}
+	}/* while */
+
+	return KERN_SUCCESS;
+}/* vm_map_copy_overwrite_unaligned */
+
+/*
+ *	Routine: vm_map_copy_overwrite_aligned	[internal use only]
+ *
+ *	Description:
+ *	Does all the vm_trickery possible for whole pages.
+ *
+ *	Implementation:
+ *
+ *	If there are no permanent objects in the destination,
+ *	and the source and destination map entry zones match,
+ *	and the destination map entry is not shared,
+ *	then the map entries can be deleted and replaced
+ *	with those from the copy.  The following code is the
+ *	basic idea of what to do, but there are lots of annoying
+ *	little details about getting protection and inheritance
+ *	right.  Should add protection, inheritance, and sharing checks
+ *	to the above pass and make sure that no wiring is involved.
+ */
+
+int vm_map_copy_overwrite_aligned_src_not_internal = 0; /* slow_copy taken: source object chain ends in a non-internal object */
+int vm_map_copy_overwrite_aligned_src_not_symmetric = 0; /* slow_copy taken: source chain has a true_share or non-SYMMETRIC object */
+int vm_map_copy_overwrite_aligned_src_large = 0; /* slow_copy taken: small copy (<= 128 KB) out of a large (>= 64 MB) source object */
+
+static kern_return_t
+vm_map_copy_overwrite_aligned(
+	vm_map_t        dst_map,
+	vm_map_entry_t  tmp_entry,
+	vm_map_copy_t   copy,
+	vm_map_offset_t start,
+	__unused pmap_t pmap)
+{
+	vm_object_t     object;
+	vm_map_entry_t  copy_entry;
+	vm_map_size_t   copy_size;
+	vm_map_size_t   size;
+	vm_map_entry_t  entry;
+
+	while ((copy_entry = vm_map_copy_first_entry(copy))
+	    != vm_map_copy_to_entry(copy)) {
+		copy_size = (copy_entry->vme_end - copy_entry->vme_start);
+
+		entry = tmp_entry;
+		if (entry->is_sub_map) {
+			/* unnested when clipped earlier */
+			assert(!entry->use_pmap);
+		}
+		if (entry == vm_map_to_entry(dst_map)) {
+			vm_map_unlock(dst_map);
+			return KERN_INVALID_ADDRESS;
+		}
+		size = (entry->vme_end - entry->vme_start);
+		/*
+		 *	Make sure that no holes popped up in the
+		 *	address map, and that the protection is
+		 *	still valid, in case the map was unlocked
+		 *	earlier.
+		 */
+
+		if ((entry->vme_start != start) || ((entry->is_sub_map)
+		    && !entry->needs_copy)) {
+			vm_map_unlock(dst_map);
+			return KERN_INVALID_ADDRESS;
+		}
+		assert(entry != vm_map_to_entry(dst_map));
+
+		/*
+		 *	Check protection again
+		 */
+
+		if (!(entry->protection & VM_PROT_WRITE)) {
+			vm_map_unlock(dst_map);
+			return KERN_PROTECTION_FAILURE;
+		}
+
+		/*
+		 *	Adjust to source size first
+		 */
+
+		if (copy_size < size) {
+			if (entry->map_aligned &&
+			    !VM_MAP_PAGE_ALIGNED(entry->vme_start + copy_size,
+			    VM_MAP_PAGE_MASK(dst_map))) {
+				/* no longer map-aligned */
+				entry->map_aligned = FALSE;
+			}
+			vm_map_clip_end(dst_map, entry, entry->vme_start + copy_size);
+			size = copy_size;
+		}
+
+		/*
+		 *	Adjust to destination size
+		 */
+
+		if (size < copy_size) {
+			vm_map_copy_clip_end(copy, copy_entry,
+			    copy_entry->vme_start + size);
+			copy_size = size;
+		}
+
+		assert((entry->vme_end - entry->vme_start) == size);
+		assert((tmp_entry->vme_end - tmp_entry->vme_start) == size);
+		assert((copy_entry->vme_end - copy_entry->vme_start) == size);
+
+		/*
+		 *	If the destination contains temporary unshared memory,
+		 *	we can perform the copy by throwing it away and
+		 *	installing the source data.
+		 */
+
+		object = VME_OBJECT(entry);
+		if ((!entry->is_shared &&
+		    ((object == VM_OBJECT_NULL) ||
+		    (object->internal && !object->true_share))) ||
+		    entry->needs_copy) {
+			vm_object_t     old_object = VME_OBJECT(entry);
+			vm_object_offset_t      old_offset = VME_OFFSET(entry);
+			vm_object_offset_t      offset;
+
+			/*
+			 * Ensure that the source and destination aren't
+			 * identical
+			 */
+			if (old_object == VME_OBJECT(copy_entry) &&
+			    old_offset == VME_OFFSET(copy_entry)) {
+				vm_map_copy_entry_unlink(copy, copy_entry);
+				vm_map_copy_entry_dispose(copy, copy_entry);
+
+				if (old_object != VM_OBJECT_NULL) {
+					vm_object_deallocate(old_object);
+				}
+
+				start = tmp_entry->vme_end;
+				tmp_entry = tmp_entry->vme_next;
+				continue;
+			}
+
+#if !CONFIG_EMBEDDED
+#define __TRADEOFF1_OBJ_SIZE (64 * 1024 * 1024) /* 64 MB */
+#define __TRADEOFF1_COPY_SIZE (128 * 1024)      /* 128 KB */
+			if (VME_OBJECT(copy_entry) != VM_OBJECT_NULL &&
+			    VME_OBJECT(copy_entry)->vo_size >= __TRADEOFF1_OBJ_SIZE &&
+			    copy_size <= __TRADEOFF1_COPY_SIZE) {
+				/*
+				 * Virtual vs. Physical copy tradeoff #1.
+				 *
+				 * Copying only a few pages out of a large
+				 * object:  do a physical copy instead of
+				 * a virtual copy, to avoid possibly keeping
+				 * the entire large object alive because of
+				 * those few copy-on-write pages.
+				 */
+				vm_map_copy_overwrite_aligned_src_large++;
+				goto slow_copy;
+			}
+#endif /* !CONFIG_EMBEDDED */
+
+			if ((dst_map->pmap != kernel_pmap) &&
+			    (VME_ALIAS(entry) >= VM_MEMORY_MALLOC) &&
+			    (VME_ALIAS(entry) <= VM_MEMORY_MALLOC_MEDIUM)) {
+				vm_object_t new_object, new_shadow;
+
+				/*
+				 * We're about to map something over a mapping
+				 * established by malloc()...
+				 */
+				new_object = VME_OBJECT(copy_entry);
+				if (new_object != VM_OBJECT_NULL) {
+					vm_object_lock_shared(new_object);
+				}
+				while (new_object != VM_OBJECT_NULL &&
+#if !CONFIG_EMBEDDED
+				    !new_object->true_share &&
+				    new_object->copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC &&
+#endif /* !CONFIG_EMBEDDED */
+				    new_object->internal) {
+					new_shadow = new_object->shadow;
+					if (new_shadow == VM_OBJECT_NULL) {
+						break;
+					}
+					vm_object_lock_shared(new_shadow);
+					vm_object_unlock(new_object);
+					new_object = new_shadow;
+				}
+				if (new_object != VM_OBJECT_NULL) {
+					if (!new_object->internal) {
+						/*
+						 * The new mapping is backed
+						 * by an external object.  We
+						 * don't want malloc'ed memory
+						 * to be replaced with such a
+						 * non-anonymous mapping, so
+						 * let's go off the optimized
+						 * path...
+						 */
+						vm_map_copy_overwrite_aligned_src_not_internal++;
+						vm_object_unlock(new_object);
+						goto slow_copy;
+					}
+#if !CONFIG_EMBEDDED
+					if (new_object->true_share ||
+					    new_object->copy_strategy != MEMORY_OBJECT_COPY_SYMMETRIC) {
+						/*
+						 * Same if there's a "true_share"
+						 * object in the shadow chain, or
+						 * an object with a non-default
+						 * (SYMMETRIC) copy strategy.
+						 */
+						vm_map_copy_overwrite_aligned_src_not_symmetric++;
+						vm_object_unlock(new_object);
+						goto slow_copy;
+					}
+#endif /* !CONFIG_EMBEDDED */
+					vm_object_unlock(new_object);
+				}
+				/*
+				 * The new mapping is still backed by
+				 * anonymous (internal) memory, so it's
+				 * OK to substitute it for the original
+				 * malloc() mapping.
+				 */
+			}
+
+			if (old_object != VM_OBJECT_NULL) {
+				if (entry->is_sub_map) {
+					if (entry->use_pmap) {
+#ifndef NO_NESTED_PMAP
+						pmap_unnest(dst_map->pmap,
+						    (addr64_t)entry->vme_start,
+						    entry->vme_end - entry->vme_start);
+#endif  /* NO_NESTED_PMAP */
+						if (dst_map->mapped_in_other_pmaps) {
+							/* clean up parent */
+							/* map/maps */
+							vm_map_submap_pmap_clean(
+								dst_map, entry->vme_start,
+								entry->vme_end,
+								VME_SUBMAP(entry),
+								VME_OFFSET(entry));
+						}
+					} else {
+						vm_map_submap_pmap_clean(
+							dst_map, entry->vme_start,
+							entry->vme_end,
+							VME_SUBMAP(entry),
+							VME_OFFSET(entry));
+					}
+					vm_map_deallocate(VME_SUBMAP(entry));
+				} else {
+					if (dst_map->mapped_in_other_pmaps) {
+						vm_object_pmap_protect_options(
+							VME_OBJECT(entry),
+							VME_OFFSET(entry),
+							entry->vme_end
+							- entry->vme_start,
+							PMAP_NULL,
+							entry->vme_start,
+							VM_PROT_NONE,
+							PMAP_OPTIONS_REMOVE);
+					} else {
+						pmap_remove_options(
+							dst_map->pmap,
+							(addr64_t)(entry->vme_start),
+							(addr64_t)(entry->vme_end),
+							PMAP_OPTIONS_REMOVE);
+					}
+					vm_object_deallocate(old_object);
+				}
+			}
+
+			if (entry->iokit_acct) {
+				/* keep using iokit accounting */
+				entry->use_pmap = FALSE;
+			} else {
+				/* use pmap accounting */
+				entry->use_pmap = TRUE;
+			}
+			entry->is_sub_map = FALSE;
+			VME_OBJECT_SET(entry, VME_OBJECT(copy_entry));
+			object = VME_OBJECT(entry);
+			entry->needs_copy = copy_entry->needs_copy;
+			entry->wired_count = 0;
+			entry->user_wired_count = 0;
+			offset = VME_OFFSET(copy_entry);
+			VME_OFFSET_SET(entry, offset);
+
+			vm_map_copy_entry_unlink(copy, copy_entry);
+			vm_map_copy_entry_dispose(copy, copy_entry);
+
+			/*
+			 * we could try to push pages into the pmap at this point, BUT
+			 * this optimization only saved on average 2 us per page if ALL
+			 * the pages in the source were currently mapped
+			 * and ALL the pages in the dest were touched, if there were fewer
+			 * than 2/3 of the pages touched, this optimization actually cost more cycles
+			 * it also puts a lot of pressure on the pmap layer w/r to mapping structures
+			 */
+
+			/*
+			 *	Set up for the next iteration.  The map
+			 *	has not been unlocked, so the next
+			 *	address should be at the end of this
+			 *	entry, and the next map entry should be
+			 *	the one following it.
+			 */
+
+			start = tmp_entry->vme_end;
+			tmp_entry = tmp_entry->vme_next;
+		} else {
+			vm_map_version_t        version;
+			vm_object_t             dst_object;
+			vm_object_offset_t      dst_offset;
+			kern_return_t           r;
+
+slow_copy:
+			if (entry->needs_copy) {
+				VME_OBJECT_SHADOW(entry,
+				    (entry->vme_end -
+				    entry->vme_start));
+				entry->needs_copy = FALSE;
+			}
+
+			dst_object = VME_OBJECT(entry);
+			dst_offset = VME_OFFSET(entry);
+
+			/*
+			 *	Take an object reference, and record
+			 *	the map version information so that the
+			 *	map can be safely unlocked.
+			 */
+
+			if (dst_object == VM_OBJECT_NULL) {
+				/*
+				 * We would usually have just taken the
+				 * optimized path above if the destination
+				 * object has not been allocated yet.  But we
+				 * now disable that optimization if the copy
+				 * entry's object is not backed by anonymous
+				 * memory to avoid replacing malloc'ed
+				 * (i.e. re-usable) anonymous memory with a
+				 * not-so-anonymous mapping.
+				 * So we have to handle this case here and
+				 * allocate a new VM object for this map entry.
+				 */
+				dst_object = vm_object_allocate(
+					entry->vme_end - entry->vme_start);
+				dst_offset = 0;
+				VME_OBJECT_SET(entry, dst_object);
+				VME_OFFSET_SET(entry, dst_offset);
+				assert(entry->use_pmap);
+			}
+
+			vm_object_reference(dst_object);
+
+			/* account for unlock bumping up timestamp */
+			version.main_timestamp = dst_map->timestamp + 1;
+
+			vm_map_unlock(dst_map);
+
+			/*
+			 *	Copy as much as possible in one pass
+			 */
+
+			copy_size = size;
+			r = vm_fault_copy(
+				VME_OBJECT(copy_entry),
+				VME_OFFSET(copy_entry),
+				&copy_size,
+				dst_object,
+				dst_offset,
+				dst_map,
+				&version,
+				THREAD_UNINT );
+
+			/*
+			 *	Release the object reference
+			 */
+
+			vm_object_deallocate(dst_object);
+
+			/*
+			 *	If a hard error occurred, return it now
+			 */
+
+			if (r != KERN_SUCCESS) {
+				return r;
+			}
+
+			if (copy_size != 0) {
+				/*
+				 *	Dispose of the copied region
+				 */
+
+				vm_map_copy_clip_end(copy, copy_entry,
+				    copy_entry->vme_start + copy_size);
+				vm_map_copy_entry_unlink(copy, copy_entry);
+				vm_object_deallocate(VME_OBJECT(copy_entry));
+				vm_map_copy_entry_dispose(copy, copy_entry);
+			}
+
+			/*
+			 *	Pick up in the destination map where we left off.
+			 *
+			 *	Use the version information to avoid a lookup
+			 *	in the normal case.
+			 */
+
+			start += copy_size;
+			vm_map_lock(dst_map);
+			if (version.main_timestamp == dst_map->timestamp &&
+			    copy_size != 0) {
+				/* We can safely use saved tmp_entry value */
+
+				if (tmp_entry->map_aligned &&
+				    !VM_MAP_PAGE_ALIGNED(
+					    start,
+					    VM_MAP_PAGE_MASK(dst_map))) {
+					/* no longer map-aligned */
+					tmp_entry->map_aligned = FALSE;
+				}
+				vm_map_clip_end(dst_map, tmp_entry, start);
+				tmp_entry = tmp_entry->vme_next;
+			} else {
+				/* Must do lookup of tmp_entry */
+
+				if (!vm_map_lookup_entry(dst_map, start, &tmp_entry)) {
+					vm_map_unlock(dst_map);
+					return KERN_INVALID_ADDRESS;
+				}
+				if (tmp_entry->map_aligned &&
+				    !VM_MAP_PAGE_ALIGNED(
+					    start,
+					    VM_MAP_PAGE_MASK(dst_map))) {
+					/* no longer map-aligned */
+					tmp_entry->map_aligned = FALSE;
+				}
+				vm_map_clip_start(dst_map, tmp_entry, start);
+			}
+		}
+	}/* while */
+
+	return KERN_SUCCESS;
+}/* vm_map_copy_overwrite_aligned */
+
+/*
+ *	Routine: vm_map_copyin_kernel_buffer [internal use only]
+ *
+ *	Description:
+ *		Copy in data to a kernel buffer from space in the
+ *		source map. The original space may be optionally
+ *		deallocated.
+ *
+ *		If successful, returns a new copy object.
+ *
+ *	Parameters:
+ *		src_map		map the data is read from
+ *		src_addr	address of the first byte to copy
+ *		len		number of bytes to copy; rejected if it
+ *				exceeds msg_ool_size_small
+ *		src_destroy	if TRUE, the page-rounded source range is
+ *				removed from src_map once the data has
+ *				been copied in
+ *		copy_result	receives the new copy object; only
+ *				written on success
+ *
+ *	Returns:
+ *		KERN_INVALID_ARGUMENT if len > msg_ool_size_small,
+ *		KERN_RESOURCE_SHORTAGE if kalloc() fails,
+ *		the copyinmap() error if the source cannot be read
+ *		(the buffer is freed before returning),
+ *		KERN_SUCCESS otherwise.
+ *
+ *	The copy object and its data live in a single kalloc()
+ *	allocation of (cpy_kdata_hdr_sz + len) bytes; the data is
+ *	stored at copy->cpy_kdata.
+ */
+static kern_return_t
+vm_map_copyin_kernel_buffer(
+	vm_map_t        src_map,
+	vm_map_offset_t src_addr,
+	vm_map_size_t   len,
+	boolean_t       src_destroy,
+	vm_map_copy_t   *copy_result)
+{
+	kern_return_t kr;
+	vm_map_copy_t copy;
+	vm_size_t kalloc_size;
+
+	if (len > msg_ool_size_small) {
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	kalloc_size = (vm_size_t)(cpy_kdata_hdr_sz + len);
+
+	copy = (vm_map_copy_t)kalloc(kalloc_size);
+	if (copy == VM_MAP_COPY_NULL) {
+		return KERN_RESOURCE_SHORTAGE;
+	}
+	copy->type = VM_MAP_COPY_KERNEL_BUFFER;
+	copy->size = len;
+	copy->offset = 0; /* vm_map_copyout_kernel_buffer() panics on a non-zero offset */
+
+	kr = copyinmap(src_map, src_addr, copy->cpy_kdata, (vm_size_t)len);
+	if (kr != KERN_SUCCESS) {
+		kfree(copy, kalloc_size);
+		return kr;
+	}
+	if (src_destroy) { /* the vm_map_remove() result is discarded */
+		(void) vm_map_remove(
+			src_map,
+			vm_map_trunc_page(src_addr,
+			VM_MAP_PAGE_MASK(src_map)),
+			vm_map_round_page(src_addr + len,
+			VM_MAP_PAGE_MASK(src_map)),
+			(VM_MAP_REMOVE_INTERRUPTIBLE |
+			VM_MAP_REMOVE_WAIT_FOR_KWIRE |
+			((src_map == kernel_map) ? VM_MAP_REMOVE_KUNWIRE : VM_MAP_REMOVE_NO_FLAGS)));
+	}
+	*copy_result = copy;
+	return KERN_SUCCESS;
+}
+
+/*
+ *	Routine: vm_map_copyout_kernel_buffer	[internal use only]
+ *
+ *	Description:
+ *		Copy out data from a kernel buffer into space in the
+ *		destination map. The space may be optionally dynamically
+ *		allocated.
+ *
+ *		If successful, consumes the copy object.
+ *		Otherwise, the caller is responsible for it.
+ *
+ *	Parameters:
+ *		map		destination map
+ *		addr		IN/OUT.  With overwrite, the caller's
+ *				destination address.  Without overwrite,
+ *				reset to 0 and then set by vm_map_enter()
+ *				to the newly allocated range; set back
+ *				to 0 if the copyout fails.
+ *		copy		kernel-buffer copy object; copy->size is
+ *				asserted to equal copy_size
+ *		copy_size	number of bytes to copy out
+ *		overwrite	if TRUE, copy to *addr without allocating
+ *		consume_on_success
+ *				if TRUE, the copy object is freed once the
+ *				data has been copied out; if FALSE it is
+ *				left to the caller even on success
+ *
+ *	Returns:
+ *		the vm_map_enter() error if space cannot be allocated,
+ *		KERN_INVALID_ADDRESS if copyout() fails,
+ *		KERN_SUCCESS otherwise.
+ *
+ *	Panics if copy_size exceeds msg_ool_size_small or if
+ *	copy->offset is non-zero.
+ *
+ *	vm_map_copyout_kernel_buffer_failures (below) is incremented
+ *	only when copyout() fails while targeting a map other than the
+ *	current thread's map.
+ */
+static int vm_map_copyout_kernel_buffer_failures = 0;
+static kern_return_t
+vm_map_copyout_kernel_buffer(
+	vm_map_t                map,
+	vm_map_address_t        *addr,  /* IN/OUT */
+	vm_map_copy_t           copy,
+	vm_map_size_t           copy_size,
+	boolean_t               overwrite,
+	boolean_t               consume_on_success)
+{
+	kern_return_t kr = KERN_SUCCESS;
+	thread_t thread = current_thread();
+
+	assert(copy->size == copy_size);
+
+	/*
+	 * check for corrupted vm_map_copy structure
+	 *
+	 * vm_map_copyin_kernel_buffer() never builds a copy larger than
+	 * msg_ool_size_small and always sets the offset to 0, so anything
+	 * else is treated as fatal.
+	 */
+	if (copy_size > msg_ool_size_small || copy->offset) {
+		panic("Invalid vm_map_copy_t sz:%lld, ofst:%lld",
+		    (long long)copy->size, (long long)copy->offset);
+	}
+
+	if (!overwrite) {
+		/*
+		 * Allocate space in the target map for the data
+		 *
+		 * The address is chosen by vm_map_enter()
+		 * (VM_FLAGS_ANYWHERE) and the size is rounded up to the
+		 * map's page size.
+		 */
+		*addr = 0;
+		kr = vm_map_enter(map,
+		    addr,
+		    vm_map_round_page(copy_size,
+		    VM_MAP_PAGE_MASK(map)),
+		    (vm_map_offset_t) 0,
+		    VM_FLAGS_ANYWHERE,
+		    VM_MAP_KERNEL_FLAGS_NONE,
+		    VM_KERN_MEMORY_NONE,
+		    VM_OBJECT_NULL,
+		    (vm_object_offset_t) 0,
+		    FALSE,
+		    VM_PROT_DEFAULT,
+		    VM_PROT_ALL,
+		    VM_INHERIT_DEFAULT);
+		if (kr != KERN_SUCCESS) {
+			return kr;
+		}
+#if KASAN
+		if (map->pmap == kernel_pmap) {
+			kasan_notify_address(*addr, copy->size);
+		}
+#endif
+	}
+
+	/*
+	 * Copyout the data from the kernel buffer to the target map.
+	 */
+	if (thread->map == map) {
+		/*
+		 * If the target map is the current map, just do
+		 * the copy.
+		 */
+		assert((vm_size_t)copy_size == copy_size);
+		if (copyout(copy->cpy_kdata, *addr, (vm_size_t)copy_size)) {
+			kr = KERN_INVALID_ADDRESS;
+		}
+	} else {
+		vm_map_t oldmap;
+
+		/*
+		 * If the target map is another map, assume the
+		 * target's address space identity for the duration
+		 * of the copy.
+		 *
+		 * A reference on the target map is held across the
+		 * switch and dropped once the original map has been
+		 * switched back in.
+		 */
+		vm_map_reference(map);
+		oldmap = vm_map_switch(map);
+
+		assert((vm_size_t)copy_size == copy_size);
+		if (copyout(copy->cpy_kdata, *addr, (vm_size_t)copy_size)) {
+			vm_map_copyout_kernel_buffer_failures++;
+			kr = KERN_INVALID_ADDRESS;
+		}
+
+		(void) vm_map_switch(oldmap);
+		vm_map_deallocate(map);
+	}
+
+	if (kr != KERN_SUCCESS) {
+		/* the copy failed, clean up */
+		if (!overwrite) {
+			/*
+			 * Deallocate the space we allocated in the target map.
+			 * *addr is cleared afterwards so the caller is not
+			 * handed the address of the removed range.
+			 */
+			(void) vm_map_remove(
+				map,
+				vm_map_trunc_page(*addr,
+				VM_MAP_PAGE_MASK(map)),
+				vm_map_round_page((*addr +
+				vm_map_round_page(copy_size,
+				VM_MAP_PAGE_MASK(map))),
+				VM_MAP_PAGE_MASK(map)),
+				VM_MAP_REMOVE_NO_FLAGS);
+			*addr = 0;
+		}
+	} else {
+		/*
+		 * copy was successful, discard the copy structure
+		 * (only if the caller asked for it to be consumed).
+		 * The size passed to kfree() matches the kalloc() size
+		 * used by vm_map_copyin_kernel_buffer().
+		 */
+		if (consume_on_success) {
+			kfree(copy, copy_size + cpy_kdata_hdr_sz);
+		}
+	}
+
+	return kr;
+}
+
+/*
+ *	Routine:	vm_map_copy_insert      [internal use only]
+ *
+ *	Description:
+ *		Link a copy chain ("copy") into a map at the
+ *		specified location (after "after_where").
+ *
+ *		Entries are moved one at a time from the head of the
+ *		copy's list, each one being linked after the previously
+ *		inserted entry, so their relative order is preserved.
+ *		The entries themselves are not reallocated.
+ *	Side effects:
+ *		The copy chain is destroyed: every entry is unlinked
+ *		from it and the copy header is returned to
+ *		vm_map_copy_zone.
+ *
+ *	In this file, vm_map_copyout_internal() calls this routine
+ *	while holding the destination map lock.
+ */
+static void
+vm_map_copy_insert(
+	vm_map_t        map,
+	vm_map_entry_t  after_where,
+	vm_map_copy_t   copy)
+{
+	vm_map_entry_t  entry;
+
+	while (vm_map_copy_first_entry(copy) != vm_map_copy_to_entry(copy)) {
+		entry = vm_map_copy_first_entry(copy);
+		vm_map_copy_entry_unlink(copy, entry);
+		vm_map_store_entry_link(map, after_where, entry,
+		    VM_MAP_KERNEL_FLAGS_NONE);
+		after_where = entry; /* keep appending after the entry just linked */
+	}
+	zfree(vm_map_copy_zone, copy); /* list is empty now; only the header is left to free */
+}
+/*
+ *	Routine:	vm_map_copy_remap
+ *
+ *	Description:
+ *		Insert duplicates of the entries of a copy chain
+ *		("copy") into a map, after the entry "where", leaving
+ *		the copy itself untouched.
+ *
+ *		For each copy entry a new map entry is created, filled
+ *		in from the copy entry, shifted by "adjustment", and
+ *		given the caller's cur_prot, max_prot and inheritance
+ *		together with VM_BEHAVIOR_DEFAULT.  An additional
+ *		reference is taken on the entry's submap or VM object
+ *		for the new map entry.
+ *
+ *	In this file, vm_map_copyout_internal() uses this routine
+ *	(with the destination map locked) when it is not allowed to
+ *	consume the copy.
+ */
+void
+vm_map_copy_remap(
+	vm_map_t        map,
+	vm_map_entry_t  where,
+	vm_map_copy_t   copy,
+	vm_map_offset_t adjustment,
+	vm_prot_t       cur_prot,
+	vm_prot_t       max_prot,
+	vm_inherit_t    inheritance)
+{
+	vm_map_entry_t  copy_entry, new_entry;
+
+	for (copy_entry = vm_map_copy_first_entry(copy);
+	    copy_entry != vm_map_copy_to_entry(copy);
+	    copy_entry = copy_entry->vme_next) {
+		/* get a new VM map entry for the map */
+		new_entry = vm_map_entry_create(map,
+		    !map->hdr.entries_pageable);
+		/* copy the "copy entry" to the new entry */
+		vm_map_entry_copy(new_entry, copy_entry);
+		/* adjust "start" and "end" */
+		new_entry->vme_start += adjustment;
+		new_entry->vme_end += adjustment;
+		/*
+		 * override some attributes: inheritance and protections
+		 * come from the caller, behavior is reset to the default
+		 */
+		new_entry->inheritance = inheritance;
+		new_entry->protection = cur_prot;
+		new_entry->max_protection = max_prot;
+		new_entry->behavior = VM_BEHAVIOR_DEFAULT;
+		/*
+		 * take an extra reference on the entry's "object"
+		 * (the copy entry keeps referring to the same submap or
+		 * VM object as the new map entry)
+		 */
+		if (new_entry->is_sub_map) {
+			assert(!new_entry->use_pmap); /* not nested */
+			vm_map_lock(VME_SUBMAP(new_entry));
+			vm_map_reference(VME_SUBMAP(new_entry));
+			vm_map_unlock(VME_SUBMAP(new_entry));
+		} else {
+			vm_object_reference(VME_OBJECT(new_entry));
+		}
+		/* insert the new entry in the map */
+		vm_map_store_entry_link(map, where, new_entry,
+		    VM_MAP_KERNEL_FLAGS_NONE);
+		/* continue inserting the "copy entries" after the new entry */
+		where = new_entry;
+	}
+}
+
+
+/*
+ * Returns true if *size matches (or is in the range of) copy->size.
+ * Upon returning true, the *size field is updated with the actual size of the
+ * copy object (may be different for VM_MAP_COPY_ENTRY_LIST types)
+ *
+ * Rules per copy type:
+ *	VM_MAP_COPY_OBJECT, VM_MAP_COPY_KERNEL_BUFFER:
+ *		*size must be exactly copy->size (so *size is left as is).
+ *	VM_MAP_COPY_ENTRY_LIST:
+ *		copy->size must lie between *size and *size rounded up to
+ *		dst_map's page size, both inclusive; *size is then set to
+ *		copy->size.
+ *	any other type:
+ *		rejected.
+ *
+ * A null copy is rejected (FALSE) without touching *size.
+ */
+boolean_t
+vm_map_copy_validate_size(
+	vm_map_t                dst_map,
+	vm_map_copy_t           copy,
+	vm_map_size_t           *size)
+{
+	if (copy == VM_MAP_COPY_NULL) {
+		return FALSE;
+	}
+	vm_map_size_t copy_sz = copy->size;
+	vm_map_size_t sz = *size;
+	switch (copy->type) {
+	case VM_MAP_COPY_OBJECT:
+	case VM_MAP_COPY_KERNEL_BUFFER:
+		if (sz == copy_sz) {
+			return TRUE;
+		}
+		break;
+	case VM_MAP_COPY_ENTRY_LIST:
+		/*
+		 * potential page-size rounding prevents us from exactly
+		 * validating this flavor of vm_map_copy, but we can at least
+		 * assert that it's within a range.
+		 */
+		if (copy_sz >= sz &&
+		    copy_sz <= vm_map_round_page(sz, VM_MAP_PAGE_MASK(dst_map))) {
+			*size = copy_sz;
+			return TRUE;
+		}
+		break;
+	default:
+		break;
+	}
+	return FALSE;
+}
+
+/*
+ *	Routine:	vm_map_copyout_size
+ *
+ *	Description:
+ *		Copy out a copy chain ("copy") into newly-allocated
+ *		space in the destination map. Uses a prevalidated
+ *		size for the copy object (vm_map_copy_validate_size).
+ *
+ *		If successful, consumes the copy object.
+ *		Otherwise, the caller is responsible for it.
+ *
+ *		This is vm_map_copyout_internal() with the caller's
+ *		copy_size, consume_on_success set, and the default
+ *		protections and inheritance.  vm_map_copyout_internal()
+ *		fails with KERN_FAILURE if copy_size differs from
+ *		copy->size.
+ */
+kern_return_t
+vm_map_copyout_size(
+	vm_map_t                dst_map,
+	vm_map_address_t        *dst_addr,      /* OUT */
+	vm_map_copy_t           copy,
+	vm_map_size_t           copy_size)
+{
+	return vm_map_copyout_internal(dst_map, dst_addr, copy, copy_size,
+	           TRUE,                     /* consume_on_success */
+	           VM_PROT_DEFAULT,
+	           VM_PROT_ALL,
+	           VM_INHERIT_DEFAULT);
+}
+
+/*
+ *	Routine:	vm_map_copyout
+ *
+ *	Description:
+ *		Copy out a copy chain ("copy") into newly-allocated
+ *		space in the destination map.
+ *
+ *		If successful, consumes the copy object.
+ *		Otherwise, the caller is responsible for it.
+ *
+ *		This is vm_map_copyout_internal() with the copy's own
+ *		size (0 for a null copy, which is never dereferenced),
+ *		consume_on_success set, and the default protections and
+ *		inheritance.
+ */
+kern_return_t
+vm_map_copyout(
+	vm_map_t                dst_map,
+	vm_map_address_t        *dst_addr,      /* OUT */
+	vm_map_copy_t           copy)
+{
+	return vm_map_copyout_internal(dst_map, dst_addr, copy, copy ? copy->size : 0,
+	           TRUE,                     /* consume_on_success */
+	           VM_PROT_DEFAULT,
+	           VM_PROT_ALL,
+	           VM_INHERIT_DEFAULT);
+}
+/*
+ *	Routine:	vm_map_copyout_internal
+ *
+ *	Description:
+ *		Common implementation behind vm_map_copyout() and
+ *		vm_map_copyout_size(): place the contents of "copy"
+ *		into newly-allocated space in "dst_map" and return the
+ *		resulting address in "*dst_addr".
+ *
+ *		A null copy yields *dst_addr = 0 and KERN_SUCCESS.
+ *		copy_size must equal copy->size; otherwise *dst_addr is
+ *		set to 0 and KERN_FAILURE is returned.
+ *
+ *		The three copy flavors are handled as follows:
+ *		VM_MAP_COPY_OBJECT
+ *			the object is entered into the map with
+ *			vm_map_enter();
+ *		VM_MAP_COPY_KERNEL_BUFFER
+ *			delegated to vm_map_copyout_kernel_buffer();
+ *		otherwise (entry list)
+ *			a free range is searched for in dst_map and the
+ *			copy's entries are either moved into the map
+ *			(consume_on_success) or duplicated into it
+ *			(!consume_on_success).
+ *
+ *		cur_protection, max_protection and inheritance are only
+ *		passed on to vm_map_copy_remap(), i.e. they only take
+ *		effect for an entry-list copy that is not consumed.
+ *		Every other path uses VM_PROT_DEFAULT, VM_PROT_ALL and
+ *		VM_INHERIT_DEFAULT.
+ *
+ *	Returns:
+ *		KERN_SUCCESS, KERN_FAILURE (size mismatch),
+ *		KERN_NO_SPACE (no suitable free range), or the error
+ *		from vm_map_enter() / vm_map_copyout_kernel_buffer().
+ */
+kern_return_t
+vm_map_copyout_internal(
+	vm_map_t                dst_map,
+	vm_map_address_t        *dst_addr,      /* OUT */
+	vm_map_copy_t           copy,
+	vm_map_size_t           copy_size,
+	boolean_t               consume_on_success,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_inherit_t            inheritance)
+{
+	vm_map_size_t           size;
+	vm_map_size_t           adjustment;
+	vm_map_offset_t         start;
+	vm_object_offset_t      vm_copy_start;
+	vm_map_entry_t          last;
+	vm_map_entry_t          entry;
+	vm_map_entry_t          hole_entry;
+
+	/*
+	 *	Check for null copy object.
+	 */
+
+	if (copy == VM_MAP_COPY_NULL) {
+		*dst_addr = 0;
+		return KERN_SUCCESS;
+	}
+
+	if (copy->size != copy_size) {
+		*dst_addr = 0;
+		return KERN_FAILURE;
+	}
+
+	/*
+	 *	Check for special copy object, created
+	 *	by vm_map_copyin_object.
+	 *
+	 *	The object is entered at its page-truncated offset and
+	 *	the sub-page part of copy->offset is added back to the
+	 *	returned address.
+	 */
+
+	if (copy->type == VM_MAP_COPY_OBJECT) {
+		vm_object_t             object = copy->cpy_object;
+		kern_return_t           kr;
+		vm_object_offset_t      offset;
+
+		offset = vm_object_trunc_page(copy->offset);
+		size = vm_map_round_page((copy_size +
+		    (vm_map_size_t)(copy->offset -
+		    offset)),
+		    VM_MAP_PAGE_MASK(dst_map));
+		*dst_addr = 0;
+		kr = vm_map_enter(dst_map, dst_addr, size,
+		    (vm_map_offset_t) 0, VM_FLAGS_ANYWHERE,
+		    VM_MAP_KERNEL_FLAGS_NONE,
+		    VM_KERN_MEMORY_NONE,
+		    object, offset, FALSE,
+		    VM_PROT_DEFAULT, VM_PROT_ALL,
+		    VM_INHERIT_DEFAULT);
+		if (kr != KERN_SUCCESS) {
+			return kr;
+		}
+		/* Account for non-pagealigned copy object */
+		*dst_addr += (vm_map_offset_t)(copy->offset - offset);
+		if (consume_on_success) {
+			zfree(vm_map_copy_zone, copy);
+		}
+		return KERN_SUCCESS;
+	}
+
+	/*
+	 *	Check for special kernel buffer allocated
+	 *	by new_ipc_kmsg_copyin.
+	 *
+	 *	(In this file, copies of this type are built by
+	 *	vm_map_copyin_kernel_buffer().)
+	 */
+
+	if (copy->type == VM_MAP_COPY_KERNEL_BUFFER) {
+		return vm_map_copyout_kernel_buffer(dst_map, dst_addr,
+		           copy, copy_size, FALSE,
+		           consume_on_success);
+	}
+
+
+	/*
+	 *	Find space for the data
+	 *
+	 *	"size" is the length of the page-rounded range covering
+	 *	[copy->offset, copy->offset + copy_size), computed with
+	 *	the copy's own page mask.
+	 */
+
+	vm_copy_start = vm_map_trunc_page((vm_map_size_t)copy->offset,
+	    VM_MAP_COPY_PAGE_MASK(copy));
+	size = vm_map_round_page((vm_map_size_t)copy->offset + copy_size,
+	    VM_MAP_COPY_PAGE_MASK(copy))
+	    - vm_copy_start;
+
+
+StartAgain:;
+
+	vm_map_lock(dst_map);
+	if (dst_map->disable_vmentry_reuse == TRUE) {
+		VM_MAP_HIGHEST_ENTRY(dst_map, entry, start);
+		last = entry;
+	} else {
+		if (dst_map->holelistenabled) {
+			hole_entry = CAST_TO_VM_MAP_ENTRY(dst_map->holes_list);
+
+			if (hole_entry == NULL) {
+				/*
+				 * No more space in the map?
+				 */
+				vm_map_unlock(dst_map);
+				return KERN_NO_SPACE;
+			}
+
+			last = hole_entry;
+			start = last->vme_start;
+		} else {
+			assert(first_free_is_valid(dst_map));
+			start = ((last = dst_map->first_free) == vm_map_to_entry(dst_map)) ?
+			    vm_map_min(dst_map) : last->vme_end;
+		}
+		start = vm_map_round_page(start,
+		    VM_MAP_PAGE_MASK(dst_map));
+	}
+
+	while (TRUE) {
+		vm_map_entry_t  next = last->vme_next;
+		vm_map_offset_t end = start + size;
+
+		if ((end > dst_map->max_offset) || (end < start)) {
+			if (dst_map->wait_for_space) {
+				if (size <= (dst_map->max_offset - dst_map->min_offset)) {
+					assert_wait((event_t) dst_map,
+					    THREAD_INTERRUPTIBLE);
+					vm_map_unlock(dst_map);
+					thread_block(THREAD_CONTINUE_NULL);
+					goto StartAgain;
+				}
+			}
+			vm_map_unlock(dst_map);
+			return KERN_NO_SPACE;
+		}
+
+		if (dst_map->holelistenabled) {
+			if (last->vme_end >= end) {
+				break;
+			}
+		} else {
+			/*
+			 *	If there are no more entries, we must win.
+			 *
+			 *	OR
+			 *
+			 *	If there is another entry, it must be
+			 *	after the end of the potential new region.
+			 */
+
+			if (next == vm_map_to_entry(dst_map)) {
+				break;
+			}
+
+			if (next->vme_start >= end) {
+				break;
+			}
+		}
+
+		last = next;
+
+		if (dst_map->holelistenabled) {
+			if (last == CAST_TO_VM_MAP_ENTRY(dst_map->holes_list)) {
+				/*
+				 * Wrapped around
+				 */
+				vm_map_unlock(dst_map);
+				return KERN_NO_SPACE;
+			}
+			start = last->vme_start;
+		} else {
+			start = last->vme_end;
+		}
+		start = vm_map_round_page(start,
+		    VM_MAP_PAGE_MASK(dst_map));
+	}
+
+	if (dst_map->holelistenabled) {
+		if (vm_map_lookup_entry(dst_map, last->vme_start, &last)) {
+			panic("Found an existing entry (%p) instead of potential hole at address: 0x%llx.\n", last, (unsigned long long)last->vme_start);
+		}
+	}
+
+
+	adjustment = start - vm_copy_start;
+	if (!consume_on_success) {
+		/*
+		 * We're not allowed to consume "copy", so we'll have to
+		 * copy its map entries into the destination map below.
+		 * No need to re-allocate map entries from the correct
+		 * (pageable or not) zone, since we'll get new map entries
+		 * during the transfer.
+		 * We'll also adjust the map entries' "start" and "end"
+		 * during the transfer, to keep "copy"'s entries consistent
+		 * with its "offset".
+		 */
+		goto after_adjustments;
+	}
+
+	/*
+	 *	Since we're going to just drop the map
+	 *	entries from the copy into the destination
+	 *	map, they must come from the same pool.
+	 */
+
+	if (copy->cpy_hdr.entries_pageable != dst_map->hdr.entries_pageable) {
+		/*
+		 * Mismatches occur when dealing with the default
+		 * pager.
+		 */
+		zone_t          old_zone;
+		vm_map_entry_t  next, new;
+
+		/*
+		 * Find the zone that the copies were allocated from
+		 */
+
+		entry = vm_map_copy_first_entry(copy);
+
+		/*
+		 * Reinitialize the copy so that vm_map_copy_entry_link
+		 * will work.
+		 */
+		vm_map_store_copy_reset(copy, entry);
+		copy->cpy_hdr.entries_pageable = dst_map->hdr.entries_pageable;
+
+		/*
+		 * Copy each entry.
+		 */
+		while (entry != vm_map_copy_to_entry(copy)) {
+			new = vm_map_copy_entry_create(copy, !copy->cpy_hdr.entries_pageable);
+			vm_map_entry_copy_full(new, entry);
+			new->vme_no_copy_on_read = FALSE;
+			assert(!new->iokit_acct);
+			if (new->is_sub_map) {
+				/* clr address space specifics */
+				new->use_pmap = FALSE;
+			}
+			vm_map_copy_entry_link(copy,
+			    vm_map_copy_last_entry(copy),
+			    new);
+			next = entry->vme_next;
+			old_zone = entry->from_reserved_zone ? vm_map_entry_reserved_zone : vm_map_entry_zone;
+			zfree(old_zone, entry);
+			entry = next;
+		}
+	}
+
+	/*
+	 *	Adjust the addresses in the copy chain, and
+	 *	reset the region attributes.
+	 */
+
+	for (entry = vm_map_copy_first_entry(copy);
+	    entry != vm_map_copy_to_entry(copy);
+	    entry = entry->vme_next) {
+		if (VM_MAP_PAGE_SHIFT(dst_map) == PAGE_SHIFT) {
+			/*
+			 * We're injecting this copy entry into a map that
+			 * has the standard page alignment, so clear
+			 * "map_aligned" (which might have been inherited
+			 * from the original map entry).
+			 */
+			entry->map_aligned = FALSE;
+		}
+
+		entry->vme_start += adjustment;
+		entry->vme_end += adjustment;
+
+		if (entry->map_aligned) {
+			assert(VM_MAP_PAGE_ALIGNED(entry->vme_start,
+			    VM_MAP_PAGE_MASK(dst_map)));
+			assert(VM_MAP_PAGE_ALIGNED(entry->vme_end,
+			    VM_MAP_PAGE_MASK(dst_map)));
+		}
+
+		entry->inheritance = VM_INHERIT_DEFAULT;
+		entry->protection = VM_PROT_DEFAULT;
+		entry->max_protection = VM_PROT_ALL;
+		entry->behavior = VM_BEHAVIOR_DEFAULT;
+
+		/*
+		 * If the entry is now wired,
+		 * map the pages into the destination map.
+		 */
+		if (entry->wired_count != 0) {
+			vm_map_offset_t va;
+			vm_object_offset_t       offset;
+			vm_object_t object;
+			vm_prot_t prot;
+			int     type_of_fault;
+
+			object = VME_OBJECT(entry);
+			offset = VME_OFFSET(entry);
+			va = entry->vme_start;
+
+			pmap_pageable(dst_map->pmap,
+			    entry->vme_start,
+			    entry->vme_end,
+			    TRUE);
+
+			while (va < entry->vme_end) {
+				vm_page_t       m;
+				struct vm_object_fault_info fault_info = {};
+
+				/*
+				 * Look up the page in the object.
+				 * Assert that the page will be found in the
+				 * top object:
+				 * either
+				 *	the object was newly created by
+				 *	vm_object_copy_slowly, and has
+				 *	copies of all of the pages from
+				 *	the source object
+				 * or
+				 *	the object was moved from the old
+				 *	map entry; because the old map
+				 *	entry was wired, all of the pages
+				 *	were in the top-level object.
+				 *	(XXX not true if we wire pages for
+				 *	 reading)
+				 */
+				vm_object_lock(object);
+
+				m = vm_page_lookup(object, offset);
+				if (m == VM_PAGE_NULL || !VM_PAGE_WIRED(m) ||
+				    m->vmp_absent) {
+					panic("vm_map_copyout: wiring %p", m);
+				}
+
+				prot = entry->protection;
+
+				if (override_nx(dst_map, VME_ALIAS(entry)) &&
+				    prot) {
+					prot |= VM_PROT_EXECUTE;
+				}
+
+				type_of_fault = DBG_CACHE_HIT_FAULT;
+
+				fault_info.user_tag = VME_ALIAS(entry);
+				fault_info.pmap_options = 0;
+				if (entry->iokit_acct ||
+				    (!entry->is_sub_map && !entry->use_pmap)) {
+					fault_info.pmap_options |= PMAP_OPTIONS_ALT_ACCT;
+				}
+
+				vm_fault_enter(m,
+				    dst_map->pmap,
+				    va,
+				    prot,
+				    prot,
+				    VM_PAGE_WIRED(m),
+				    FALSE,            /* change_wiring */
+				    VM_KERN_MEMORY_NONE,            /* tag - not wiring */
+				    &fault_info,
+				    NULL,             /* need_retry */
+				    &type_of_fault);
+
+				vm_object_unlock(object);
+
+				offset += PAGE_SIZE_64;
+				va += PAGE_SIZE;
+			}
+		}
+	}
+
+after_adjustments:
+
+	/*
+	 *	Correct the page alignment for the result
+	 *
+	 *	"start" is the beginning of the chosen range; the
+	 *	distance between copy->offset and its page-truncated
+	 *	value is added back so *dst_addr points at the data.
+	 */
+
+	*dst_addr = start + (copy->offset - vm_copy_start);
+
+#if KASAN
+	kasan_notify_address(*dst_addr, size);
+#endif
+
+	/*
+	 *	Update the hints and the map size
+	 */
+
+	if (consume_on_success) {
+		SAVE_HINT_MAP_WRITE(dst_map, vm_map_copy_last_entry(copy));
+	} else {
+		SAVE_HINT_MAP_WRITE(dst_map, last);
+	}
+
+	dst_map->size += size;
+
+	/*
+	 *	Link in the copy
+	 *
+	 *	Either move the copy's entries into the map (which also
+	 *	frees the copy header) or insert adjusted duplicates of
+	 *	them and leave the copy to the caller.
+	 */
+
+	if (consume_on_success) {
+		vm_map_copy_insert(dst_map, last, copy);
+	} else {
+		vm_map_copy_remap(dst_map, last, copy, adjustment,
+		    cur_protection, max_protection,
+		    inheritance);
+	}
+
+	vm_map_unlock(dst_map);
+
+	/*
+	 * XXX	If wiring_required, call vm_map_pageable
+	 */
+
+	return KERN_SUCCESS;
+}
+
+/*
+ *	Routine:	vm_map_copyin
+ *
+ *	Description:
+ *		see vm_map_copyin_common.  Exported via Unsupported.exports.
+ *
+ *		Calls vm_map_copyin_common() with src_volatile and
+ *		use_maxprot both FALSE.
+ *
+ *		NOTE(review): the #undef below presumably removes a
+ *		macro of the same name defined in a header, so that a
+ *		real function can be defined here -- confirm against
+ *		the header.
+ */
+
+#undef vm_map_copyin
+
+kern_return_t
+vm_map_copyin(
+	vm_map_t                        src_map,
+	vm_map_address_t        src_addr,
+	vm_map_size_t           len,
+	boolean_t                       src_destroy,
+	vm_map_copy_t           *copy_result)   /* OUT */
+{
+	return vm_map_copyin_common(src_map, src_addr, len, src_destroy,
+	           FALSE, copy_result, FALSE);
+}
+
+/*
+ *	Routine:	vm_map_copyin_common
+ *
+ *	Description:
+ *		Copy the specified region (src_addr, len) from the
+ *		source address space (src_map), possibly removing
+ *		the region from the source address space (src_destroy).
+ *
+ *		This routine only translates its boolean arguments
+ *		into flags for vm_map_copyin_internal():
+ *			src_destroy -> VM_MAP_COPYIN_SRC_DESTROY
+ *			use_maxprot -> VM_MAP_COPYIN_USE_MAXPROT
+ *		src_volatile is unused.
+ *
+ *	Returns:
+ *		A vm_map_copy_t object (copy_result), suitable for
+ *		insertion into another address space (using vm_map_copyout),
+ *		copying over another address space region (using
+ *		vm_map_copy_overwrite).  If the copy is unused, it
+ *		should be destroyed (using vm_map_copy_discard).
+ *
+ *	In/out conditions:
+ *		The source map should not be locked on entry.
+ *
+ *	The submap_map_t type declared below is used by
+ *	vm_map_copyin_internal() to record each parent map it leaves
+ *	when it descends into a submap.
+ */
+
+typedef struct submap_map {
+	vm_map_t        parent_map;     /* map that was being walked when the submap was entered */
+	vm_map_offset_t base_start;     /* src_start in parent_map at that point */
+	vm_map_offset_t base_end;       /* src_end in parent_map at that point */
+	vm_map_size_t   base_len;       /* length of the range being copied through the submap */
+	struct submap_map *next;        /* previously recorded parent (list head is the most recent) */
+} submap_map_t;
+
+kern_return_t
+vm_map_copyin_common(
+	vm_map_t        src_map,
+	vm_map_address_t src_addr,
+	vm_map_size_t   len,
+	boolean_t       src_destroy,
+	__unused boolean_t      src_volatile,
+	vm_map_copy_t   *copy_result,   /* OUT */
+	boolean_t       use_maxprot)
+{
+	int flags;
+
+	flags = 0;
+	if (src_destroy) {
+		flags |= VM_MAP_COPYIN_SRC_DESTROY;
+	}
+	if (use_maxprot) {
+		flags |= VM_MAP_COPYIN_USE_MAXPROT;
+	}
+	return vm_map_copyin_internal(src_map,
+	           src_addr,
+	           len,
+	           flags,
+	           copy_result);
+}
+kern_return_t
+vm_map_copyin_internal(
+	vm_map_t        src_map,
+	vm_map_address_t src_addr,
+	vm_map_size_t   len,
+	int             flags,
+	vm_map_copy_t   *copy_result)   /* OUT */
+{
+	vm_map_entry_t  tmp_entry;      /* Result of last map lookup --
+	                                 * in multi-level lookup, this
+	                                 * entry contains the actual
+	                                 * vm_object/offset.
+	                                 */
+	vm_map_entry_t  new_entry = VM_MAP_ENTRY_NULL;  /* Map entry for copy */
+
+	vm_map_offset_t src_start;      /* Start of current entry --
+	                                 * where copy is taking place now
+	                                 */
+	vm_map_offset_t src_end;        /* End of entire region to be
+	                                 * copied */
+	vm_map_offset_t src_base;
+	vm_map_t        base_map = src_map;
+	boolean_t       map_share = FALSE;
+	submap_map_t    *parent_maps = NULL;
+
+	vm_map_copy_t   copy;           /* Resulting copy */
+	vm_map_address_t copy_addr;
+	vm_map_size_t   copy_size;
+	boolean_t       src_destroy;
+	boolean_t       use_maxprot;
+	boolean_t       preserve_purgeable;
+	boolean_t       entry_was_shared;
+	vm_map_entry_t  saved_src_entry;
+
+	if (flags & ~VM_MAP_COPYIN_ALL_FLAGS) {
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	src_destroy = (flags & VM_MAP_COPYIN_SRC_DESTROY) ? TRUE : FALSE;
+	use_maxprot = (flags & VM_MAP_COPYIN_USE_MAXPROT) ? TRUE : FALSE;
+	preserve_purgeable =
+	    (flags & VM_MAP_COPYIN_PRESERVE_PURGEABLE) ? TRUE : FALSE;
+
+	/*
+	 *	Check for copies of zero bytes.
+	 */
+
+	if (len == 0) {
+		*copy_result = VM_MAP_COPY_NULL;
+		return KERN_SUCCESS;
+	}
+
+	/*
+	 *	Check that the end address doesn't overflow
+	 */
+	src_end = src_addr + len;
+	if (src_end < src_addr) {
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/*
+	 *	Compute (page aligned) start and end of region
+	 */
+	src_start = vm_map_trunc_page(src_addr,
+	    VM_MAP_PAGE_MASK(src_map));
+	src_end = vm_map_round_page(src_end,
+	    VM_MAP_PAGE_MASK(src_map));
+
+	/*
+	 * If the copy is sufficiently small, use a kernel buffer instead
+	 * of making a virtual copy.  The theory being that the cost of
+	 * setting up VM (and taking C-O-W faults) dominates the copy costs
+	 * for small regions.
+	 */
+	if ((len < msg_ool_size_small) &&
+	    !use_maxprot &&
+	    !preserve_purgeable &&
+	    !(flags & VM_MAP_COPYIN_ENTRY_LIST) &&
+	    /*
+	     * Since the "msg_ool_size_small" threshold was increased and
+	     * vm_map_copyin_kernel_buffer() doesn't handle accesses beyond the
+	     * address space limits, we revert to doing a virtual copy if the
+	     * copied range goes beyond those limits.  Otherwise, mach_vm_read()
+	     * of the commpage would now fail when it used to work.
+	     */
+	    (src_start >= vm_map_min(src_map) &&
+	    src_start < vm_map_max(src_map) &&
+	    src_end >= vm_map_min(src_map) &&
+	    src_end < vm_map_max(src_map))) {
+		return vm_map_copyin_kernel_buffer(src_map, src_addr, len,
+		           src_destroy, copy_result);
+	}
+
+	/*
+	 *	Allocate a header element for the list.
+	 *
+	 *	Use the start and end in the header to
+	 *	remember the endpoints prior to rounding.
+	 */
+
+	copy = vm_map_copy_allocate();
+	copy->type = VM_MAP_COPY_ENTRY_LIST;
+	copy->cpy_hdr.entries_pageable = TRUE;
+#if 00
+	copy->cpy_hdr.page_shift = src_map->hdr.page_shift;
+#else
+	/*
+	 * The copy entries can be broken down for a variety of reasons,
+	 * so we can't guarantee that they will remain map-aligned...
+	 * Will need to adjust the first copy_entry's "vme_start" and
+	 * the last copy_entry's "vme_end" to be rounded to PAGE_MASK
+	 * rather than the original map's alignment.
+	 */
+	copy->cpy_hdr.page_shift = PAGE_SHIFT;
+#endif
+
+	vm_map_store_init( &(copy->cpy_hdr));
+
+	copy->offset = src_addr;
+	copy->size = len;
+
+	new_entry = vm_map_copy_entry_create(copy, !copy->cpy_hdr.entries_pageable);
+
+#define RETURN(x)                                               \
+	MACRO_BEGIN                                             \
+	vm_map_unlock(src_map);                                 \
+	if(src_map != base_map)                                 \
+	        vm_map_deallocate(src_map);                     \
+	if (new_entry != VM_MAP_ENTRY_NULL)                     \
+	        vm_map_copy_entry_dispose(copy,new_entry);      \
+	vm_map_copy_discard(copy);                              \
+	{                                                       \
+	        submap_map_t	*_ptr;                          \
+                                                                \
+	        for(_ptr = parent_maps; _ptr != NULL; _ptr = parent_maps) { \
+	                parent_maps=parent_maps->next;          \
+	                if (_ptr->parent_map != base_map)       \
+	                        vm_map_deallocate(_ptr->parent_map);    \
+	                kfree(_ptr, sizeof(submap_map_t));      \
+	        }                                               \
+	}                                                       \
+	MACRO_RETURN(x);                                        \
+	MACRO_END
+
+	/*
+	 *	Find the beginning of the region.
+	 */
+
+	vm_map_lock(src_map);
+
+	/*
+	 * Lookup the original "src_addr" rather than the truncated
+	 * "src_start", in case "src_start" falls in a non-map-aligned
+	 * map entry *before* the map entry that contains "src_addr"...
+	 */
+	if (!vm_map_lookup_entry(src_map, src_addr, &tmp_entry)) {
+		RETURN(KERN_INVALID_ADDRESS);
+	}
+	if (!tmp_entry->is_sub_map) {
+		/*
+		 * ... but clip to the map-rounded "src_start" rather than
+		 * "src_addr" to preserve map-alignment.  We'll adjust the
+		 * first copy entry at the end, if needed.
+		 */
+		vm_map_clip_start(src_map, tmp_entry, src_start);
+	}
+	if (src_start < tmp_entry->vme_start) {
+		/*
+		 * Move "src_start" up to the start of the
+		 * first map entry to copy.
+		 */
+		src_start = tmp_entry->vme_start;
+	}
+	/* set for later submap fix-up */
+	copy_addr = src_start;
+
+	/*
+	 *	Go through entries until we get to the end.
+	 */
+
+	while (TRUE) {
+		vm_map_entry_t  src_entry = tmp_entry;  /* Top-level entry */
+		vm_map_size_t   src_size;               /* Size of source
+		                                         * map entry (in both
+		                                         * maps)
+		                                         */
+
+		vm_object_t             src_object;     /* Object to copy */
+		vm_object_offset_t      src_offset;
+
+		boolean_t       src_needs_copy;         /* Should source map
+		                                         * be made read-only
+		                                         * for copy-on-write?
+		                                         */
+
+		boolean_t       new_entry_needs_copy;   /* Will new entry be COW? */
+
+		boolean_t       was_wired;              /* Was source wired? */
+		vm_map_version_t version;               /* Version before locks
+		                                         * dropped to make copy
+		                                         */
+		kern_return_t   result;                 /* Return value from
+		                                         * copy_strategically.
+		                                         */
+		while (tmp_entry->is_sub_map) {
+			vm_map_size_t submap_len;
+			submap_map_t *ptr;
+
+			ptr = (submap_map_t *)kalloc(sizeof(submap_map_t));
+			ptr->next = parent_maps;
+			parent_maps = ptr;
+			ptr->parent_map = src_map;
+			ptr->base_start = src_start;
+			ptr->base_end = src_end;
+			submap_len = tmp_entry->vme_end - src_start;
+			if (submap_len > (src_end - src_start)) {
+				submap_len = src_end - src_start;
+			}
+			ptr->base_len = submap_len;
+
+			src_start -= tmp_entry->vme_start;
+			src_start += VME_OFFSET(tmp_entry);
+			src_end = src_start + submap_len;
+			src_map = VME_SUBMAP(tmp_entry);
+			vm_map_lock(src_map);
+			/* keep an outstanding reference for all maps in */
+			/* the parents tree except the base map */
+			vm_map_reference(src_map);
+			vm_map_unlock(ptr->parent_map);
+			if (!vm_map_lookup_entry(
+				    src_map, src_start, &tmp_entry)) {
+				RETURN(KERN_INVALID_ADDRESS);
+			}
+			map_share = TRUE;
+			if (!tmp_entry->is_sub_map) {
+				vm_map_clip_start(src_map, tmp_entry, src_start);
+			}
+			src_entry = tmp_entry;
+		}
+		/* we are now in the lowest level submap... */
+
+		if ((VME_OBJECT(tmp_entry) != VM_OBJECT_NULL) &&
+		    (VME_OBJECT(tmp_entry)->phys_contiguous)) {
+			/* This is not, supported for now.In future */
+			/* we will need to detect the phys_contig   */
+			/* condition and then upgrade copy_slowly   */
+			/* to do physical copy from the device mem  */
+			/* based object. We can piggy-back off of   */
+			/* the was wired boolean to set-up the      */
+			/* proper handling */
+			RETURN(KERN_PROTECTION_FAILURE);
+		}
+		/*
+		 *	Create a new address map entry to hold the result.
+		 *	Fill in the fields from the appropriate source entries.
+		 *	We must unlock the source map to do this if we need
+		 *	to allocate a map entry.
+		 */
+		if (new_entry == VM_MAP_ENTRY_NULL) {
+			version.main_timestamp = src_map->timestamp;
+			vm_map_unlock(src_map);
+
+			new_entry = vm_map_copy_entry_create(copy, !copy->cpy_hdr.entries_pageable);
+
+			vm_map_lock(src_map);
+			if ((version.main_timestamp + 1) != src_map->timestamp) {
+				if (!vm_map_lookup_entry(src_map, src_start,
+				    &tmp_entry)) {
+					RETURN(KERN_INVALID_ADDRESS);
+				}
+				if (!tmp_entry->is_sub_map) {
+					vm_map_clip_start(src_map, tmp_entry, src_start);
+				}
+				continue; /* restart w/ new tmp_entry */
+			}
+		}
+
+		/*
+		 *	Verify that the region can be read.
+		 */
+		if (((src_entry->protection & VM_PROT_READ) == VM_PROT_NONE &&
+		    !use_maxprot) ||
+		    (src_entry->max_protection & VM_PROT_READ) == 0) {
+			RETURN(KERN_PROTECTION_FAILURE);
+		}
+
+		/*
+		 *	Clip against the endpoints of the entire region.
+		 */
+
+		vm_map_clip_end(src_map, src_entry, src_end);
+
+		src_size = src_entry->vme_end - src_start;
+		src_object = VME_OBJECT(src_entry);
+		src_offset = VME_OFFSET(src_entry);
+		was_wired = (src_entry->wired_count != 0);
+
+		vm_map_entry_copy(new_entry, src_entry);
+		if (new_entry->is_sub_map) {
+			/* clr address space specifics */
+			new_entry->use_pmap = FALSE;
+		} else {
+			/*
+			 * We're dealing with a copy-on-write operation,
+			 * so the resulting mapping should not inherit the
+			 * original mapping's accounting settings.
+			 * "iokit_acct" should have been cleared in
+			 * vm_map_entry_copy().
+			 * "use_pmap" should be reset to its default (TRUE)
+			 * so that the new mapping gets accounted for in
+			 * the task's memory footprint.
+			 */
+			assert(!new_entry->iokit_acct);
+			new_entry->use_pmap = TRUE;
+		}
+
+		/*
+		 *	Attempt non-blocking copy-on-write optimizations.
+		 */
+
+		/*
+		 * If we are destroying the source, and the object
+		 * is internal, we could move the object reference
+		 * from the source to the copy.  The copy is
+		 * copy-on-write only if the source is.
+		 * We make another reference to the object, because
+		 * destroying the source entry will deallocate it.
+		 *
+		 * This memory transfer has to be atomic, (to prevent
+		 * the VM object from being shared or copied while
+		 * it's being moved here), so we could only do this
+		 * if we won't have to unlock the VM map until the
+		 * original mapping has been fully removed.
+		 */
+
+RestartCopy:
+		if ((src_object == VM_OBJECT_NULL ||
+		    (!was_wired && !map_share && !tmp_entry->is_shared)) &&
+		    vm_object_copy_quickly(
+			    VME_OBJECT_PTR(new_entry),
+			    src_offset,
+			    src_size,
+			    &src_needs_copy,
+			    &new_entry_needs_copy)) {
+			new_entry->needs_copy = new_entry_needs_copy;
+
+			/*
+			 *	Handle copy-on-write obligations
+			 */
+
+			if (src_needs_copy && !tmp_entry->needs_copy) {
+				vm_prot_t prot;
+
+				prot = src_entry->protection & ~VM_PROT_WRITE;
+
+				if (override_nx(src_map, VME_ALIAS(src_entry))
+				    && prot) {
+					prot |= VM_PROT_EXECUTE;
+				}
+
+				vm_object_pmap_protect(
+					src_object,
+					src_offset,
+					src_size,
+					(src_entry->is_shared ?
+					PMAP_NULL
+					: src_map->pmap),
+					src_entry->vme_start,
+					prot);
+
+				assert(tmp_entry->wired_count == 0);
+				tmp_entry->needs_copy = TRUE;
+			}
+
+			/*
+			 *	The map has never been unlocked, so it's safe
+			 *	to move to the next entry rather than doing
+			 *	another lookup.
+			 */
+
+			goto CopySuccessful;
+		}
+
+		entry_was_shared = tmp_entry->is_shared;
+
+		/*
+		 *	Take an object reference, so that we may
+		 *	release the map lock(s).
+		 */
+
+		assert(src_object != VM_OBJECT_NULL);
+		vm_object_reference(src_object);
+
+		/*
+		 *	Record the timestamp for later verification.
+		 *	Unlock the map.
+		 */
+
+		version.main_timestamp = src_map->timestamp;
+		vm_map_unlock(src_map); /* Increments timestamp once! */
+		saved_src_entry = src_entry;
+		tmp_entry = VM_MAP_ENTRY_NULL;
+		src_entry = VM_MAP_ENTRY_NULL;
+
+		/*
+		 *	Perform the copy
+		 */
+
+		if (was_wired) {
+CopySlowly:
+			vm_object_lock(src_object);
+			result = vm_object_copy_slowly(
+				src_object,
+				src_offset,
+				src_size,
+				THREAD_UNINT,
+				VME_OBJECT_PTR(new_entry));
+			VME_OFFSET_SET(new_entry, 0);
+			new_entry->needs_copy = FALSE;
+		} else if (src_object->copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC &&
+		    (entry_was_shared || map_share)) {
+			vm_object_t new_object;
+
+			vm_object_lock_shared(src_object);
+			new_object = vm_object_copy_delayed(
+				src_object,
+				src_offset,
+				src_size,
+				TRUE);
+			if (new_object == VM_OBJECT_NULL) {
+				goto CopySlowly;
+			}
+
+			VME_OBJECT_SET(new_entry, new_object);
+			assert(new_entry->wired_count == 0);
+			new_entry->needs_copy = TRUE;
+			assert(!new_entry->iokit_acct);
+			assert(new_object->purgable == VM_PURGABLE_DENY);
+			assertf(new_entry->use_pmap, "src_map %p new_entry %p\n", src_map, new_entry);
+			result = KERN_SUCCESS;
+		} else {
+			vm_object_offset_t new_offset;
+			new_offset = VME_OFFSET(new_entry);
+			result = vm_object_copy_strategically(src_object,
+			    src_offset,
+			    src_size,
+			    VME_OBJECT_PTR(new_entry),
+			    &new_offset,
+			    &new_entry_needs_copy);
+			if (new_offset != VME_OFFSET(new_entry)) {
+				VME_OFFSET_SET(new_entry, new_offset);
+			}
+
+			new_entry->needs_copy = new_entry_needs_copy;
+		}
+
+		if (result == KERN_SUCCESS &&
+		    preserve_purgeable &&
+		    src_object->purgable != VM_PURGABLE_DENY) {
+			vm_object_t     new_object;
+
+			new_object = VME_OBJECT(new_entry);
+			assert(new_object != src_object);
+			vm_object_lock(new_object);
+			assert(new_object->ref_count == 1);
+			assert(new_object->shadow == VM_OBJECT_NULL);
+			assert(new_object->copy == VM_OBJECT_NULL);
+			assert(new_object->vo_owner == NULL);
+
+			new_object->copy_strategy = MEMORY_OBJECT_COPY_NONE;
+			new_object->true_share = TRUE;
+			/* start as non-volatile with no owner... */
+			new_object->purgable = VM_PURGABLE_NONVOLATILE;
+			vm_purgeable_nonvolatile_enqueue(new_object, NULL);
+			/* ... and move to src_object's purgeable state */
+			if (src_object->purgable != VM_PURGABLE_NONVOLATILE) {
+				int state;
+				state = src_object->purgable;
+				vm_object_purgable_control(
+					new_object,
+					VM_PURGABLE_SET_STATE_FROM_KERNEL,
+					&state);
+			}
+			vm_object_unlock(new_object);
+			new_object = VM_OBJECT_NULL;
+			/* no pmap accounting for purgeable objects */
+			new_entry->use_pmap = FALSE;
+		}
+
+		if (result != KERN_SUCCESS &&
+		    result != KERN_MEMORY_RESTART_COPY) {
+			vm_map_lock(src_map);
+			RETURN(result);
+		}
+
+		/*
+		 *	Throw away the extra reference
+		 */
+
+		vm_object_deallocate(src_object);
+
+		/*
+		 *	Verify that the map has not substantially
+		 *	changed while the copy was being made.
+		 */
+
+		vm_map_lock(src_map);
+
+		if ((version.main_timestamp + 1) == src_map->timestamp) {
+			/* src_map hasn't changed: src_entry is still valid */
+			src_entry = saved_src_entry;
+			goto VerificationSuccessful;
+		}
+
+		/*
+		 *	Simple version comparison failed.
+		 *
+		 *	Retry the lookup and verify that the
+		 *	same object/offset are still present.
+		 *
+		 *	[Note: a memory manager that colludes with
+		 *	the calling task can detect that we have
+		 *	cheated.  While the map was unlocked, the
+		 *	mapping could have been changed and restored.]
+		 */
+
+		if (!vm_map_lookup_entry(src_map, src_start, &tmp_entry)) {
+			if (result != KERN_MEMORY_RESTART_COPY) {
+				vm_object_deallocate(VME_OBJECT(new_entry));
+				VME_OBJECT_SET(new_entry, VM_OBJECT_NULL);
+				/* reset accounting state */
+				new_entry->iokit_acct = FALSE;
+				new_entry->use_pmap = TRUE;
+			}
+			RETURN(KERN_INVALID_ADDRESS);
+		}
+
+		src_entry = tmp_entry;
+		vm_map_clip_start(src_map, src_entry, src_start);
+
+		if ((((src_entry->protection & VM_PROT_READ) == VM_PROT_NONE) &&
+		    !use_maxprot) ||
+		    ((src_entry->max_protection & VM_PROT_READ) == 0)) {
+			goto VerificationFailed;
+		}
+
+		if (src_entry->vme_end < new_entry->vme_end) {
+			/*
+			 * This entry might have been shortened
+			 * (vm_map_clip_end) or been replaced with
+			 * an entry that ends closer to "src_start"
+			 * than before.
+			 * Adjust "new_entry" accordingly; copying
+			 * less memory would be correct but we also
+			 * redo the copy (see below) if the new entry
+			 * no longer points at the same object/offset.
+			 */
+			assert(VM_MAP_PAGE_ALIGNED(src_entry->vme_end,
+			    VM_MAP_COPY_PAGE_MASK(copy)));
+			new_entry->vme_end = src_entry->vme_end;
+			src_size = new_entry->vme_end - src_start;
+		} else if (src_entry->vme_end > new_entry->vme_end) {
+			/*
+			 * This entry might have been extended
+			 * (vm_map_entry_simplify() or coalesce)
+			 * or been replaced with an entry that ends farther
+			 * from "src_start" than before.
+			 *
+			 * We've called vm_object_copy_*() only on
+			 * the previous <start:end> range, so we can't
+			 * just extend new_entry.  We have to re-do
+			 * the copy based on the new entry as if it was
+			 * pointing at a different object/offset (see
+			 * "Verification failed" below).
+			 */
+		}
+
+		if ((VME_OBJECT(src_entry) != src_object) ||
+		    (VME_OFFSET(src_entry) != src_offset) ||
+		    (src_entry->vme_end > new_entry->vme_end)) {
+			/*
+			 *	Verification failed.
+			 *
+			 *	Start over with this top-level entry.
+			 */
+
+VerificationFailed:     ;
+
+			vm_object_deallocate(VME_OBJECT(new_entry));
+			tmp_entry = src_entry;
+			continue;
+		}
+
+		/*
+		 *	Verification succeeded.
+		 */
+
+VerificationSuccessful:;
+
+		if (result == KERN_MEMORY_RESTART_COPY) {
+			goto RestartCopy;
+		}
+
+		/*
+		 *	Copy succeeded.
+		 */
+
+CopySuccessful: ;
+
+		/*
+		 *	Link in the new copy entry.
+		 */
+
+		vm_map_copy_entry_link(copy, vm_map_copy_last_entry(copy),
+		    new_entry);
+
+		/*
+		 *	Determine whether the entire region
+		 *	has been copied.
+		 */
+		src_base = src_start;
+		src_start = new_entry->vme_end;
+		new_entry = VM_MAP_ENTRY_NULL;
+		while ((src_start >= src_end) && (src_end != 0)) {
+			submap_map_t    *ptr;
+
+			if (src_map == base_map) {
+				/* back to the top */
+				break;
+			}
+
+			ptr = parent_maps;
+			assert(ptr != NULL);
+			parent_maps = parent_maps->next;
+
+			/* fix up the damage we did in that submap */
+			vm_map_simplify_range(src_map,
+			    src_base,
+			    src_end);
+
+			vm_map_unlock(src_map);
+			vm_map_deallocate(src_map);
+			vm_map_lock(ptr->parent_map);
+			src_map = ptr->parent_map;
+			src_base = ptr->base_start;
+			src_start = ptr->base_start + ptr->base_len;
+			src_end = ptr->base_end;
+			if (!vm_map_lookup_entry(src_map,
+			    src_start,
+			    &tmp_entry) &&
+			    (src_end > src_start)) {
+				RETURN(KERN_INVALID_ADDRESS);
+			}
+			kfree(ptr, sizeof(submap_map_t));
+			if (parent_maps == NULL) {
+				map_share = FALSE;
+			}
+			src_entry = tmp_entry->vme_prev;
+		}
+
+		if ((VM_MAP_PAGE_SHIFT(src_map) != PAGE_SHIFT) &&
+		    (src_start >= src_addr + len) &&
+		    (src_addr + len != 0)) {
+			/*
+			 * Stop copying now, even though we haven't reached
+			 * "src_end".  We'll adjust the end of the last copy
+			 * entry at the end, if needed.
+			 *
+			 * If src_map's aligment is different from the
+			 * system's page-alignment, there could be
+			 * extra non-map-aligned map entries between
+			 * the original (non-rounded) "src_addr + len"
+			 * and the rounded "src_end".
+			 * We do not want to copy those map entries since
+			 * they're not part of the copied range.
+			 */
+			break;
+		}
+
+		if ((src_start >= src_end) && (src_end != 0)) {
+			break;
+		}
+
+		/*
+		 *	Verify that there are no gaps in the region
+		 */
+
+		tmp_entry = src_entry->vme_next;
+		if ((tmp_entry->vme_start != src_start) ||
+		    (tmp_entry == vm_map_to_entry(src_map))) {
+			RETURN(KERN_INVALID_ADDRESS);
+		}
+	}
+
+	/*
+	 * If the source should be destroyed, do it now, since the
+	 * copy was successful.
+	 */
+	if (src_destroy) {
+		(void) vm_map_delete(
+			src_map,
+			vm_map_trunc_page(src_addr,
+			VM_MAP_PAGE_MASK(src_map)),
+			src_end,
+			((src_map == kernel_map) ?
+			VM_MAP_REMOVE_KUNWIRE :
+			VM_MAP_REMOVE_NO_FLAGS),
+			VM_MAP_NULL);
+	} else {
+		/* fix up the damage we did in the base map */
+		vm_map_simplify_range(
+			src_map,
+			vm_map_trunc_page(src_addr,
+			VM_MAP_PAGE_MASK(src_map)),
+			vm_map_round_page(src_end,
+			VM_MAP_PAGE_MASK(src_map)));
+	}
+
+	vm_map_unlock(src_map);
+	tmp_entry = VM_MAP_ENTRY_NULL;
+
+	if (VM_MAP_PAGE_SHIFT(src_map) != PAGE_SHIFT) {
+		vm_map_offset_t original_start, original_offset, original_end;
+
+		assert(VM_MAP_COPY_PAGE_MASK(copy) == PAGE_MASK);
+
+		/* adjust alignment of first copy_entry's "vme_start" */
+		tmp_entry = vm_map_copy_first_entry(copy);
+		if (tmp_entry != vm_map_copy_to_entry(copy)) {
+			vm_map_offset_t adjustment;
+
+			original_start = tmp_entry->vme_start;
+			original_offset = VME_OFFSET(tmp_entry);
+
+			/* map-align the start of the first copy entry... */
+			adjustment = (tmp_entry->vme_start -
+			    vm_map_trunc_page(
+				    tmp_entry->vme_start,
+				    VM_MAP_PAGE_MASK(src_map)));
+			tmp_entry->vme_start -= adjustment;
+			VME_OFFSET_SET(tmp_entry,
+			    VME_OFFSET(tmp_entry) - adjustment);
+			copy_addr -= adjustment;
+			assert(tmp_entry->vme_start < tmp_entry->vme_end);
+			/* ... adjust for mis-aligned start of copy range */
+			adjustment =
+			    (vm_map_trunc_page(copy->offset,
+			    PAGE_MASK) -
+			    vm_map_trunc_page(copy->offset,
+			    VM_MAP_PAGE_MASK(src_map)));
+			if (adjustment) {
+				assert(page_aligned(adjustment));
+				assert(adjustment < VM_MAP_PAGE_SIZE(src_map));
+				tmp_entry->vme_start += adjustment;
+				VME_OFFSET_SET(tmp_entry,
+				    (VME_OFFSET(tmp_entry) +
+				    adjustment));
+				copy_addr += adjustment;
+				assert(tmp_entry->vme_start < tmp_entry->vme_end);
+			}
+
+			/*
+			 * Assert that the adjustments haven't exposed
+			 * more than was originally copied...
+			 */
+			assert(tmp_entry->vme_start >= original_start);
+			assert(VME_OFFSET(tmp_entry) >= original_offset);
+			/*
+			 * ... and that it did not adjust outside of a
+			 * a single 16K page.
+			 */
+			assert(vm_map_trunc_page(tmp_entry->vme_start,
+			    VM_MAP_PAGE_MASK(src_map)) ==
+			    vm_map_trunc_page(original_start,
+			    VM_MAP_PAGE_MASK(src_map)));
+		}
+
+		/* adjust alignment of last copy_entry's "vme_end" */
+		tmp_entry = vm_map_copy_last_entry(copy);
+		if (tmp_entry != vm_map_copy_to_entry(copy)) {
+			vm_map_offset_t adjustment;
+
+			original_end = tmp_entry->vme_end;
+
+			/* map-align the end of the last copy entry... */
+			tmp_entry->vme_end =
+			    vm_map_round_page(tmp_entry->vme_end,
+			    VM_MAP_PAGE_MASK(src_map));
+			/* ... adjust for mis-aligned end of copy range */
+			adjustment =
+			    (vm_map_round_page((copy->offset +
+			    copy->size),
+			    VM_MAP_PAGE_MASK(src_map)) -
+			    vm_map_round_page((copy->offset +
+			    copy->size),
+			    PAGE_MASK));
+			if (adjustment) {
+				assert(page_aligned(adjustment));
+				assert(adjustment < VM_MAP_PAGE_SIZE(src_map));
+				tmp_entry->vme_end -= adjustment;
+				assert(tmp_entry->vme_start < tmp_entry->vme_end);
+			}
+
+			/*
+			 * Assert that the adjustments haven't exposed
+			 * more than was originally copied...
+			 */
+			assert(tmp_entry->vme_end <= original_end);
+			/*
+			 * ... and that it did not adjust outside of a
+			 * a single 16K page.
+			 */
+			assert(vm_map_round_page(tmp_entry->vme_end,
+			    VM_MAP_PAGE_MASK(src_map)) ==
+			    vm_map_round_page(original_end,
+			    VM_MAP_PAGE_MASK(src_map)));
+		}
+	}
+
+	/* Fix-up start and end points in copy.  This is necessary */
+	/* when the various entries in the copy object were picked */
+	/* up from different sub-maps */
+
+	tmp_entry = vm_map_copy_first_entry(copy);
+	copy_size = 0; /* compute actual size */
+	while (tmp_entry != vm_map_copy_to_entry(copy)) {
+		assert(VM_MAP_PAGE_ALIGNED(
+			    copy_addr + (tmp_entry->vme_end -
+			    tmp_entry->vme_start),
+			    VM_MAP_COPY_PAGE_MASK(copy)));
+		assert(VM_MAP_PAGE_ALIGNED(
+			    copy_addr,
+			    VM_MAP_COPY_PAGE_MASK(copy)));
+
+		/*
+		 * The copy_entries will be injected directly into the
+		 * destination map and might not be "map aligned" there...
+		 */
+		tmp_entry->map_aligned = FALSE;
+
+		tmp_entry->vme_end = copy_addr +
+		    (tmp_entry->vme_end - tmp_entry->vme_start);
+		tmp_entry->vme_start = copy_addr;
+		assert(tmp_entry->vme_start < tmp_entry->vme_end);
+		copy_addr += tmp_entry->vme_end - tmp_entry->vme_start;
+		copy_size += tmp_entry->vme_end - tmp_entry->vme_start;
+		tmp_entry = (struct vm_map_entry *)tmp_entry->vme_next;
+	}
+
+	if (VM_MAP_PAGE_SHIFT(src_map) != PAGE_SHIFT &&
+	    copy_size < copy->size) {
+		/*
+		 * The actual size of the VM map copy is smaller than what
+		 * was requested by the caller.  This must be because some
+		 * PAGE_SIZE-sized pages are missing at the end of the last
+		 * VM_MAP_PAGE_SIZE(src_map)-sized chunk of the range.
+		 * The caller might not have been aware of those missing
+		 * pages and might not want to be aware of it, which is
+		 * fine as long as they don't try to access (and crash on)
+		 * those missing pages.
+		 * Let's adjust the size of the "copy", to avoid failing
+		 * in vm_map_copyout() or vm_map_copy_overwrite().
+		 */
+		assert(vm_map_round_page(copy_size,
+		    VM_MAP_PAGE_MASK(src_map)) ==
+		    vm_map_round_page(copy->size,
+		    VM_MAP_PAGE_MASK(src_map)));
+		copy->size = copy_size;
+	}
+
+	*copy_result = copy;
+	return KERN_SUCCESS;
+
+#undef  RETURN
+}
+/*
+ *	vm_map_copy_extract:
+ *
+ *	Build an entry-list copy object (VM_MAP_COPY_ENTRY_LIST) for
+ *	the range [src_addr, src_addr + len) of "src_map" by calling
+ *	vm_map_remap_extract() with copy == FALSE and VM_INHERIT_SHARE.
+ *
+ *	On success, "*copy_result" receives the new copy object and
+ *	KERN_SUCCESS is returned.  "cur_prot" and "max_prot" are passed
+ *	straight through to vm_map_remap_extract().
+ *
+ *	A zero "len" yields VM_MAP_COPY_NULL and KERN_SUCCESS without
+ *	touching "cur_prot" or "max_prot".
+ *	KERN_INVALID_ADDRESS is returned if "src_addr + len" wraps
+ *	around.  Any error from vm_map_remap_extract() is returned
+ *	as is, after the copy object has been handed to
+ *	vm_map_copy_discard().
+ */
+kern_return_t
+vm_map_copy_extract(
+	vm_map_t                src_map,
+	vm_map_address_t        src_addr,
+	vm_map_size_t           len,
+	vm_map_copy_t           *copy_result,   /* OUT */
+	vm_prot_t               *cur_prot,      /* OUT */
+	vm_prot_t               *max_prot)
+{
+	vm_map_offset_t src_start, src_end;
+	vm_map_copy_t   copy;
+	kern_return_t   kr;
+
+	/*
+	 *	Check for copies of zero bytes.
+	 */
+
+	if (len == 0) {
+		*copy_result = VM_MAP_COPY_NULL;
+		return KERN_SUCCESS;
+	}
+
+	/*
+	 *	Check that the end address doesn't overflow
+	 */
+	src_end = src_addr + len;
+	if (src_end < src_addr) {
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/*
+	 *	Compute (page aligned) start and end of region
+	 *
+	 *	NOTE(review): the rounded values are not read again in
+	 *	this function; the extraction below is passed the
+	 *	original "src_addr" and "len".
+	 */
+	src_start = vm_map_trunc_page(src_addr, PAGE_MASK);
+	src_end = vm_map_round_page(src_end, PAGE_MASK);
+
+	/*
+	 *	Allocate a header element for the list.
+	 *
+	 *	The header records offset 0 and the caller's
+	 *	unrounded "len" (not the rounded endpoints).
+	 */
+
+	copy = vm_map_copy_allocate();
+	copy->type = VM_MAP_COPY_ENTRY_LIST;
+	copy->cpy_hdr.entries_pageable = TRUE;
+
+	vm_map_store_init(&copy->cpy_hdr);
+
+	copy->offset = 0;
+	copy->size = len;
+
+	kr = vm_map_remap_extract(src_map,
+	    src_addr,
+	    len,
+	    FALSE,                       /* copy */
+	    &copy->cpy_hdr,
+	    cur_prot,
+	    max_prot,
+	    VM_INHERIT_SHARE,
+	    TRUE,                       /* pageable */
+	    FALSE,                       /* same_map */
+	    VM_MAP_KERNEL_FLAGS_NONE);
+	if (kr != KERN_SUCCESS) {
+		vm_map_copy_discard(copy);      /* "*copy_result" is left untouched */
+		return kr;
+	}
+
+	*copy_result = copy;
+	return KERN_SUCCESS;
+}
+
+/*
+ *	vm_map_copyin_object:
+ *
+ *	Create a copy object from an object.
+ *	Our caller donates an object reference.
+ *
+ *	The new copy object is of type VM_MAP_COPY_OBJECT and simply
+ *	records "object", "offset" and "size"; no additional object
+ *	reference is taken here.  The result is stored in
+ *	"*copy_result" and, as written, KERN_SUCCESS is always
+ *	returned.
+ */
+
+kern_return_t
+vm_map_copyin_object(
+	vm_object_t             object,
+	vm_object_offset_t      offset, /* offset of region in object */
+	vm_object_size_t        size,   /* size of region in object */
+	vm_map_copy_t   *copy_result)   /* OUT */
+{
+	vm_map_copy_t   copy;           /* Resulting copy */
+
+	/*
+	 *	We drop the object into a special copy object
+	 *	that contains the object directly.
+	 */
+
+	copy = vm_map_copy_allocate();
+	copy->type = VM_MAP_COPY_OBJECT;
+	copy->cpy_object = object;      /* takes over the caller's donated reference */
+	copy->offset = offset;
+	copy->size = size;
+
+	*copy_result = copy;
+	return KERN_SUCCESS;
+}
+/*
+ *	vm_map_fork_share:
+ *
+ *	Make "new_map" share the memory mapped by "old_entry" in
+ *	"old_map": prepare the backing object (or submap), take a new
+ *	reference on it, clone the entry, mark both entries "is_shared"
+ *	and link the clone after the current last entry of "new_map".
+ *
+ *	No map locking is done here; vm_map_fork() calls this routine
+ *	with both "old_map" and "new_map" locked.
+ */
+static void
+vm_map_fork_share(
+	vm_map_t        old_map,
+	vm_map_entry_t  old_entry,
+	vm_map_t        new_map)
+{
+	vm_object_t     object;
+	vm_map_entry_t  new_entry;
+
+	/*
+	 *	New sharing code.  New map entry
+	 *	references original object.  Internal
+	 *	objects use asynchronous copy algorithm for
+	 *	future copies.  First make sure we have
+	 *	the right object.  If we need a shadow,
+	 *	or someone else already has one, then
+	 *	make a new shadow and share it.
+	 */
+
+	object = VME_OBJECT(old_entry); /* only used below when !is_sub_map */
+	if (old_entry->is_sub_map) {
+		assert(old_entry->wired_count == 0);
+#ifndef NO_NESTED_PMAP
+		if (old_entry->use_pmap) {
+			kern_return_t   result;
+
+			result = pmap_nest(new_map->pmap,
+			    (VME_SUBMAP(old_entry))->pmap,
+			    (addr64_t)old_entry->vme_start,
+			    (addr64_t)old_entry->vme_start,
+			    (uint64_t)(old_entry->vme_end - old_entry->vme_start));
+			if (result) {
+				panic("vm_map_fork_share: pmap_nest failed!");
+			}
+		}
+#endif  /* NO_NESTED_PMAP */
+	} else if (object == VM_OBJECT_NULL) {
+		/* nothing backs the entry yet: give it a fresh object covering the entry */
+		object = vm_object_allocate((vm_map_size_t)(old_entry->vme_end -
+		    old_entry->vme_start));
+		VME_OFFSET_SET(old_entry, 0);
+		VME_OBJECT_SET(old_entry, object);
+		old_entry->use_pmap = TRUE;
+//		assert(!old_entry->needs_copy);
+	} else if (object->copy_strategy !=
+	    MEMORY_OBJECT_COPY_SYMMETRIC) {
+		/*
+		 *	We are already using an asymmetric
+		 *	copy, and therefore we already have
+		 *	the right object.
+		 */
+
+		assert(!old_entry->needs_copy);
+	} else if (old_entry->needs_copy ||       /* case 1 */
+	    object->shadowed ||                 /* case 2 */
+	    (!object->true_share &&             /* case 3 */
+	    !old_entry->is_shared &&
+	    (object->vo_size >
+	    (vm_map_size_t)(old_entry->vme_end -
+	    old_entry->vme_start)))) {
+		/*
+		 *	We need to create a shadow.
+		 *	There are three cases here.
+		 *	In the first case, we need to
+		 *	complete a deferred symmetrical
+		 *	copy that we participated in.
+		 *	In the second and third cases,
+		 *	we need to create the shadow so
+		 *	that changes that we make to the
+		 *	object do not interfere with
+		 *	any symmetrical copies which
+		 *	have occurred (case 2) or which
+		 *	might occur (case 3).
+		 *
+		 *	The first case is when we had
+		 *	deferred shadow object creation
+		 *	via the entry->needs_copy mechanism.
+		 *	This mechanism only works when
+		 *	only one entry points to the source
+		 *	object, and we are about to create
+		 *	a second entry pointing to the
+		 *	same object. The problem is that
+		 *	there is no way of mapping from
+		 *	an object to the entries pointing
+		 *	to it. (Deferred shadow creation
+		 *	works with one entry because it occurs
+		 *	at fault time, and we walk from the
+		 *	entry to the object when handling
+		 *	the fault.)
+		 *
+		 *	The second case is when the object
+		 *	to be shared has already been copied
 		 *	with a symmetric copy, but we point
 		 *	directly to the object without
 		 *	needs_copy set in our entry. (This
@@ -5956,3100 +12173,7916 @@ vm_map_fork_share(
 		 *	which won't happen if the changes
 		 *	are made to a copy.)
 		 *
-		 *	The third case is when the object
-		 *	to be shared has parts sticking
-		 *	outside of the entry we're working
-		 *	with, and thus may in the future
-		 *	be subject to a symmetrical copy.
-		 *	(This is a preemptive version of
-		 *	case 2.)
+		 *	The third case is when the object
+		 *	to be shared has parts sticking
+		 *	outside of the entry we're working
+		 *	with, and thus may in the future
+		 *	be subject to a symmetrical copy.
+		 *	(This is a preemptive version of
+		 *	case 2.)
+		 */
+		VME_OBJECT_SHADOW(old_entry,
+		    (vm_map_size_t) (old_entry->vme_end -
+		    old_entry->vme_start));
+
+		/*
+		 *	If we're making a shadow for other than
+		 *	copy on write reasons, then we have
+		 *	to remove write permission.
+		 */
+
+		if (!old_entry->needs_copy &&
+		    (old_entry->protection & VM_PROT_WRITE)) {
+			vm_prot_t prot;
+
+			assert(!pmap_has_prot_policy(old_entry->protection));
+
+			prot = old_entry->protection & ~VM_PROT_WRITE;
+
+			assert(!pmap_has_prot_policy(prot));
+
+			if (override_nx(old_map, VME_ALIAS(old_entry)) && prot) {
+				prot |= VM_PROT_EXECUTE;
+			}
+
+			/*
+			 * Only the pmap-level protection is lowered to
+			 * "prot" below; old_entry->protection itself is
+			 * not modified.
+			 */
+
+			if (old_map->mapped_in_other_pmaps) {
+				vm_object_pmap_protect(
+					VME_OBJECT(old_entry),
+					VME_OFFSET(old_entry),
+					(old_entry->vme_end -
+					old_entry->vme_start),
+					PMAP_NULL,
+					old_entry->vme_start,
+					prot);
+			} else {
+				pmap_protect(old_map->pmap,
+				    old_entry->vme_start,
+				    old_entry->vme_end,
+				    prot);
+			}
+		}
+
+		old_entry->needs_copy = FALSE;
+		object = VME_OBJECT(old_entry); /* re-read: presumably now the new shadow */
+	}
+
+
+	/*
+	 *	If object was using a symmetric copy strategy,
+	 *	change its copy strategy to the default
+	 *	asymmetric copy strategy, which is copy_delay
+	 *	in the non-norma case and copy_call in the
+	 *	norma case. Bump the reference count for the
+	 *	new entry.
+	 *
+	 *	For a submap entry, the extra reference is taken
+	 *	on the submap instead, under the submap's lock.
+	 */
+
+	if (old_entry->is_sub_map) {
+		vm_map_lock(VME_SUBMAP(old_entry));
+		vm_map_reference(VME_SUBMAP(old_entry));
+		vm_map_unlock(VME_SUBMAP(old_entry));
+	} else {
+		vm_object_lock(object);
+		vm_object_reference_locked(object);
+		if (object->copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC) {
+			object->copy_strategy = MEMORY_OBJECT_COPY_DELAY;
+		}
+		vm_object_unlock(object);
+	}
+
+	/*
+	 *	Clone the entry, using object ref from above.
+	 *	Mark both entries as shared.
+	 */
+
+	new_entry = vm_map_entry_create(new_map, FALSE); /* Never the kernel
+	                                                  * map or descendants */
+	vm_map_entry_copy(new_entry, old_entry);
+	old_entry->is_shared = TRUE;
+	new_entry->is_shared = TRUE;
+
+	/*
+	 * We're dealing with a shared mapping, so the resulting mapping
+	 * should inherit some of the original mapping's accounting settings.
+	 * "iokit_acct" should have been cleared in vm_map_entry_copy().
+	 * "use_pmap" should stay the same as before (if it hasn't been reset
+	 * to TRUE when we cleared "iokit_acct").
+	 */
+	assert(!new_entry->iokit_acct);
+
+	/*
+	 *	If old entry's inheritance is VM_INHERIT_NONE,
+	 *	the new entry is for corpse fork, remove the
+	 *	write permission from the new entry (both its
+	 *	current and its maximum protection).
+	 */
+	if (old_entry->inheritance == VM_INHERIT_NONE) {
+		new_entry->protection &= ~VM_PROT_WRITE;
+		new_entry->max_protection &= ~VM_PROT_WRITE;
+	}
+
+	/*
+	 *	Insert the entry into the new map -- we
+	 *	know we're inserting at the end of the new
+	 *	map.
+	 */
+
+	vm_map_store_entry_link(new_map, vm_map_last_entry(new_map), new_entry,
+	    VM_MAP_KERNEL_FLAGS_NONE);
+
+	/*
+	 *	Update the physical map
+	 *	(nothing is done here for submap entries).
+	 */
+
+	if (old_entry->is_sub_map) {
+		/* Bill Angell pmap support goes here */
+	} else {
+		pmap_copy(new_map->pmap, old_map->pmap, new_entry->vme_start,
+		    old_entry->vme_end - old_entry->vme_start,
+		    old_entry->vme_start);
+	}
+}
+/*
+ *	vm_map_fork_copy:
+ *
+ *	Copy the range covered by "*old_entry_p" from "old_map" into
+ *	"new_map", using vm_map_copyin_internal() (with
+ *	VM_MAP_COPYIN_USE_MAXPROT added to "vm_map_copyin_flags")
+ *	followed by vm_map_copy_insert() after the entry that was
+ *	last in "new_map" on entry.
+ *
+ *	"old_map" is unlocked around the copyin and locked again
+ *	before returning on both paths, so "*old_entry_p" is always
+ *	refreshed from a new lookup:
+ *	- TRUE: the copy was inserted; "*old_entry_p" is the entry at
+ *	  (or the first one after) the end of the copied range.
+ *	- FALSE: the copyin failed and nothing was inserted;
+ *	  "*old_entry_p" is the entry to resume from, skipping a hole
+ *	  or an entry whose max_protection lacks VM_PROT_READ.
+ */
+static boolean_t
+vm_map_fork_copy(
+	vm_map_t        old_map,
+	vm_map_entry_t  *old_entry_p,
+	vm_map_t        new_map,
+	int             vm_map_copyin_flags)
+{
+	vm_map_entry_t old_entry = *old_entry_p;
+	vm_map_size_t entry_size = old_entry->vme_end - old_entry->vme_start;
+	vm_map_offset_t start = old_entry->vme_start;
+	vm_map_copy_t copy;
+	vm_map_entry_t last = vm_map_last_entry(new_map); /* insertion point; reused below for old_map lookups */
+
+	vm_map_unlock(old_map); /* "old_entry" must not be used past this point */
+	/*
+	 *	Use maxprot version of copyin because we
+	 *	care about whether this memory can ever
+	 *	be accessed, not just whether it's accessible
+	 *	right now.
+	 */
+	vm_map_copyin_flags |= VM_MAP_COPYIN_USE_MAXPROT;
+	if (vm_map_copyin_internal(old_map, start, entry_size,
+	    vm_map_copyin_flags, &copy)
+	    != KERN_SUCCESS) {
+		/*
+		 *	The map might have changed while it
+		 *	was unlocked, check it again.  Skip
+		 *	any blank space or permanently
+		 *	unreadable region.
+		 */
+		vm_map_lock(old_map);
+		if (!vm_map_lookup_entry(old_map, start, &last) ||
+		    (last->max_protection & VM_PROT_READ) == VM_PROT_NONE) {
+			last = last->vme_next;
+		}
+		*old_entry_p = last;
+
+		/*
+		 * XXX	For some error returns, want to
+		 * XXX	skip to the next element.  Note
+		 *	that INVALID_ADDRESS and
+		 *	PROTECTION_FAILURE are handled above.
+		 */
+
+		return FALSE;
+	}
+
+	/*
+	 *	Insert the copy into the new map
+	 */
+
+	vm_map_copy_insert(new_map, last, copy);
+
+	/*
+	 *	Pick up the traversal at the end of
+	 *	the copied region.
+	 */
+
+	vm_map_lock(old_map);
+	start += entry_size;
+	if (!vm_map_lookup_entry(old_map, start, &last)) {
+		last = last->vme_next;
+	} else {
+		if (last->vme_start == start) {
+			/*
+			 * No need to clip here and we don't
+			 * want to cause any unnecessary
+			 * unnesting...
+			 */
+		} else {
+			vm_map_clip_start(old_map, last, start);
+		}
+	}
+	*old_entry_p = last;
+
+	return TRUE;
+}
+
+/*
+ *	vm_map_fork:
+ *
+ *	Create and return a new map based on the old
+ *	map, according to the inheritance values on the
+ *	regions in that map and the options.
+ *
+ *	"ledger" is passed to pmap_create_options() for the new pmap.
+ *	"options" may combine VM_MAP_FORK_SHARE_IF_INHERIT_NONE,
+ *	VM_MAP_FORK_PRESERVE_PURGEABLE and VM_MAP_FORK_CORPSE_FOOTPRINT.
+ *
+ *	Returns the new map, or VM_MAP_NULL if "options" contains an
+ *	unsupported bit or if no pmap could be created for the new map.
+ *
+ *	The source map must not be locked.
+ */
+vm_map_t
+vm_map_fork(
+	ledger_t        ledger,
+	vm_map_t        old_map,
+	int             options)
+{
+	pmap_t          new_pmap;
+	vm_map_t        new_map;
+	vm_map_entry_t  old_entry;
+	vm_map_size_t   new_size = 0, entry_size;
+	vm_map_entry_t  new_entry;
+	boolean_t       src_needs_copy;
+	boolean_t       new_entry_needs_copy;
+	boolean_t       pmap_is64bit;
+	int             vm_map_copyin_flags;
+	vm_inherit_t    old_entry_inheritance;
+	int             map_create_options;
+	/*
+	 * Only consulted when VM_MAP_FORK_CORPSE_FOOTPRINT is set, but
+	 * initialized unconditionally so it is never read indeterminate.
+	 */
+	kern_return_t   footprint_collect_kr = KERN_SUCCESS;
+
+	if (options & ~(VM_MAP_FORK_SHARE_IF_INHERIT_NONE |
+	    VM_MAP_FORK_PRESERVE_PURGEABLE |
+	    VM_MAP_FORK_CORPSE_FOOTPRINT)) {
+		/* unsupported option */
+		return VM_MAP_NULL;
+	}
+
+	pmap_is64bit =
+#if defined(__i386__) || defined(__x86_64__)
+	    old_map->pmap->pm_task_map != TASK_MAP_32BIT;
+#elif defined(__arm64__)
+	    old_map->pmap->max == MACH_VM_MAX_ADDRESS;
+#elif defined(__arm__)
+	    FALSE;
+#else
+#error Unknown architecture.
+#endif
+
+	unsigned int pmap_flags = 0;
+	pmap_flags |= pmap_is64bit ? PMAP_CREATE_64BIT : 0;
+#if defined(HAS_APPLE_PAC)
+	pmap_flags |= old_map->pmap->disable_jop ? PMAP_CREATE_DISABLE_JOP : 0;
+#endif
+	new_pmap = pmap_create_options(ledger, (vm_map_size_t) 0, pmap_flags);
+	if (new_pmap == PMAP_NULL) {
+		/*
+		 * No pmap, no map.  Nothing has been referenced or locked
+		 * yet, so there is nothing to undo.
+		 */
+		return VM_MAP_NULL;
+	}
+
+	vm_map_reference_swap(old_map);
+	vm_map_lock(old_map);
+
+	map_create_options = 0;
+	if (old_map->hdr.entries_pageable) {
+		map_create_options |= VM_MAP_CREATE_PAGEABLE;
+	}
+	if (options & VM_MAP_FORK_CORPSE_FOOTPRINT) {
+		map_create_options |= VM_MAP_CREATE_CORPSE_FOOTPRINT;
+	}
+	new_map = vm_map_create_options(new_pmap,
+	    old_map->min_offset,
+	    old_map->max_offset,
+	    map_create_options);
+	vm_map_lock(new_map);
+	vm_commit_pagezero_status(new_map);
+	/* inherit the parent map's page size */
+	vm_map_set_page_shift(new_map, VM_MAP_PAGE_SHIFT(old_map));
+	/*
+	 * No increment clause: every path through the body advances
+	 * "old_entry" itself, either via vme_next at the bottom of the
+	 * loop or through vm_map_fork_copy() updating it in place.
+	 */
+	for (
+		old_entry = vm_map_first_entry(old_map);
+		old_entry != vm_map_to_entry(old_map);
+		) {
+		entry_size = old_entry->vme_end - old_entry->vme_start;
+
+		old_entry_inheritance = old_entry->inheritance;
+		/*
+		 * If caller used the VM_MAP_FORK_SHARE_IF_INHERIT_NONE option
+		 * share VM_INHERIT_NONE entries that are not backed by a
+		 * device pager.
+		 */
+		if (old_entry_inheritance == VM_INHERIT_NONE &&
+		    (options & VM_MAP_FORK_SHARE_IF_INHERIT_NONE) &&
+		    !(!old_entry->is_sub_map &&
+		    VME_OBJECT(old_entry) != NULL &&
+		    VME_OBJECT(old_entry)->pager != NULL &&
+		    is_device_pager_ops(
+			    VME_OBJECT(old_entry)->pager->mo_pager_ops))) {
+			old_entry_inheritance = VM_INHERIT_SHARE;
+		}
+
+		if (old_entry_inheritance != VM_INHERIT_NONE &&
+		    (options & VM_MAP_FORK_CORPSE_FOOTPRINT) &&
+		    footprint_collect_kr == KERN_SUCCESS) {
+			/*
+			 * The corpse won't have old_map->pmap to query
+			 * footprint information, so collect that data now
+			 * and store it in new_map->vmmap_corpse_footprint
+			 * for later autopsy.
+			 * Once a collection fails, no further entries are
+			 * collected.
+			 */
+			footprint_collect_kr =
+			    vm_map_corpse_footprint_collect(old_map,
+			    old_entry,
+			    new_map);
+		}
+
+		switch (old_entry_inheritance) {
+		case VM_INHERIT_NONE:
+			break;
+
+		case VM_INHERIT_SHARE:
+			vm_map_fork_share(old_map, old_entry, new_map);
+			new_size += entry_size;
+			break;
+
+		case VM_INHERIT_COPY:
+
+			/*
+			 *	Inline the copy_quickly case;
+			 *	upon failure, fall back on call
+			 *	to vm_map_fork_copy.
+			 */
+
+			if (old_entry->is_sub_map) {
+				/* submap entries are not copied to the child */
+				break;
+			}
+			if ((old_entry->wired_count != 0) ||
+			    ((VME_OBJECT(old_entry) != NULL) &&
+			    (VME_OBJECT(old_entry)->true_share))) {
+				goto slow_vm_map_fork_copy;
+			}
+
+			new_entry = vm_map_entry_create(new_map, FALSE); /* never the kernel map or descendants */
+			vm_map_entry_copy(new_entry, old_entry);
+			if (new_entry->is_sub_map) {
+				/* clear address space specifics */
+				new_entry->use_pmap = FALSE;
+			} else {
+				/*
+				 * We're dealing with a copy-on-write operation,
+				 * so the resulting mapping should not inherit
+				 * the original mapping's accounting settings.
+				 * "iokit_acct" should have been cleared in
+				 * vm_map_entry_copy().
+				 * "use_pmap" should be reset to its default
+				 * (TRUE) so that the new mapping gets
+				 * accounted for in the task's memory footprint.
+				 */
+				assert(!new_entry->iokit_acct);
+				new_entry->use_pmap = TRUE;
+			}
+
+			if (!vm_object_copy_quickly(
+				    VME_OBJECT_PTR(new_entry),
+				    VME_OFFSET(old_entry),
+				    (old_entry->vme_end -
+				    old_entry->vme_start),
+				    &src_needs_copy,
+				    &new_entry_needs_copy)) {
+				vm_map_entry_dispose(new_map, new_entry);
+				goto slow_vm_map_fork_copy;
+			}
+
+			/*
+			 *	Handle copy-on-write obligations
+			 */
+
+			if (src_needs_copy && !old_entry->needs_copy) {
+				vm_prot_t prot;
+
+				assert(!pmap_has_prot_policy(old_entry->protection));
+
+				prot = old_entry->protection & ~VM_PROT_WRITE;
+
+				if (override_nx(old_map, VME_ALIAS(old_entry))
+				    && prot) {
+					prot |= VM_PROT_EXECUTE;
+				}
+
+				assert(!pmap_has_prot_policy(prot));
+
+				vm_object_pmap_protect(
+					VME_OBJECT(old_entry),
+					VME_OFFSET(old_entry),
+					(old_entry->vme_end -
+					old_entry->vme_start),
+					((old_entry->is_shared
+					|| old_map->mapped_in_other_pmaps)
+					? PMAP_NULL :
+					old_map->pmap),
+					old_entry->vme_start,
+					prot);
+
+				assert(old_entry->wired_count == 0);
+				old_entry->needs_copy = TRUE;
+			}
+			new_entry->needs_copy = new_entry_needs_copy;
+
+			/*
+			 *	Insert the entry at the end
+			 *	of the map.
+			 */
+
+			vm_map_store_entry_link(new_map,
+			    vm_map_last_entry(new_map),
+			    new_entry,
+			    VM_MAP_KERNEL_FLAGS_NONE);
+			new_size += entry_size;
+			break;
+
+slow_vm_map_fork_copy:
+			vm_map_copyin_flags = 0;
+			if (options & VM_MAP_FORK_PRESERVE_PURGEABLE) {
+				vm_map_copyin_flags |=
+				    VM_MAP_COPYIN_PRESERVE_PURGEABLE;
+			}
+			if (vm_map_fork_copy(old_map,
+			    &old_entry,
+			    new_map,
+			    vm_map_copyin_flags)) {
+				new_size += entry_size;
+			}
+			/*
+			 * vm_map_fork_copy() has already repositioned
+			 * "old_entry": skip the vme_next step below.
+			 */
+			continue;
+		}
+		old_entry = old_entry->vme_next;
+	}
+
+#if defined(__arm64__)
+	pmap_insert_sharedpage(new_map->pmap);
+#endif
+
+	new_map->size = new_size;
+
+	if (options & VM_MAP_FORK_CORPSE_FOOTPRINT) {
+		vm_map_corpse_footprint_collect_done(new_map);
+	}
+
+	vm_map_unlock(new_map);
+	vm_map_unlock(old_map);
+	vm_map_deallocate(old_map);
+
+	return new_map;
+}
+
+/*
+ * vm_map_exec:
+ *
+ *	Set up the "new_map" with the proper execution environment according
+ *	to the type of executable (platform, 64bit, chroot environment).
+ *	Map the comm page and shared region, etc...
+ *
+ *	Calls vm_commpage_enter() and then vm_shared_region_enter() on
+ *	"new_map".  The results of both calls are discarded, so this
+ *	function always returns KERN_SUCCESS.  A SHARED_REGION_TRACE_DEBUG
+ *	record is issued on entry ("->") and again on exit ("<-").
+ */
+kern_return_t
+vm_map_exec(
+	vm_map_t        new_map,
+	task_t          task,
+	boolean_t       is64bit,
+	void            *fsroot,
+	cpu_type_t      cpu,
+	cpu_subtype_t   cpu_subtype)
+{
+	SHARED_REGION_TRACE_DEBUG(
+		("shared_region: task %p: vm_map_exec(%p,%p,%p,0x%x,0x%x): ->\n",
+		(void *)VM_KERNEL_ADDRPERM(current_task()),
+		(void *)VM_KERNEL_ADDRPERM(new_map),
+		(void *)VM_KERNEL_ADDRPERM(task),
+		(void *)VM_KERNEL_ADDRPERM(fsroot),
+		cpu,
+		cpu_subtype));
+	(void) vm_commpage_enter(new_map, task, is64bit);
+	(void) vm_shared_region_enter(new_map, task, is64bit, fsroot, cpu, cpu_subtype);
+	SHARED_REGION_TRACE_DEBUG(
+		("shared_region: task %p: vm_map_exec(%p,%p,%p,0x%x,0x%x): <-\n",
+		(void *)VM_KERNEL_ADDRPERM(current_task()),
+		(void *)VM_KERNEL_ADDRPERM(new_map),
+		(void *)VM_KERNEL_ADDRPERM(task),
+		(void *)VM_KERNEL_ADDRPERM(fsroot),
+		cpu,
+		cpu_subtype));
+	return KERN_SUCCESS;
+}
+
+/*
+ *	vm_map_lookup_locked:
+ *
+ *	Finds the VM object, offset, and
+ *	protection for a given virtual address in the
+ *	specified map, assuming a page fault of the
+ *	type specified.
+ *
+ *	Returns the (object, offset, protection) for
+ *	this address and whether it is wired down.
+ *	In order to later verify this lookup, a "version"
+ *	is returned.
+ *
+ *	The map MUST be locked by the caller and WILL be
+ *	locked on exit.  In order to guarantee the
+ *	existence of the returned object, it is returned
+ *	locked.
+ *
+ *	If a lookup is requested with "write protection"
+ *	specified, the map may be changed to perform virtual
+ *	copying operations, although the data referenced will
+ *	remain the same.
+ *
+ *	Arguments:
+ *	  var_map          IN: the map to start the lookup in.
+ *	                   OUT: updated to the submap each time the
+ *	                   lookup descends through a submap entry (or
+ *	                   back to the copy-on-write parent map when a
+ *	                   submap entry gets replaced by a copy object).
+ *	  vaddr            the address to look up in "*var_map".
+ *	  fault_type       the access being attempted.  VM_PROT_IS_MASK
+ *	                   and VM_PROT_COPY are recognized as modifiers
+ *	                   and then stripped (fault_type &= VM_PROT_ALL).
+ *	  object_lock_type OBJECT_LOCK_EXCLUSIVE locks the returned object
+ *	                   exclusively; any other value locks it shared.
+ *	  out_version      receives the final map's timestamp.
+ *	  object, offset,
+ *	  out_prot, wired  the results of the lookup.
+ *	  fault_info       optional; filled in from the entry if not NULL.
+ *	  real_map         OUT: starts as "*var_map" and is replaced by a
+ *	                   submap when descending through a "use_pmap"
+ *	                   entry on a fault that is neither a write nor a
+ *	                   forced copy.
+ *
+ *	Returns KERN_SUCCESS, KERN_INVALID_ADDRESS if no entry contains
+ *	the address at some level, or KERN_PROTECTION_FAILURE if the
+ *	entry's protection does not allow "fault_type".
+ */
+kern_return_t
+vm_map_lookup_locked(
+	vm_map_t                *var_map,       /* IN/OUT */
+	vm_map_offset_t         vaddr,
+	vm_prot_t               fault_type,
+	int                     object_lock_type,
+	vm_map_version_t        *out_version,   /* OUT */
+	vm_object_t             *object,        /* OUT */
+	vm_object_offset_t      *offset,        /* OUT */
+	vm_prot_t               *out_prot,      /* OUT */
+	boolean_t               *wired,         /* OUT */
+	vm_object_fault_info_t  fault_info,     /* OUT */
+	vm_map_t                *real_map)
+{
+	vm_map_entry_t                  entry;
+	vm_map_t                        map = *var_map;
+	vm_map_t                        old_map = *var_map;
+	vm_map_t                        cow_sub_map_parent = VM_MAP_NULL;
+	vm_map_offset_t                 cow_parent_vaddr = 0;
+	vm_map_offset_t                 old_start = 0;
+	vm_map_offset_t                 old_end = 0;
+	vm_prot_t                       prot;
+	boolean_t                       mask_protections;
+	boolean_t                       force_copy;
+	vm_prot_t                       original_fault_type;
+
+	/*
+	 * VM_PROT_MASK means that the caller wants us to use "fault_type"
+	 * as a mask against the mapping's actual protections, not as an
+	 * absolute value.
+	 * VM_PROT_COPY requests the copy-on-write handling below even if
+	 * the fault is not a write ("force_copy").
+	 */
+	mask_protections = (fault_type & VM_PROT_IS_MASK) ? TRUE : FALSE;
+	force_copy = (fault_type & VM_PROT_COPY) ? TRUE : FALSE;
+	fault_type &= VM_PROT_ALL;
+	original_fault_type = fault_type;
+
+	*real_map = map;
+
+RetryLookup:
+	fault_type = original_fault_type;
+
+	/*
+	 *	If the map has an interesting hint, try it before calling
+	 *	full blown lookup routine.
+	 */
+	entry = map->hint;
+
+	if ((entry == vm_map_to_entry(map)) ||
+	    (vaddr < entry->vme_start) || (vaddr >= entry->vme_end)) {
+		vm_map_entry_t  tmp_entry;
+
+		/*
+		 *	Entry was either not a valid hint, or the vaddr
+		 *	was not contained in the entry, so do a full lookup.
+		 */
+		if (!vm_map_lookup_entry(map, vaddr, &tmp_entry)) {
+			if ((cow_sub_map_parent) && (cow_sub_map_parent != map)) {
+				vm_map_unlock(cow_sub_map_parent);
+			}
+			if ((*real_map != map)
+			    && (*real_map != cow_sub_map_parent)) {
+				vm_map_unlock(*real_map);
+			}
+			return KERN_INVALID_ADDRESS;
+		}
+
+		entry = tmp_entry;
+	}
+	if (map == old_map) {
+		old_start = entry->vme_start;
+		old_end = entry->vme_end;
+	}
+
+	/*
+	 *	Handle submaps.  Drop lock on upper map, submap is
+	 *	returned locked.
+	 */
+
+submap_recurse:
+	if (entry->is_sub_map) {
+		vm_map_offset_t         local_vaddr;
+		vm_map_offset_t         end_delta;
+		vm_map_offset_t         start_delta;
+		vm_map_entry_t          submap_entry;
+		vm_prot_t               subentry_protection;
+		vm_prot_t               subentry_max_protection;
+		boolean_t               subentry_no_copy_on_read;
+		boolean_t               mapped_needs_copy = FALSE;
+
+		local_vaddr = vaddr;
+
+		if ((entry->use_pmap &&
+		    !((fault_type & VM_PROT_WRITE) ||
+		    force_copy))) {
+			/* if real_map equals map we unlock below */
+			if ((*real_map != map) &&
+			    (*real_map != cow_sub_map_parent)) {
+				vm_map_unlock(*real_map);
+			}
+			*real_map = VME_SUBMAP(entry);
+		}
+
+		if (entry->needs_copy &&
+		    ((fault_type & VM_PROT_WRITE) ||
+		    force_copy)) {
+			if (!mapped_needs_copy) {
+				if (vm_map_lock_read_to_write(map)) {
+					vm_map_lock_read(map);
+					*real_map = map;
+					goto RetryLookup;
+				}
+				vm_map_lock_read(VME_SUBMAP(entry));
+				*var_map = VME_SUBMAP(entry);
+				cow_sub_map_parent = map;
+				/* reset base to map before cow object */
+				/* this is the map which will accept   */
+				/* the new cow object */
+				old_start = entry->vme_start;
+				old_end = entry->vme_end;
+				cow_parent_vaddr = vaddr;
+				mapped_needs_copy = TRUE;
+			} else {
+				vm_map_lock_read(VME_SUBMAP(entry));
+				*var_map = VME_SUBMAP(entry);
+				if ((cow_sub_map_parent != map) &&
+				    (*real_map != map)) {
+					vm_map_unlock(map);
+				}
+			}
+		} else {
+			vm_map_lock_read(VME_SUBMAP(entry));
+			*var_map = VME_SUBMAP(entry);
+			/* leave map locked if it is a target */
+			/* cow sub_map above otherwise, just  */
+			/* follow the maps down to the object */
+			/* here we unlock knowing we are not  */
+			/* revisiting the map.  */
+			if ((*real_map != map) && (map != cow_sub_map_parent)) {
+				vm_map_unlock_read(map);
+			}
+		}
+
+		map = *var_map;
+
+		/* calculate the offset in the submap for vaddr */
+		local_vaddr = (local_vaddr - entry->vme_start) + VME_OFFSET(entry);
+
+RetrySubMap:
+		if (!vm_map_lookup_entry(map, local_vaddr, &submap_entry)) {
+			if ((cow_sub_map_parent) && (cow_sub_map_parent != map)) {
+				vm_map_unlock(cow_sub_map_parent);
+			}
+			if ((*real_map != map)
+			    && (*real_map != cow_sub_map_parent)) {
+				vm_map_unlock(*real_map);
+			}
+			*real_map = map;
+			return KERN_INVALID_ADDRESS;
+		}
+
+		/* find the attenuated shadow of the underlying object */
+		/* on our target map */
+
+		/* In other words, the submap object may extend beyond    */
+		/* the region mapped by the entry or may only fill a      */
+		/* portion of it.  For our purposes, we only care if the  */
+		/* object doesn't fill.  In this case the area which will */
+		/* ultimately be clipped in the top map will only need    */
+		/* to be as big as the portion of the underlying entry    */
+		/* which is mapped */
+		start_delta = submap_entry->vme_start > VME_OFFSET(entry) ?
+		    submap_entry->vme_start - VME_OFFSET(entry) : 0;
+
+		end_delta =
+		    (VME_OFFSET(entry) + start_delta + (old_end - old_start)) <=
+		    submap_entry->vme_end ?
+		    0 : (VME_OFFSET(entry) +
+		    (old_end - old_start))
+		    - submap_entry->vme_end;
+
+		old_start += start_delta;
+		old_end -= end_delta;
+
+		if (submap_entry->is_sub_map) {
+			entry = submap_entry;
+			vaddr = local_vaddr;
+			goto submap_recurse;
+		}
+
+		if (((fault_type & VM_PROT_WRITE) ||
+		    force_copy)
+		    && cow_sub_map_parent) {
+			vm_object_t     sub_object, copy_object;
+			vm_object_offset_t copy_offset;
+			vm_map_offset_t local_start;
+			vm_map_offset_t local_end;
+			boolean_t               copied_slowly = FALSE;
+
+			if (vm_map_lock_read_to_write(map)) {
+				vm_map_lock_read(map);
+				old_start -= start_delta;
+				old_end += end_delta;
+				goto RetrySubMap;
+			}
+
+
+			sub_object = VME_OBJECT(submap_entry);
+			if (sub_object == VM_OBJECT_NULL) {
+				sub_object =
+				    vm_object_allocate(
+					(vm_map_size_t)
+					(submap_entry->vme_end -
+					submap_entry->vme_start));
+				VME_OBJECT_SET(submap_entry, sub_object);
+				VME_OFFSET_SET(submap_entry, 0);
+				assert(!submap_entry->is_sub_map);
+				assert(submap_entry->use_pmap);
+			}
+			local_start =  local_vaddr -
+			    (cow_parent_vaddr - old_start);
+			local_end = local_vaddr +
+			    (old_end - cow_parent_vaddr);
+			vm_map_clip_start(map, submap_entry, local_start);
+			vm_map_clip_end(map, submap_entry, local_end);
+			if (submap_entry->is_sub_map) {
+				/* unnesting was done when clipping */
+				assert(!submap_entry->use_pmap);
+			}
+
+			/* This is the COW case, let's connect */
+			/* an entry in our space to the underlying */
+			/* object in the submap, bypassing the  */
+			/* submap. */
+
+
+			if (submap_entry->wired_count != 0 ||
+			    (sub_object->copy_strategy ==
+			    MEMORY_OBJECT_COPY_NONE)) {
+				vm_object_lock(sub_object);
+				vm_object_copy_slowly(sub_object,
+				    VME_OFFSET(submap_entry),
+				    (submap_entry->vme_end -
+				    submap_entry->vme_start),
+				    FALSE,
+				    &copy_object);
+				copied_slowly = TRUE;
+			} else {
+				/* set up shadow object */
+				copy_object = sub_object;
+				vm_object_lock(sub_object);
+				vm_object_reference_locked(sub_object);
+				sub_object->shadowed = TRUE;
+				vm_object_unlock(sub_object);
+
+				assert(submap_entry->wired_count == 0);
+				submap_entry->needs_copy = TRUE;
+
+				prot = submap_entry->protection;
+				assert(!pmap_has_prot_policy(prot));
+				prot = prot & ~VM_PROT_WRITE;
+				assert(!pmap_has_prot_policy(prot));
+
+				if (override_nx(old_map,
+				    VME_ALIAS(submap_entry))
+				    && prot) {
+					prot |= VM_PROT_EXECUTE;
+				}
+
+				vm_object_pmap_protect(
+					sub_object,
+					VME_OFFSET(submap_entry),
+					submap_entry->vme_end -
+					submap_entry->vme_start,
+					(submap_entry->is_shared
+					|| map->mapped_in_other_pmaps) ?
+					PMAP_NULL : map->pmap,
+					submap_entry->vme_start,
+					prot);
+			}
+
+			/*
+			 * Adjust the fault offset to the submap entry.
+			 */
+			copy_offset = (local_vaddr -
+			    submap_entry->vme_start +
+			    VME_OFFSET(submap_entry));
+
+			/* This works differently than the */
+			/* normal submap case. We go back  */
+			/* to the parent of the cow map and*/
+			/* clip out the target portion of  */
+			/* the sub_map, substituting the   */
+			/* new copy object.                */
+
+			subentry_protection = submap_entry->protection;
+			subentry_max_protection = submap_entry->max_protection;
+			subentry_no_copy_on_read = submap_entry->vme_no_copy_on_read;
+			vm_map_unlock(map);
+			submap_entry = NULL; /* not valid after map unlock */
+
+			local_start = old_start;
+			local_end = old_end;
+			map = cow_sub_map_parent;
+			*var_map = cow_sub_map_parent;
+			vaddr = cow_parent_vaddr;
+			cow_sub_map_parent = NULL;
+
+			if (!vm_map_lookup_entry(map,
+			    vaddr, &entry)) {
+				vm_object_deallocate(
+					copy_object);
+				vm_map_lock_write_to_read(map);
+				return KERN_INVALID_ADDRESS;
+			}
+
+			/* clip out the portion of space */
+			/* mapped by the sub map which   */
+			/* corresponds to the underlying */
+			/* object */
+
+			/*
+			 * Clip (and unnest) the smallest nested chunk
+			 * possible around the faulting address...
+			 */
+			local_start = vaddr & ~(pmap_nesting_size_min - 1);
+			local_end = local_start + pmap_nesting_size_min;
+			/*
+			 * ... but don't go beyond the "old_start" to "old_end"
+			 * range, to avoid spanning over another VM region
+			 * with a possibly different VM object and/or offset.
+			 */
+			if (local_start < old_start) {
+				local_start = old_start;
+			}
+			if (local_end > old_end) {
+				local_end = old_end;
+			}
+			/*
+			 * Adjust copy_offset to the start of the range.
+			 */
+			copy_offset -= (vaddr - local_start);
+
+			vm_map_clip_start(map, entry, local_start);
+			vm_map_clip_end(map, entry, local_end);
+			if (entry->is_sub_map) {
+				/* unnesting was done when clipping */
+				assert(!entry->use_pmap);
+			}
+
+			/* substitute copy object for */
+			/* shared map entry           */
+			vm_map_deallocate(VME_SUBMAP(entry));
+			assert(!entry->iokit_acct);
+			entry->is_sub_map = FALSE;
+			entry->use_pmap = TRUE;
+			VME_OBJECT_SET(entry, copy_object);
+
+			/* propagate the submap entry's protections */
+			if (entry->protection != VM_PROT_READ) {
+				/*
+				 * Someone has already altered the top entry's
+				 * protections via vm_protect(VM_PROT_COPY).
+				 * Respect these new values and ignore the
+				 * submap entry's protections.
+				 */
+			} else {
+				/*
+				 * Regular copy-on-write: propagate the submap
+				 * entry's protections to the top map entry.
+				 */
+				entry->protection |= subentry_protection;
+			}
+			entry->max_protection |= subentry_max_protection;
+			/* propagate no_copy_on_read */
+			entry->vme_no_copy_on_read = subentry_no_copy_on_read;
+
+			if ((entry->protection & VM_PROT_WRITE) &&
+			    (entry->protection & VM_PROT_EXECUTE) &&
+#if !CONFIG_EMBEDDED
+			    map != kernel_map &&
+			    cs_process_enforcement(NULL) &&
+#endif /* !CONFIG_EMBEDDED */
+			    !(entry->used_for_jit)) {
+				DTRACE_VM3(cs_wx,
+				    uint64_t, (uint64_t)entry->vme_start,
+				    uint64_t, (uint64_t)entry->vme_end,
+				    vm_prot_t, entry->protection);
+				printf("CODE SIGNING: %d[%s] %s can't have both write and exec at the same time\n",
+				    proc_selfpid(),
+				    (current_task()->bsd_info
+				    ? proc_name_address(current_task()->bsd_info)
+				    : "?"),
+				    __FUNCTION__);
+				entry->protection &= ~VM_PROT_EXECUTE;
+			}
+
+			if (copied_slowly) {
+				VME_OFFSET_SET(entry, local_start - old_start);
+				entry->needs_copy = FALSE;
+				entry->is_shared = FALSE;
+			} else {
+				VME_OFFSET_SET(entry, copy_offset);
+				assert(entry->wired_count == 0);
+				entry->needs_copy = TRUE;
+				if (entry->inheritance == VM_INHERIT_SHARE) {
+					entry->inheritance = VM_INHERIT_COPY;
+				}
+				if (map != old_map) {
+					entry->is_shared = TRUE;
+				}
+			}
+			if (entry->inheritance == VM_INHERIT_SHARE) {
+				entry->inheritance = VM_INHERIT_COPY;
+			}
+
+			vm_map_lock_write_to_read(map);
+		} else {
+			if ((cow_sub_map_parent)
+			    && (cow_sub_map_parent != *real_map)
+			    && (cow_sub_map_parent != map)) {
+				vm_map_unlock(cow_sub_map_parent);
+			}
+			entry = submap_entry;
+			vaddr = local_vaddr;
+		}
+	}
+
+	/*
+	 *	Check whether this task is allowed to have
+	 *	this page.
+	 */
+
+	prot = entry->protection;
+
+	if (override_nx(old_map, VME_ALIAS(entry)) && prot) {
+		/*
+		 * HACK -- if not a stack, then allow execution
+		 */
+		prot |= VM_PROT_EXECUTE;
+	}
+
+	if (mask_protections) {
+		fault_type &= prot;
+		if (fault_type == VM_PROT_NONE) {
+			goto protection_failure;
+		}
+	}
+	if (((fault_type & prot) != fault_type)
+#if __arm64__
+	    /* prefetch abort in execute-only page */
+	    && !(prot == VM_PROT_EXECUTE && fault_type == (VM_PROT_READ | VM_PROT_EXECUTE))
+#endif
+	    ) {
+protection_failure:
+		if (*real_map != map) {
+			vm_map_unlock(*real_map);
+		}
+		*real_map = map;
+
+		if ((fault_type & VM_PROT_EXECUTE) && prot) {
+			log_stack_execution_failure((addr64_t)vaddr, prot);
+		}
+
+		DTRACE_VM2(prot_fault, int, 1, (uint64_t *), NULL);
+		return KERN_PROTECTION_FAILURE;
+	}
+
+	/*
+	 *	If this page is not pageable, we have to get
+	 *	it for all possible accesses.
+	 */
+
+	*wired = (entry->wired_count != 0);
+	if (*wired) {
+		fault_type = prot;
+	}
+
+	/*
+	 *	If the entry was copy-on-write, we either ...
+	 */
+
+	if (entry->needs_copy) {
+		/*
+		 *	If we want to write the page, we may as well
+		 *	handle that now since we've got the map locked.
+		 *
+		 *	If we don't need to write the page, we just
+		 *	demote the permissions allowed.
+		 */
+
+		if ((fault_type & VM_PROT_WRITE) || *wired || force_copy) {
+			/*
+			 *	Make a new object, and place it in the
+			 *	object chain.  Note that no new references
+			 *	have appeared -- one just moved from the
+			 *	map to the new object.
+			 */
+
+			if (vm_map_lock_read_to_write(map)) {
+				vm_map_lock_read(map);
+				goto RetryLookup;
+			}
+
+			if (VME_OBJECT(entry)->shadowed == FALSE) {
+				vm_object_lock(VME_OBJECT(entry));
+				VME_OBJECT(entry)->shadowed = TRUE;
+				vm_object_unlock(VME_OBJECT(entry));
+			}
+			VME_OBJECT_SHADOW(entry,
+			    (vm_map_size_t) (entry->vme_end -
+			    entry->vme_start));
+			entry->needs_copy = FALSE;
+
+			vm_map_lock_write_to_read(map);
+		}
+		if ((fault_type & VM_PROT_WRITE) == 0 && *wired == 0) {
+			/*
+			 *	We're attempting to read a copy-on-write
+			 *	page -- don't allow writes.
+			 */
+
+			prot &= (~VM_PROT_WRITE);
+		}
+	}
+
+	/*
+	 *	Create an object if necessary.
+	 */
+	if (VME_OBJECT(entry) == VM_OBJECT_NULL) {
+		if (vm_map_lock_read_to_write(map)) {
+			vm_map_lock_read(map);
+			goto RetryLookup;
+		}
+
+		VME_OBJECT_SET(entry,
+		    vm_object_allocate(
+			    (vm_map_size_t)(entry->vme_end -
+			    entry->vme_start)));
+		VME_OFFSET_SET(entry, 0);
+		assert(entry->use_pmap);
+		vm_map_lock_write_to_read(map);
+	}
+
+	/*
+	 *	Return the object/offset from this entry.  If the entry
+	 *	was copy-on-write or empty, it has been fixed up.  Also
+	 *	return the protection.
+	 */
+
+	*offset = (vaddr - entry->vme_start) + VME_OFFSET(entry);
+	*object = VME_OBJECT(entry);
+	*out_prot = prot;
+	KDBG_FILTERED(MACHDBG_CODE(DBG_MACH_WORKINGSET, VM_MAP_LOOKUP_OBJECT), VM_KERNEL_UNSLIDE_OR_PERM(*object), 0, 0, 0, 0);
+
+	if (fault_info) {
+		fault_info->interruptible = THREAD_UNINT; /* for now... */
+		/* ... the caller will change "interruptible" if needed */
+		fault_info->cluster_size = 0;
+		fault_info->user_tag = VME_ALIAS(entry);
+		fault_info->pmap_options = 0;
+		if (entry->iokit_acct ||
+		    (!entry->is_sub_map && !entry->use_pmap)) {
+			fault_info->pmap_options |= PMAP_OPTIONS_ALT_ACCT;
+		}
+		fault_info->behavior = entry->behavior;
+		fault_info->lo_offset = VME_OFFSET(entry);
+		fault_info->hi_offset =
+		    (entry->vme_end - entry->vme_start) + VME_OFFSET(entry);
+		fault_info->no_cache  = entry->no_cache;
+		fault_info->stealth = FALSE;
+		fault_info->io_sync = FALSE;
+		if (entry->used_for_jit ||
+		    entry->vme_resilient_codesign) {
+			fault_info->cs_bypass = TRUE;
+		} else {
+			fault_info->cs_bypass = FALSE;
+		}
+		fault_info->pmap_cs_associated = FALSE;
+#if CONFIG_PMAP_CS
+		if (entry->pmap_cs_associated) {
+			/*
+			 * The pmap layer will validate this page
+			 * before allowing it to be executed from.
+			 */
+			fault_info->pmap_cs_associated = TRUE;
+		}
+#endif /* CONFIG_PMAP_CS */
+		fault_info->mark_zf_absent = FALSE;
+		fault_info->batch_pmap_op = FALSE;
+		fault_info->resilient_media = entry->vme_resilient_media;
+		fault_info->no_copy_on_read = entry->vme_no_copy_on_read;
+	}
+
+	/*
+	 *	Lock the object to prevent it from disappearing
+	 */
+	if (object_lock_type == OBJECT_LOCK_EXCLUSIVE) {
+		vm_object_lock(*object);
+	} else {
+		vm_object_lock_shared(*object);
+	}
+
+	/*
+	 *	Save the version number
+	 */
+
+	out_version->main_timestamp = map->timestamp;
+
+	return KERN_SUCCESS;
+}
+
+
+/*
+ *	vm_map_verify:
+ *
+ *	Reports whether "map" is still at the version recorded in
+ *	"version", i.e. whether its timestamp still equals
+ *	"version->main_timestamp".  The caller must hold the map
+ *	lock ("shared" mode is fine); the lock is not touched here,
+ *	so the map is still locked on return.
+ */
+boolean_t
+vm_map_verify(
+	vm_map_t                map,
+	vm_map_version_t        *version)       /* REF */
+{
+	vm_map_lock_assert_held(map);
+
+	return map->timestamp == version->main_timestamp;
+}
+
+/*
+ *	TEMPORARYTEMPORARYTEMPORARYTEMPORARYTEMPORARYTEMPORARY
+ *	Goes away after regular vm_region_recurse function migrates to
+ *	64 bits
+ *	vm_region_recurse: A form of vm_region which follows the
+ *	submaps in a target map
+ *
+ */
+
+kern_return_t
+vm_map_region_recurse_64(
+	vm_map_t                 map,
+	vm_map_offset_t *address,               /* IN/OUT */
+	vm_map_size_t           *size,                  /* OUT */
+	natural_t               *nesting_depth, /* IN/OUT */
+	vm_region_submap_info_64_t      submap_info,    /* IN/OUT */
+	mach_msg_type_number_t  *count) /* IN/OUT */
+{
+	mach_msg_type_number_t  original_count;
+	vm_region_extended_info_data_t  extended;
+	vm_map_entry_t                  tmp_entry;
+	vm_map_offset_t                 user_address;
+	unsigned int                    user_max_depth;
+
+	/*
+	 * "curr_entry" is the VM map entry preceding or including the
+	 * address we're looking for.
+	 * "curr_map" is the map or sub-map containing "curr_entry".
+	 * "curr_address" is the equivalent of the top map's "user_address"
+	 * in the current map.
+	 * "curr_offset" is the cumulated offset of "curr_map" in the
+	 * target task's address space.
+	 * "curr_depth" is the depth of "curr_map" in the chain of
+	 * sub-maps.
+	 *
+	 * "curr_max_below" and "curr_max_above" limit the range (around
+	 * "curr_address") we should take into account in the current (sub)map.
+	 * They limit the range to what's visible through the map entries
+	 * we've traversed from the top map to the current map.
+	 *
+	 */
+	vm_map_entry_t                  curr_entry;
+	vm_map_address_t                curr_address;
+	vm_map_offset_t                 curr_offset;
+	vm_map_t                        curr_map;
+	unsigned int                    curr_depth;
+	vm_map_offset_t                 curr_max_below, curr_max_above;
+	vm_map_offset_t                 curr_skip;
+
+	/*
+	 * "next_" is the same as "curr_" but for the VM region immediately
+	 * after the address we're looking for.  We need to keep track of this
+	 * too because we want to return info about that region if the
+	 * address we're looking for is not mapped.
+	 */
+	vm_map_entry_t                  next_entry;
+	vm_map_offset_t                 next_offset;
+	vm_map_offset_t                 next_address;
+	vm_map_t                        next_map;
+	unsigned int                    next_depth;
+	vm_map_offset_t                 next_max_below, next_max_above;
+	vm_map_offset_t                 next_skip;
+
+	boolean_t                       look_for_pages;
+	vm_region_submap_short_info_64_t short_info;
+	boolean_t                       do_region_footprint;
+
+	if (map == VM_MAP_NULL) {
+		/* no address space to work on */
+		return KERN_INVALID_ARGUMENT;
+	}
+
+
+	if (*count < VM_REGION_SUBMAP_SHORT_INFO_COUNT_64) {
+		/*
+		 * "info" structure is not big enough and
+		 * would overflow
+		 */
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	do_region_footprint = task_self_region_footprint();
+	original_count = *count;
+
+	if (original_count < VM_REGION_SUBMAP_INFO_V0_COUNT_64) {
+		*count = VM_REGION_SUBMAP_SHORT_INFO_COUNT_64;
+		look_for_pages = FALSE;
+		short_info = (vm_region_submap_short_info_64_t) submap_info;
+		submap_info = NULL;
+	} else {
+		look_for_pages = TRUE;
+		*count = VM_REGION_SUBMAP_INFO_V0_COUNT_64;
+		short_info = NULL;
+
+		if (original_count >= VM_REGION_SUBMAP_INFO_V1_COUNT_64) {
+			*count = VM_REGION_SUBMAP_INFO_V1_COUNT_64;
+		}
+		if (original_count >= VM_REGION_SUBMAP_INFO_V2_COUNT_64) {
+			*count = VM_REGION_SUBMAP_INFO_V2_COUNT_64;
+		}
+	}
+
+	user_address = *address;
+	user_max_depth = *nesting_depth;
+
+	if (not_in_kdp) {
+		vm_map_lock_read(map);
+	}
+
+recurse_again:
+	curr_entry = NULL;
+	curr_map = map;
+	curr_address = user_address;
+	curr_offset = 0;
+	curr_skip = 0;
+	curr_depth = 0;
+	curr_max_above = ((vm_map_offset_t) -1) - curr_address;
+	curr_max_below = curr_address;
+
+	next_entry = NULL;
+	next_map = NULL;
+	next_address = 0;
+	next_offset = 0;
+	next_skip = 0;
+	next_depth = 0;
+	next_max_above = (vm_map_offset_t) -1;
+	next_max_below = (vm_map_offset_t) -1;
+
+	for (;;) {
+		if (vm_map_lookup_entry(curr_map,
+		    curr_address,
+		    &tmp_entry)) {
+			/* tmp_entry contains the address we're looking for */
+			curr_entry = tmp_entry;
+		} else {
+			vm_map_offset_t skip;
+			/*
+			 * The address is not mapped.  "tmp_entry" is the
+			 * map entry preceding the address.  We want the next
+			 * one, if it exists.
+			 */
+			curr_entry = tmp_entry->vme_next;
+
+			if (curr_entry == vm_map_to_entry(curr_map) ||
+			    (curr_entry->vme_start >=
+			    curr_address + curr_max_above)) {
+				/* no next entry at this level: stop looking */
+				if (not_in_kdp) {
+					vm_map_unlock_read(curr_map);
+				}
+				curr_entry = NULL;
+				curr_map = NULL;
+				curr_skip = 0;
+				curr_offset = 0;
+				curr_depth = 0;
+				curr_max_above = 0;
+				curr_max_below = 0;
+				break;
+			}
+
+			/* adjust current address and offset */
+			skip = curr_entry->vme_start - curr_address;
+			curr_address = curr_entry->vme_start;
+			curr_skip += skip;
+			curr_offset += skip;
+			curr_max_above -= skip;
+			curr_max_below = 0;
+		}
+
+		/*
+		 * Is the next entry at this level closer to the address (or
+		 * deeper in the submap chain) than the one we had
+		 * so far ?
+		 */
+		tmp_entry = curr_entry->vme_next;
+		if (tmp_entry == vm_map_to_entry(curr_map)) {
+			/* no next entry at this level */
+		} else if (tmp_entry->vme_start >=
+		    curr_address + curr_max_above) {
+			/*
+			 * tmp_entry is beyond the scope of what we mapped of
+			 * this submap in the upper level: ignore it.
+			 */
+		} else if ((next_entry == NULL) ||
+		    (tmp_entry->vme_start + curr_offset <=
+		    next_entry->vme_start + next_offset)) {
+			/*
+			 * We didn't have a "next_entry" or this one is
+			 * closer to the address we're looking for:
+			 * use this "tmp_entry" as the new "next_entry".
+			 */
+			if (next_entry != NULL) {
+				/* unlock the last "next_map" */
+				if (next_map != curr_map && not_in_kdp) {
+					vm_map_unlock_read(next_map);
+				}
+			}
+			next_entry = tmp_entry;
+			next_map = curr_map;
+			next_depth = curr_depth;
+			next_address = next_entry->vme_start;
+			next_skip = curr_skip;
+			next_skip += (next_address - curr_address);
+			next_offset = curr_offset;
+			next_offset += (next_address - curr_address);
+			next_max_above = MIN(next_max_above, curr_max_above);
+			next_max_above = MIN(next_max_above,
+			    next_entry->vme_end - next_address);
+			next_max_below = MIN(next_max_below, curr_max_below);
+			next_max_below = MIN(next_max_below,
+			    next_address - next_entry->vme_start);
+		}
+
+		/*
+		 * "curr_max_{above,below}" allow us to keep track of the
+		 * portion of the submap that is actually mapped at this level:
+		 * the rest of that submap is irrelevant to us, since it's not
+		 * mapped here.
+		 * The relevant portion of the map starts at
+		 * "VME_OFFSET(curr_entry)" up to the size of "curr_entry".
+		 */
+		curr_max_above = MIN(curr_max_above,
+		    curr_entry->vme_end - curr_address);
+		curr_max_below = MIN(curr_max_below,
+		    curr_address - curr_entry->vme_start);
+
+		if (!curr_entry->is_sub_map ||
+		    curr_depth >= user_max_depth) {
+			/*
+			 * We hit a leaf map or we reached the maximum depth
+			 * we could, so stop looking.  Keep the current map
+			 * locked.
+			 */
+			break;
+		}
+
+		/*
+		 * Get down to the next submap level.
+		 */
+
+		/*
+		 * Lock the next level and unlock the current level,
+		 * unless we need to keep it locked to access the "next_entry"
+		 * later.
+		 */
+		if (not_in_kdp) {
+			vm_map_lock_read(VME_SUBMAP(curr_entry));
+		}
+		if (curr_map == next_map) {
+			/* keep "next_map" locked in case we need it */
+		} else {
+			/* release this map */
+			if (not_in_kdp) {
+				vm_map_unlock_read(curr_map);
+			}
+		}
+
+		/*
+		 * Adjust the offset.  "curr_entry" maps the submap
+		 * at relative address "curr_entry->vme_start" in the
+		 * curr_map but skips the first "VME_OFFSET(curr_entry)"
+		 * bytes of the submap.
+		 * "curr_offset" always represents the offset of a virtual
+		 * address in the curr_map relative to the absolute address
+		 * space (i.e. the top-level VM map).
+		 */
+		curr_offset +=
+		    (VME_OFFSET(curr_entry) - curr_entry->vme_start);
+		curr_address = user_address + curr_offset;
+		/* switch to the submap */
+		curr_map = VME_SUBMAP(curr_entry);
+		curr_depth++;
+		curr_entry = NULL;
+	}
+
+// LP64todo: all the current tools are 32bit, obviously never worked for 64b
+// so probably should be a real 32b ID vs. ptr.
+// Current users just check for equality
+
+	if (curr_entry == NULL) {
+		/* no VM region contains the address... */
+
+		if (do_region_footprint && /* we want footprint numbers */
+		    next_entry == NULL && /* & there are no more regions */
+		    /* & we haven't already provided our fake region: */
+		    user_address <= vm_map_last_entry(map)->vme_end) {
+			ledger_amount_t ledger_resident, ledger_compressed;
+
+			/*
+			 * Add a fake memory region to account for
+			 * purgeable and/or ledger-tagged memory that
+			 * counts towards this task's memory footprint,
+			 * i.e. the resident/compressed pages of non-volatile
+			 * objects owned by that task.
+			 */
+			task_ledgers_footprint(map->pmap->ledger,
+			    &ledger_resident,
+			    &ledger_compressed);
+			if (ledger_resident + ledger_compressed == 0) {
+				/* no purgeable memory usage to report */
+				return KERN_INVALID_ADDRESS;
+			}
+			/* fake region to show nonvolatile footprint */
+			if (look_for_pages) {
+				submap_info->protection = VM_PROT_DEFAULT;
+				submap_info->max_protection = VM_PROT_DEFAULT;
+				submap_info->inheritance = VM_INHERIT_DEFAULT;
+				submap_info->offset = 0;
+				submap_info->user_tag = -1;
+				submap_info->pages_resident = (unsigned int) (ledger_resident / PAGE_SIZE);
+				submap_info->pages_shared_now_private = 0;
+				submap_info->pages_swapped_out = (unsigned int) (ledger_compressed / PAGE_SIZE);
+				submap_info->pages_dirtied = submap_info->pages_resident;
+				submap_info->ref_count = 1;
+				submap_info->shadow_depth = 0;
+				submap_info->external_pager = 0;
+				submap_info->share_mode = SM_PRIVATE;
+				submap_info->is_submap = 0;
+				submap_info->behavior = VM_BEHAVIOR_DEFAULT;
+				submap_info->object_id = INFO_MAKE_FAKE_OBJECT_ID(map, task_ledgers.purgeable_nonvolatile);
+				submap_info->user_wired_count = 0;
+				submap_info->pages_reusable = 0;
+			} else {
+				short_info->user_tag = -1;
+				short_info->offset = 0;
+				short_info->protection = VM_PROT_DEFAULT;
+				short_info->inheritance = VM_INHERIT_DEFAULT;
+				short_info->max_protection = VM_PROT_DEFAULT;
+				short_info->behavior = VM_BEHAVIOR_DEFAULT;
+				short_info->user_wired_count = 0;
+				short_info->is_submap = 0;
+				short_info->object_id = INFO_MAKE_FAKE_OBJECT_ID(map, task_ledgers.purgeable_nonvolatile);
+				short_info->external_pager = 0;
+				short_info->shadow_depth = 0;
+				short_info->share_mode = SM_PRIVATE;
+				short_info->ref_count = 1;
+			}
+			*nesting_depth = 0;
+			*size = (vm_map_size_t) (ledger_resident + ledger_compressed);
+//			*address = user_address;
+			*address = vm_map_last_entry(map)->vme_end;
+			return KERN_SUCCESS;
+		}
+
+		if (next_entry == NULL) {
+			/* ... and no VM region follows it either */
+			return KERN_INVALID_ADDRESS;
+		}
+		/* ... gather info about the next VM region */
+		curr_entry = next_entry;
+		curr_map = next_map;    /* still locked ... */
+		curr_address = next_address;
+		curr_skip = next_skip;
+		curr_offset = next_offset;
+		curr_depth = next_depth;
+		curr_max_above = next_max_above;
+		curr_max_below = next_max_below;
+	} else {
+		/* we won't need "next_entry" after all */
+		if (next_entry != NULL) {
+			/* release "next_map" */
+			if (next_map != curr_map && not_in_kdp) {
+				vm_map_unlock_read(next_map);
+			}
+		}
+	}
+	next_entry = NULL;
+	next_map = NULL;
+	next_offset = 0;
+	next_skip = 0;
+	next_depth = 0;
+	next_max_below = -1;
+	next_max_above = -1;
+
+	if (curr_entry->is_sub_map &&
+	    curr_depth < user_max_depth) {
+		/*
+		 * We're not as deep as we could be:  we must have
+		 * gone back up after not finding anything mapped
+		 * below the original top-level map entry's.
+		 * Let's move "curr_address" forward and recurse again.
+		 */
+		user_address = curr_address;
+		goto recurse_again;
+	}
+
+	*nesting_depth = curr_depth;
+	*size = curr_max_above + curr_max_below;
+	*address = user_address + curr_skip - curr_max_below;
+
+// LP64todo: all the current tools are 32bit, obviously never worked for 64b
+// so probably should be a real 32b ID vs. ptr.
+// Current users just check for equality
+#define INFO_MAKE_OBJECT_ID(p)  ((uint32_t)(uintptr_t)VM_KERNEL_ADDRPERM(p))
+
+	if (look_for_pages) {
+		submap_info->user_tag = VME_ALIAS(curr_entry);
+		submap_info->offset = VME_OFFSET(curr_entry);
+		submap_info->protection = curr_entry->protection;
+		submap_info->inheritance = curr_entry->inheritance;
+		submap_info->max_protection = curr_entry->max_protection;
+		submap_info->behavior = curr_entry->behavior;
+		submap_info->user_wired_count = curr_entry->user_wired_count;
+		submap_info->is_submap = curr_entry->is_sub_map;
+		submap_info->object_id = INFO_MAKE_OBJECT_ID(VME_OBJECT(curr_entry));
+	} else {
+		short_info->user_tag = VME_ALIAS(curr_entry);
+		short_info->offset = VME_OFFSET(curr_entry);
+		short_info->protection = curr_entry->protection;
+		short_info->inheritance = curr_entry->inheritance;
+		short_info->max_protection = curr_entry->max_protection;
+		short_info->behavior = curr_entry->behavior;
+		short_info->user_wired_count = curr_entry->user_wired_count;
+		short_info->is_submap = curr_entry->is_sub_map;
+		short_info->object_id = INFO_MAKE_OBJECT_ID(VME_OBJECT(curr_entry));
+	}
+
+	extended.pages_resident = 0;
+	extended.pages_swapped_out = 0;
+	extended.pages_shared_now_private = 0;
+	extended.pages_dirtied = 0;
+	extended.pages_reusable = 0;
+	extended.external_pager = 0;
+	extended.shadow_depth = 0;
+	extended.share_mode = SM_EMPTY;
+	extended.ref_count = 0;
+
+	if (not_in_kdp) {
+		if (!curr_entry->is_sub_map) {
+			vm_map_offset_t range_start, range_end;
+			range_start = MAX((curr_address - curr_max_below),
+			    curr_entry->vme_start);
+			range_end = MIN((curr_address + curr_max_above),
+			    curr_entry->vme_end);
+			vm_map_region_walk(curr_map,
+			    range_start,
+			    curr_entry,
+			    (VME_OFFSET(curr_entry) +
+			    (range_start -
+			    curr_entry->vme_start)),
+			    range_end - range_start,
+			    &extended,
+			    look_for_pages, VM_REGION_EXTENDED_INFO_COUNT);
+			if (extended.external_pager &&
+			    extended.ref_count == 2 &&
+			    extended.share_mode == SM_SHARED) {
+				extended.share_mode = SM_PRIVATE;
+			}
+		} else {
+			if (curr_entry->use_pmap) {
+				extended.share_mode = SM_TRUESHARED;
+			} else {
+				extended.share_mode = SM_PRIVATE;
+			}
+			extended.ref_count = os_ref_get_count(&VME_SUBMAP(curr_entry)->map_refcnt);
+		}
+	}
+
+	if (look_for_pages) {
+		submap_info->pages_resident = extended.pages_resident;
+		submap_info->pages_swapped_out = extended.pages_swapped_out;
+		submap_info->pages_shared_now_private =
+		    extended.pages_shared_now_private;
+		submap_info->pages_dirtied = extended.pages_dirtied;
+		submap_info->external_pager = extended.external_pager;
+		submap_info->shadow_depth = extended.shadow_depth;
+		submap_info->share_mode = extended.share_mode;
+		submap_info->ref_count = extended.ref_count;
+
+		if (original_count >= VM_REGION_SUBMAP_INFO_V1_COUNT_64) {
+			submap_info->pages_reusable = extended.pages_reusable;
+		}
+		if (original_count >= VM_REGION_SUBMAP_INFO_V2_COUNT_64) {
+			submap_info->object_id_full = (vm_object_id_t) (VME_OBJECT(curr_entry) != NULL) ? VM_KERNEL_ADDRPERM(VME_OBJECT(curr_entry)) : 0ULL;
+		}
+	} else {
+		short_info->external_pager = extended.external_pager;
+		short_info->shadow_depth = extended.shadow_depth;
+		short_info->share_mode = extended.share_mode;
+		short_info->ref_count = extended.ref_count;
+	}
+
+	if (not_in_kdp) {
+		vm_map_unlock_read(curr_map);
+	}
+
+	return KERN_SUCCESS;
+}
+
+/*
+ *	vm_map_region_find_entry:
+ *
+ *	Helper for vm_map_region().  Returns the map entry that contains
+ *	"start" or, when "start" is not mapped, the first entry that
+ *	follows it.  Returns NULL when there is no such entry (i.e. the
+ *	next entry is the map header).
+ *
+ *	vm_map_region() calls this with the map locked for read; the lock
+ *	is neither taken nor released here.
+ */
+static vm_map_entry_t
+vm_map_region_find_entry(
+	vm_map_t                map,
+	vm_map_offset_t         start)
+{
+	vm_map_entry_t          entry;
+
+	if (vm_map_lookup_entry(map, start, &entry)) {
+		/* "start" is mapped by "entry" */
+		return entry;
+	}
+
+	/* "start" is not mapped: report on the next entry, if any */
+	entry = entry->vme_next;
+	if (entry == vm_map_to_entry(map)) {
+		return NULL;
+	}
+	return entry;
+}
+
+/*
+ *	vm_map_region:
+ *
+ *	User call to obtain information about a region in
+ *	a task's address map.  The flavors handled are
+ *	VM_REGION_BASIC_INFO, VM_REGION_BASIC_INFO_64,
+ *	VM_REGION_EXTENDED_INFO (and its "__legacy" variant) and
+ *	VM_REGION_TOP_INFO.
+ *
+ *	address		IN: address to look up.
+ *			OUT: start of the map entry that was found, which is
+ *			the entry containing the address or, failing that,
+ *			the next entry in the map.
+ *	size		OUT: size of that map entry.
+ *	info		OUT: flavor-specific information structure.
+ *	count		IN: size of "info"; must be at least the count
+ *			required by the flavor.
+ *			OUT: the count for the flavor.
+ *	object_name	OUT: set to IP_NULL when non-NULL.
+ *
+ *	Returns KERN_INVALID_ARGUMENT for a null map, an unknown flavor or
+ *	a "count" that is too small, KERN_INVALID_ADDRESS when no entry
+ *	exists at or after "*address", and KERN_SUCCESS otherwise.
+ *
+ *	XXX The reserved and behavior fields cannot be filled
+ *	    in until the vm merge from the IK is completed, and
+ *	    vm_reserve is implemented.
+ */
+
+kern_return_t
+vm_map_region(
+	vm_map_t                 map,
+	vm_map_offset_t *address,               /* IN/OUT */
+	vm_map_size_t           *size,                  /* OUT */
+	vm_region_flavor_t       flavor,                /* IN */
+	vm_region_info_t         info,                  /* OUT */
+	mach_msg_type_number_t  *count, /* IN/OUT */
+	mach_port_t             *object_name)           /* OUT */
+{
+	vm_map_entry_t          entry;
+	vm_map_offset_t         start;
+
+	if (map == VM_MAP_NULL) {
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	switch (flavor) {
+	case VM_REGION_BASIC_INFO:
+		/* legacy for old 32-bit objects info */
+	{
+		vm_region_basic_info_t  basic;
+
+		if (*count < VM_REGION_BASIC_INFO_COUNT) {
+			return KERN_INVALID_ARGUMENT;
+		}
+
+		basic = (vm_region_basic_info_t) info;
+		*count = VM_REGION_BASIC_INFO_COUNT;
+
+		vm_map_lock_read(map);
+
+		entry = vm_map_region_find_entry(map, *address);
+		if (entry == NULL) {
+			vm_map_unlock_read(map);
+			return KERN_INVALID_ADDRESS;
+		}
+
+		start = entry->vme_start;
+
+		/* the legacy structure only has room for a 32-bit offset */
+		basic->offset = (uint32_t)VME_OFFSET(entry);
+		basic->protection = entry->protection;
+		basic->inheritance = entry->inheritance;
+		basic->max_protection = entry->max_protection;
+		basic->behavior = entry->behavior;
+		basic->user_wired_count = entry->user_wired_count;
+		basic->reserved = entry->is_sub_map;
+		*address = start;
+		*size = (entry->vme_end - start);
+
+		if (object_name) {
+			*object_name = IP_NULL;
+		}
+		if (entry->is_sub_map) {
+			basic->shared = FALSE;
+		} else {
+			basic->shared = entry->is_shared;
+		}
+
+		vm_map_unlock_read(map);
+		return KERN_SUCCESS;
+	}
+
+	case VM_REGION_BASIC_INFO_64:
+	{
+		vm_region_basic_info_64_t       basic;
+
+		if (*count < VM_REGION_BASIC_INFO_COUNT_64) {
+			return KERN_INVALID_ARGUMENT;
+		}
+
+		basic = (vm_region_basic_info_64_t) info;
+		*count = VM_REGION_BASIC_INFO_COUNT_64;
+
+		vm_map_lock_read(map);
+
+		entry = vm_map_region_find_entry(map, *address);
+		if (entry == NULL) {
+			vm_map_unlock_read(map);
+			return KERN_INVALID_ADDRESS;
+		}
+
+		start = entry->vme_start;
+
+		basic->offset = VME_OFFSET(entry);
+		basic->protection = entry->protection;
+		basic->inheritance = entry->inheritance;
+		basic->max_protection = entry->max_protection;
+		basic->behavior = entry->behavior;
+		basic->user_wired_count = entry->user_wired_count;
+		basic->reserved = entry->is_sub_map;
+		*address = start;
+		*size = (entry->vme_end - start);
+
+		if (object_name) {
+			*object_name = IP_NULL;
+		}
+		if (entry->is_sub_map) {
+			basic->shared = FALSE;
+		} else {
+			basic->shared = entry->is_shared;
+		}
+
+		vm_map_unlock_read(map);
+		return KERN_SUCCESS;
+	}
+	case VM_REGION_EXTENDED_INFO:
+		if (*count < VM_REGION_EXTENDED_INFO_COUNT) {
+			return KERN_INVALID_ARGUMENT;
+		}
+	/*fallthru*/
+	case VM_REGION_EXTENDED_INFO__legacy:
+		if (*count < VM_REGION_EXTENDED_INFO_COUNT__legacy) {
+			return KERN_INVALID_ARGUMENT;
+		}
+
+		{
+			vm_region_extended_info_t       extended;
+
+			extended = (vm_region_extended_info_t) info;
+
+			vm_map_lock_read(map);
+
+			entry = vm_map_region_find_entry(map, *address);
+			if (entry == NULL) {
+				vm_map_unlock_read(map);
+				return KERN_INVALID_ADDRESS;
+			}
+			start = entry->vme_start;
+
+			/*
+			 * vm_map_region_walk() increments the page counters,
+			 * so they have to start from zero.
+			 */
+			extended->protection = entry->protection;
+			extended->user_tag = VME_ALIAS(entry);
+			extended->pages_resident = 0;
+			extended->pages_swapped_out = 0;
+			extended->pages_shared_now_private = 0;
+			extended->pages_dirtied = 0;
+			extended->external_pager = 0;
+			extended->shadow_depth = 0;
+
+			if (flavor == VM_REGION_EXTENDED_INFO__legacy) {
+				*count = VM_REGION_EXTENDED_INFO_COUNT__legacy;
+			} else {
+				/* "pages_reusable" is only reset for the non-legacy flavor */
+				extended->pages_reusable = 0;
+				*count = VM_REGION_EXTENDED_INFO_COUNT;
+			}
+
+			vm_map_region_walk(map, start, entry, VME_OFFSET(entry), entry->vme_end - start, extended, TRUE, *count);
+
+			if (extended->external_pager && extended->ref_count == 2 && extended->share_mode == SM_SHARED) {
+				extended->share_mode = SM_PRIVATE;
+			}
+
+			if (object_name) {
+				*object_name = IP_NULL;
+			}
+			*address = start;
+			*size = (entry->vme_end - start);
+
+			vm_map_unlock_read(map);
+			return KERN_SUCCESS;
+		}
+	case VM_REGION_TOP_INFO:
+	{
+		vm_region_top_info_t    top;
+
+		if (*count < VM_REGION_TOP_INFO_COUNT) {
+			return KERN_INVALID_ARGUMENT;
+		}
+
+		top = (vm_region_top_info_t) info;
+		*count = VM_REGION_TOP_INFO_COUNT;
+
+		vm_map_lock_read(map);
+
+		entry = vm_map_region_find_entry(map, *address);
+		if (entry == NULL) {
+			vm_map_unlock_read(map);
+			return KERN_INVALID_ADDRESS;
+		}
+		start = entry->vme_start;
+
+		/* vm_map_region_top_walk() only sets one of these two */
+		top->private_pages_resident = 0;
+		top->shared_pages_resident = 0;
+
+		vm_map_region_top_walk(entry, top);
+
+		if (object_name) {
+			*object_name = IP_NULL;
+		}
+		*address = start;
+		*size = (entry->vme_end - start);
+
+		vm_map_unlock_read(map);
+		return KERN_SUCCESS;
+	}
+	default:
+		return KERN_INVALID_ARGUMENT;
+	}
+}
+
+/*
+ * OBJ_RESIDENT_COUNT:
+ *	Resident-page figure to report for "obj", capped at "entry_size"
+ *	(vm_map_region_top_walk() passes the entry's size in pages).
+ *	When the object is flagged "all_reusable" the figure is its
+ *	wired_page_count; otherwise it is resident_page_count minus
+ *	reusable_page_count.
+ *	"obj" is evaluated more than once, so it must not have side effects.
+ */
+#define OBJ_RESIDENT_COUNT(obj, entry_size)                             \
+	MIN((entry_size),                                               \
+	    ((obj)->all_reusable ?                                      \
+	     (obj)->wired_page_count :                                  \
+	     (obj)->resident_page_count - (obj)->reusable_page_count))
+
+/*
+ *	vm_map_region_top_walk:
+ *
+ *	Fill in the share mode, reference count, object id and resident
+ *	page counts of "top" for the VM object mapped by "entry".
+ *	Entries with no object, and submap entries, are reported as
+ *	SM_EMPTY.  The resident page counters are only assigned or added
+ *	to here; vm_map_region() zeroes them before calling.
+ */
+void
+vm_map_region_top_walk(
+	vm_map_entry_t             entry,
+	vm_region_top_info_t       top)
+{
+	struct vm_object        *cur;
+	struct vm_object        *below;
+	int                     refs;
+	uint32_t                npages;
+
+	if (VME_OBJECT(entry) == 0 || entry->is_sub_map) {
+		top->share_mode = SM_EMPTY;
+		top->ref_count = 0;
+		top->obj_id = 0;
+		return;
+	}
+
+	/* size of the entry, in pages */
+	npages = (uint32_t) ((entry->vme_end - entry->vme_start) / PAGE_SIZE_64);
+
+	cur = VME_OBJECT(entry);
+	vm_object_lock(cur);
+
+	/* discount one reference while paging is in progress */
+	refs = cur->ref_count;
+	if (refs > 1 && cur->paging_in_progress) {
+		refs--;
+	}
+
+	assert(cur->reusable_page_count <= cur->resident_page_count);
+
+	/* every case below starts from the top object's reference count */
+	top->ref_count = refs;
+
+	if (cur->shadow) {
+		top->share_mode = SM_COW;
+		if (refs == 1) {
+			top->private_pages_resident =
+			    OBJ_RESIDENT_COUNT(cur, npages);
+		} else {
+			top->shared_pages_resident =
+			    OBJ_RESIDENT_COUNT(cur, npages);
+		}
+
+		/*
+		 * Walk down the shadow chain, locking the next object
+		 * before releasing the current one.
+		 */
+		while ((below = cur->shadow) != VM_OBJECT_NULL) {
+			vm_object_lock(below);
+			vm_object_unlock(cur);
+			cur = below;
+
+			refs = cur->ref_count;
+			if (refs > 1 && cur->paging_in_progress) {
+				refs--;
+			}
+
+			assert(cur->reusable_page_count <= cur->resident_page_count);
+			top->shared_pages_resident +=
+			    OBJ_RESIDENT_COUNT(cur, npages);
+			top->ref_count += refs - 1;
+		}
+	} else if (entry->superpage_size) {
+		top->share_mode = SM_LARGE_PAGE;
+		top->shared_pages_resident = 0;
+		top->private_pages_resident = npages;
+	} else if (entry->needs_copy) {
+		top->share_mode = SM_COW;
+		top->shared_pages_resident = OBJ_RESIDENT_COUNT(cur, npages);
+	} else if (refs == 1 || (refs == 2 && cur->named)) {
+		top->share_mode = SM_PRIVATE;
+		top->private_pages_resident = OBJ_RESIDENT_COUNT(cur, npages);
+	} else {
+		top->share_mode = SM_SHARED;
+		top->shared_pages_resident = OBJ_RESIDENT_COUNT(cur, npages);
+	}
+
+	/* XXX K64: obj_id will be truncated */
+	top->obj_id = (unsigned int) (uintptr_t)VM_KERNEL_ADDRPERM(cur);
+
+	vm_object_unlock(cur);
+}
+
+/*
+ *	vm_map_region_walk:
+ *
+ *	Fill in "extended" (page counts, shadow depth, external pager flag,
+ *	share mode and reference count) for the "range" bytes of "entry"
+ *	that start at map address "va", i.e. at offset "offset" in the
+ *	entry's VM object.
+ *
+ *	When "look_for_pages" is set every page of the range is examined:
+ *	through the pmap (or the data saved for a corpse) when
+ *	task_self_region_footprint() is set, through
+ *	vm_map_region_look_for_page() otherwise.  When it is not set only
+ *	the shadow chain is walked.  "count" is handed through to
+ *	vm_map_region_look_for_page().
+ *
+ *	The page counters of "extended" are only incremented here; the
+ *	callers in this file zero them beforehand.  Those callers also hold
+ *	the map locked for read across the call.
+ */
+void
+vm_map_region_walk(
+	vm_map_t                        map,
+	vm_map_offset_t                 va,
+	vm_map_entry_t                  entry,
+	vm_object_offset_t              offset,
+	vm_object_size_t                range,
+	vm_region_extended_info_t       extended,
+	boolean_t                       look_for_pages,
+	mach_msg_type_number_t count)
+{
+	struct vm_object *obj, *tmp_obj;
+	vm_map_offset_t       last_offset;
+	int               i;
+	int               ref_count;
+	struct vm_object        *shadow_object;
+	int                     shadow_depth;
+	boolean_t         do_region_footprint;
+
+	do_region_footprint = task_self_region_footprint();
+
+	/*
+	 * Nothing to report for an entry without an object, a submap
+	 * entry, or a physically contiguous object that is not a superpage
+	 * mapping.
+	 */
+	if ((VME_OBJECT(entry) == 0) ||
+	    (entry->is_sub_map) ||
+	    (VME_OBJECT(entry)->phys_contiguous &&
+	    !entry->superpage_size)) {
+		extended->share_mode = SM_EMPTY;
+		extended->ref_count = 0;
+		return;
+	}
+
+	/* superpage mappings are reported as fully resident */
+	if (entry->superpage_size) {
+		extended->shadow_depth = 0;
+		extended->share_mode = SM_LARGE_PAGE;
+		extended->ref_count = 1;
+		extended->external_pager = 0;
+		extended->pages_resident = (unsigned int)(range >> PAGE_SHIFT);
+		extended->shadow_depth = 0;
+		return;
+	}
+
+	obj = VME_OBJECT(entry);
+
+	vm_object_lock(obj);
+
+	/* discount one reference while paging is in progress */
+	if ((ref_count = obj->ref_count) > 1 && obj->paging_in_progress) {
+		ref_count--;
+	}
+
+	if (look_for_pages) {
+		/* examine the range one page at a time */
+		for (last_offset = offset + range;
+		    offset < last_offset;
+		    offset += PAGE_SIZE_64, va += PAGE_SIZE) {
+			if (do_region_footprint) {
+				int disp;
+
+				disp = 0;
+				if (map->has_corpse_footprint) {
+					/*
+					 * Query the page info data we saved
+					 * while forking the corpse.
+					 */
+					vm_map_corpse_footprint_query_page_info(
+						map,
+						va,
+						&disp);
+				} else {
+					/*
+					 * Query the pmap.
+					 */
+					pmap_query_page_info(map->pmap,
+					    va,
+					    &disp);
+				}
+				if (disp & PMAP_QUERY_PAGE_PRESENT) {
+					if (!(disp & PMAP_QUERY_PAGE_ALTACCT)) {
+						extended->pages_resident++;
+					}
+					if (disp & PMAP_QUERY_PAGE_REUSABLE) {
+						extended->pages_reusable++;
+					} else if (!(disp & PMAP_QUERY_PAGE_INTERNAL) ||
+					    (disp & PMAP_QUERY_PAGE_ALTACCT)) {
+						/* alternate accounting */
+					} else {
+						extended->pages_dirtied++;
+					}
+				} else if (disp & PMAP_QUERY_PAGE_COMPRESSED) {
+					if (disp & PMAP_QUERY_PAGE_COMPRESSED_ALTACCT) {
+						/* alternate accounting */
+					} else {
+						extended->pages_swapped_out++;
+					}
+				}
+				/* deal with alternate accounting */
+				if (obj->purgable == VM_PURGABLE_NONVOLATILE &&
+				    /* && not tagged as no-footprint? */
+				    VM_OBJECT_OWNER(obj) != NULL &&
+				    VM_OBJECT_OWNER(obj)->map == map) {
+					if ((((va
+					    - entry->vme_start
+					    + VME_OFFSET(entry))
+					    / PAGE_SIZE) <
+					    (obj->resident_page_count +
+					    vm_compressor_pager_get_count(obj->pager)))) {
+						/*
+						 * Non-volatile purgeable object owned
+						 * by this task: report the first
+						 * "#resident + #compressed" pages as
+						 * "resident" (to show that they
+						 * contribute to the footprint) but not
+						 * "dirty" (to avoid double-counting
+						 * with the fake "non-volatile" region
+						 * we'll report at the end of the
+						 * address space to account for all
+						 * (mapped or not) non-volatile memory
+						 * owned by this task.
+						 */
+						extended->pages_resident++;
+					}
+				} else if ((obj->purgable == VM_PURGABLE_VOLATILE ||
+				    obj->purgable == VM_PURGABLE_EMPTY) &&
+				    /* && not tagged as no-footprint? */
+				    VM_OBJECT_OWNER(obj) != NULL &&
+				    VM_OBJECT_OWNER(obj)->map == map) {
+					if ((((va
+					    - entry->vme_start
+					    + VME_OFFSET(entry))
+					    / PAGE_SIZE) <
+					    obj->wired_page_count)) {
+						/*
+						 * Volatile|empty purgeable object owned
+						 * by this task: report the first
+						 * "#wired" pages as "resident" (to
+						 * show that they contribute to the
+						 * footprint) but not "dirty" (to avoid
+						 * double-counting with the fake
+						 * "non-volatile" region we'll report
+						 * at the end of the address space to
+						 * account for all (mapped or not)
+						 * non-volatile memory owned by this
+						 * task.
+						 */
+						extended->pages_resident++;
+					}
+				} else if (obj->purgable != VM_PURGABLE_DENY) {
+					/*
+					 * Pages from purgeable objects
+					 * will be reported as dirty
+					 * appropriately in an extra
+					 * fake memory region at the end of
+					 * the address space.
+					 */
+				} else if (entry->iokit_acct) {
+					/*
+					 * IOKit mappings are considered
+					 * as fully dirty for footprint's
+					 * sake.
+					 */
+					extended->pages_dirtied++;
+				}
+				/* footprint mode never looks at the VM object's pages */
+				continue;
+			}
+
+			vm_map_region_look_for_page(map, va, obj,
+			    offset, ref_count,
+			    0, extended, count);
+		}
+
+		/*
+		 * In footprint mode vm_map_region_look_for_page() was not
+		 * called, so "shadow_depth" and "external_pager" have not
+		 * been updated: jump into the branch below to collect them.
+		 */
+		if (do_region_footprint) {
+			goto collect_object_info;
+		}
+	} else {
+collect_object_info:
+		shadow_object = obj->shadow;
+		shadow_depth = 0;
+
+		if (!(obj->internal)) {
+			extended->external_pager = 1;
+		}
+
+		/*
+		 * Count the objects in the shadow chain, locking the next
+		 * object before unlocking the current one.  "obj" itself
+		 * stays locked throughout.
+		 */
+		if (shadow_object != VM_OBJECT_NULL) {
+			vm_object_lock(shadow_object);
+			for (;
+			    shadow_object != VM_OBJECT_NULL;
+			    shadow_depth++) {
+				vm_object_t     next_shadow;
+
+				if (!(shadow_object->internal)) {
+					extended->external_pager = 1;
+				}
+
+				next_shadow = shadow_object->shadow;
+				if (next_shadow) {
+					vm_object_lock(next_shadow);
+				}
+				vm_object_unlock(shadow_object);
+				shadow_object = next_shadow;
+			}
+		}
+		extended->shadow_depth = shadow_depth;
+	}
+
+	/* derive the share mode from the top object */
+	if (extended->shadow_depth || entry->needs_copy) {
+		extended->share_mode = SM_COW;
+	} else {
+		if (ref_count == 1) {
+			extended->share_mode = SM_PRIVATE;
+		} else {
+			if (obj->true_share) {
+				extended->share_mode = SM_TRUESHARED;
+			} else {
+				extended->share_mode = SM_SHARED;
+			}
+		}
+	}
+	extended->ref_count = ref_count - extended->shadow_depth;
+
+	/*
+	 * Add up the reference counts of the objects down the shadow
+	 * chain, again locking the next object before unlocking the
+	 * current one.  Whatever object "obj" ends up pointing to is
+	 * unlocked after the loop.
+	 */
+	for (i = 0; i < extended->shadow_depth; i++) {
+		if ((tmp_obj = obj->shadow) == 0) {
+			break;
+		}
+		vm_object_lock(tmp_obj);
+		vm_object_unlock(obj);
+
+		if ((ref_count = tmp_obj->ref_count) > 1 && tmp_obj->paging_in_progress) {
+			ref_count--;
+		}
+
+		extended->ref_count += ref_count;
+		obj = tmp_obj;
+	}
+	vm_object_unlock(obj);
+
+	/*
+	 * For a shared object, count how many of its references come from
+	 * this very map to tell "aliased" mappings apart.
+	 */
+	if (extended->share_mode == SM_SHARED) {
+		vm_map_entry_t       cur;
+		vm_map_entry_t       last;
+		int      my_refs;
+
+		obj = VME_OBJECT(entry);
+		last = vm_map_to_entry(map);
+		my_refs = 0;
+
+		/*
+		 * NOTE(review): the object lock was dropped above, so
+		 * "ref_count" and "paging_in_progress" are read unlocked
+		 * here -- confirm that a stale value is acceptable.
+		 */
+		if ((ref_count = obj->ref_count) > 1 && obj->paging_in_progress) {
+			ref_count--;
+		}
+		for (cur = vm_map_first_entry(map); cur != last; cur = cur->vme_next) {
+			my_refs += vm_map_region_count_obj_refs(cur, obj);
+		}
+
+		if (my_refs == ref_count) {
+			extended->share_mode = SM_PRIVATE_ALIASED;
+		} else if (my_refs > 1) {
+			extended->share_mode = SM_SHARED_ALIASED;
+		}
+	}
+}
+
+
+/*
+ *	vm_map_region_look_for_page:
+ *
+ *	Account for the page at "offset" in "object" by searching "object"
+ *	and then its shadow chain, and update "extended" accordingly:
+ *	  - a resident page bumps "pages_resident" and, depending on its
+ *	    state, "pages_dirtied", "pages_reusable" (only when "count" is
+ *	    at least VM_REGION_EXTENDED_INFO_COUNT) and
+ *	    "pages_shared_now_private";
+ *	  - a page held by the compressor pager bumps "pages_swapped_out";
+ *	  - "external_pager" is set when a non-internal object is met and
+ *	    "shadow_depth" is raised to the deepest level visited.
+ *
+ *	"max_refcnt" is the largest reference count seen so far along the
+ *	chain and "depth" the shadow depth of "object" (0 for the object
+ *	mapped by the entry).
+ *
+ *	"object" is locked on entry and still locked on return.  Shadow
+ *	objects are locked before the object above them is released, and
+ *	every shadow object locked here is unlocked before returning.
+ */
+static void
+vm_map_region_look_for_page(
+	__unused vm_map_t               map,
+	__unused vm_map_offset_t        va,
+	vm_object_t                     object,
+	vm_object_offset_t              offset,
+	int                             max_refcnt,
+	int                             depth,
+	vm_region_extended_info_t       extended,
+	mach_msg_type_number_t count)
+{
+	vm_page_t       p;
+	vm_object_t     shadow;
+	int             ref_count;
+	vm_object_t     caller_object;
+	vm_object_offset_t shadow_offset;
+
+	shadow = object->shadow;
+	caller_object = object;
+
+
+	while (TRUE) {
+		if (!(object->internal)) {
+			extended->external_pager = 1;
+		}
+
+		if ((p = vm_page_lookup(object, offset)) != VM_PAGE_NULL) {
+			/* the page is resident in this object */
+			if (shadow && (max_refcnt == 1)) {
+				extended->pages_shared_now_private++;
+			}
+
+			if (!p->vmp_fictitious &&
+			    (p->vmp_dirty || pmap_is_modified(VM_PAGE_GET_PHYS_PAGE(p)))) {
+				extended->pages_dirtied++;
+			} else if (count >= VM_REGION_EXTENDED_INFO_COUNT) {
+				/* the caller's structure has a "pages_reusable" field */
+				if (p->vmp_reusable || object->all_reusable) {
+					extended->pages_reusable++;
+				}
+			}
+
+			extended->pages_resident++;
+
+			if (object != caller_object) {
+				vm_object_unlock(object);
+			}
+
+			return;
+		}
+		if (object->internal &&
+		    object->alive &&
+		    !object->terminating &&
+		    object->pager_ready) {
+			if (VM_COMPRESSOR_PAGER_STATE_GET(object, offset)
+			    == VM_EXTERNAL_STATE_EXISTS) {
+				/* the pager has that page */
+				extended->pages_swapped_out++;
+				if (object != caller_object) {
+					vm_object_unlock(object);
+				}
+				return;
+			}
+		}
+
+		if (shadow) {
+			/* not found at this level: descend to the shadow object */
+			vm_object_lock(shadow);
+
+			if ((ref_count = shadow->ref_count) > 1 && shadow->paging_in_progress) {
+				ref_count--;
+			}
+
+			if (++depth > extended->shadow_depth) {
+				extended->shadow_depth = depth;
+			}
+
+			if (ref_count > max_refcnt) {
+				max_refcnt = ref_count;
+			}
+
+			/*
+			 * Fetch the shadow offset while "object" is still
+			 * locked, rather than after its lock has been
+			 * released.
+			 */
+			shadow_offset = object->vo_shadow_offset;
+
+			if (object != caller_object) {
+				vm_object_unlock(object);
+			}
+
+			offset = offset + shadow_offset;
+			object = shadow;
+			shadow = object->shadow;
+			continue;
+		}
+		/* end of the shadow chain: the page is not accounted for */
+		if (object != caller_object) {
+			vm_object_unlock(object);
+		}
+		break;
+	}
+}
+
+/*
+ *	vm_map_region_count_obj_refs:
+ *
+ *	Return how many times "object" appears in the shadow chain that
+ *	starts at the VM object mapped by "entry".  Entries without an
+ *	object, and submap entries, count for 0.
+ *
+ *	Each object of the chain is locked while it is examined; the next
+ *	one is locked before the current one is released.
+ */
+static int
+vm_map_region_count_obj_refs(
+	vm_map_entry_t    entry,
+	vm_object_t       object)
+{
+	int             matches;
+	vm_object_t     cur_obj;
+	vm_object_t     next_obj;
+
+	if (VME_OBJECT(entry) == 0 || entry->is_sub_map) {
+		return 0;
+	}
+
+	matches = 0;
+	cur_obj = VME_OBJECT(entry);
+	vm_object_lock(cur_obj);
+
+	do {
+		if (cur_obj == object) {
+			matches++;
+		}
+
+		/* take the next lock before dropping the current one */
+		next_obj = cur_obj->shadow;
+		if (next_obj) {
+			vm_object_lock(next_obj);
+		}
+		vm_object_unlock(cur_obj);
+
+		cur_obj = next_obj;
+	} while (cur_obj);
+
+	return matches;
+}
+
+
+/*
+ *	Routine:	vm_map_simplify
+ *
+ *	Description:
+ *		Attempt to simplify the map representation in
+ *		the vicinity of the given starting address.
+ *	Note:
+ *		This routine is intended primarily to keep the
+ *		kernel maps more compact -- they generally don't
+ *		benefit from the "expand a map entry" technology
+ *		at allocation time because the adjacent entry
+ *		is often wired down.
+ */
+/*
+ *	vm_map_simplify_entry:
+ *
+ *	Merge "this_entry" with the entry that precedes it in "map" when
+ *	the two are adjacent, map consecutive offsets of the same object
+ *	(or submap) and agree on every attribute checked below.  On a
+ *	merge, "this_entry" is extended downwards to cover the previous
+ *	entry, which is unlinked and disposed of along with its object (or
+ *	submap) reference.  Nothing happens otherwise.
+ */
+void
+vm_map_simplify_entry(
+	vm_map_t        map,
+	vm_map_entry_t  this_entry)
+{
+	vm_map_entry_t  pred;
+
+	counter(c_vm_map_simplify_entry_called++);
+
+	pred = this_entry->vme_prev;
+
+	/* neither entry may be the map header */
+	if (this_entry == vm_map_to_entry(map) ||
+	    pred == vm_map_to_entry(map)) {
+		return;
+	}
+
+	/* must be adjacent in the address space */
+	if (pred->vme_end != this_entry->vme_start) {
+		return;
+	}
+
+	/* must map consecutive offsets of the same object or submap */
+	if (pred->is_sub_map != this_entry->is_sub_map ||
+	    VME_OBJECT(pred) != VME_OBJECT(this_entry) ||
+	    (VME_OFFSET(pred) + (pred->vme_end - pred->vme_start))
+	    != VME_OFFSET(this_entry)) {
+		return;
+	}
+
+	/* must have matching attributes */
+	if (pred->behavior != this_entry->behavior ||
+	    pred->needs_copy != this_entry->needs_copy ||
+	    pred->protection != this_entry->protection ||
+	    pred->max_protection != this_entry->max_protection ||
+	    pred->inheritance != this_entry->inheritance ||
+	    pred->use_pmap != this_entry->use_pmap ||
+	    VME_ALIAS(pred) != VME_ALIAS(this_entry) ||
+	    pred->no_cache != this_entry->no_cache ||
+	    pred->permanent != this_entry->permanent ||
+	    pred->map_aligned != this_entry->map_aligned ||
+	    pred->zero_wired_pages != this_entry->zero_wired_pages ||
+	    pred->used_for_jit != this_entry->used_for_jit ||
+	    pred->pmap_cs_associated != this_entry->pmap_cs_associated ||
+	    /* from_reserved_zone: OK if that field doesn't match */
+	    pred->iokit_acct != this_entry->iokit_acct ||
+	    pred->vme_resilient_codesign !=
+	    this_entry->vme_resilient_codesign ||
+	    pred->vme_resilient_media !=
+	    this_entry->vme_resilient_media ||
+	    pred->vme_no_copy_on_read != this_entry->vme_no_copy_on_read) {
+		return;
+	}
+
+	/* must be wired the same number of times */
+	if (pred->wired_count != this_entry->wired_count ||
+	    pred->user_wired_count != this_entry->user_wired_count) {
+		return;
+	}
+
+	/* these flags must be clear on both entries */
+	if (pred->vme_atomic != FALSE || this_entry->vme_atomic != FALSE ||
+	    pred->in_transition != FALSE ||
+	    this_entry->in_transition != FALSE ||
+	    pred->needs_wakeup != FALSE ||
+	    this_entry->needs_wakeup != FALSE ||
+	    pred->is_shared != FALSE ||
+	    this_entry->is_shared != FALSE ||
+	    pred->superpage_size != FALSE ||
+	    this_entry->superpage_size != FALSE) {
+		return;
+	}
+
+	/* take "pred" out of the map and let "this_entry" cover its range */
+	vm_map_store_entry_unlink(map, pred);
+	assert(pred->vme_start < this_entry->vme_end);
+	if (pred->map_aligned) {
+		assert(VM_MAP_PAGE_ALIGNED(pred->vme_start,
+		    VM_MAP_PAGE_MASK(map)));
+	}
+	this_entry->vme_start = pred->vme_start;
+	VME_OFFSET_SET(this_entry, VME_OFFSET(pred));
+
+	if (map->holelistenabled) {
+		vm_map_store_update_first_free(map, this_entry, TRUE);
+	}
+
+	/* drop the reference that "pred" held, then free the entry itself */
+	if (pred->is_sub_map) {
+		vm_map_deallocate(VME_SUBMAP(pred));
+	} else {
+		vm_object_deallocate(VME_OBJECT(pred));
+	}
+	vm_map_entry_dispose(map, pred);
+	SAVE_HINT_MAP_WRITE(map, this_entry);
+	counter(c_vm_map_simplified++);
+}
+
+/*
+ *	vm_map_simplify:
+ *
+ *	Lock "map" and, if "start" is mapped, try to merge the entry that
+ *	contains it with its predecessor and then its successor with the
+ *	result.  The map is unlocked again before returning.
+ */
+void
+vm_map_simplify(
+	vm_map_t        map,
+	vm_map_offset_t start)
+{
+	vm_map_entry_t  hit;
+	boolean_t       mapped;
+
+	vm_map_lock(map);
+
+	mapped = vm_map_lookup_entry(map, start, &hit);
+	if (mapped) {
+		/* merge with the previous entry first ... */
+		vm_map_simplify_entry(map, hit);
+		/* ... then let the following entry merge with the result */
+		vm_map_simplify_entry(map, hit->vme_next);
+	}
+	counter(c_vm_map_simplify_called++);
+
+	vm_map_unlock(map);
+}
+
+/*
+ *	vm_map_simplify_range:
+ *
+ *	Try to merge each map entry that starts within the page-rounded
+ *	range ["start", "end"] (an entry starting exactly at "end" is
+ *	included) with the entry that precedes it.
+ *
+ *	The map should be locked (for "write") by the caller.
+ */
+static void
+vm_map_simplify_range(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end)
+{
+	vm_map_entry_t  cursor;
+
+	if (start >= end) {
+		/* invalid address range */
+		return;
+	}
+
+	/* widen the range to map page boundaries */
+	start = vm_map_trunc_page(start, VM_MAP_PAGE_MASK(map));
+	end = vm_map_round_page(end, VM_MAP_PAGE_MASK(map));
+
+	if (!vm_map_lookup_entry(map, start, &cursor)) {
+		/*
+		 * "start" is not mapped and "cursor" ends before "start":
+		 * begin with the first entry of the map if the lookup
+		 * handed back the map header, with the next entry
+		 * otherwise.
+		 */
+		cursor = (cursor == vm_map_to_entry(map))
+		    ? vm_map_first_entry(map)
+		    : cursor->vme_next;
+	}
+
+	for (;
+	    cursor != vm_map_to_entry(map) && cursor->vme_start <= end;
+	    cursor = cursor->vme_next) {
+		/* try and coalesce "cursor" with its previous entry */
+		vm_map_simplify_entry(map, cursor);
+	}
+}
+
+
+/*
+ *	Routine:	vm_map_machine_attribute
+ *	Purpose:
+ *		Provide machine-specific attributes to mappings,
+ *		such as cachability etc. for machines that provide
+ *		them.  NUMA architectures and machines with big/strange
+ *		caches will use this.
+ *	Note:
+ *		Responsibilities for locking and checking are handled here,
+ *		everything else in the pmap module. If any non-volatile
+ *		information must be kept, the pmap module should handle
+ *		it itself. [This assumes that attributes do not
+ *		need to be inherited, which seems ok to me]
+ *	Parameters:
+ *		map		map whose range [start, end) is operated on;
+ *				it is locked here for the duration of the call.
+ *		start, end	bounds of the range; rejected when they fall
+ *				outside [vm_map_min(map), vm_map_max(map)].
+ *		attribute	attribute to apply.  Anything other than
+ *				MATTR_CACHE is handed to pmap_attribute() for
+ *				the whole range in a single call.
+ *		value		IN/OUT, forwarded as-is to the pmap layer.
+ *	Returns:
+ *		KERN_INVALID_ADDRESS if the range is outside the map bounds.
+ *		KERN_FAILURE if, for MATTR_CACHE, some address in the range
+ *		has no map entry.
+ *		Otherwise the pmap_attribute() result or, for MATTR_CACHE,
+ *		the result of the last pmap_attribute_cache_sync() call made
+ *		at this level (KERN_SUCCESS if none was made).
+ *	NOTE(review):
+ *		"start" > "end" is not rejected here, and the per-page loop
+ *		below counts "range" down by PAGE_SIZE until it is exactly
+ *		zero, so this appears to rely on callers passing an ordered,
+ *		page-aligned range -- confirm against the callers.
+ */
+kern_return_t
+vm_map_machine_attribute(
+	vm_map_t                        map,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_machine_attribute_t  attribute,
+	vm_machine_attribute_val_t* value)              /* IN/OUT */
+{
+	kern_return_t   ret;
+	vm_map_size_t sync_size;
+	vm_map_entry_t entry;
+
+	if (start < vm_map_min(map) || end > vm_map_max(map)) {
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/* Figure how much memory we need to flush (in page increments) */
+	sync_size = end - start;
+
+	vm_map_lock(map);
+
+	if (attribute != MATTR_CACHE) {
+		/* If we don't have to find physical addresses, we */
+		/* don't have to do an explicit traversal here.    */
+		ret = pmap_attribute(map->pmap, start, end - start,
+		    attribute, value);
+		vm_map_unlock(map);
+		return ret;
+	}
+
+	ret = KERN_SUCCESS;                                                                             /* Assume it all worked */
+
+	while (sync_size) {
+		if (vm_map_lookup_entry(map, start, &entry)) {
+			vm_map_size_t   sub_size;       /* portion of the range handled via this entry */
+			if ((entry->vme_end - start) > sync_size) {
+				sub_size = sync_size;
+				sync_size = 0;
+			} else {
+				sub_size = entry->vme_end - start;
+				sync_size -= sub_size;
+			}
+			if (entry->is_sub_map) {
+				vm_map_offset_t sub_start;
+				vm_map_offset_t sub_end;
+
+				sub_start = (start - entry->vme_start)
+				    + VME_OFFSET(entry);
+				sub_end = sub_start + sub_size;
+				vm_map_machine_attribute(
+					VME_SUBMAP(entry),
+					sub_start,
+					sub_end,
+					attribute, value);      /* result of the recursive call is not propagated */
+			} else {
+				if (VME_OBJECT(entry)) {
+					vm_page_t               m;
+					vm_object_t             object;         /* object currently locked and searched */
+					vm_object_t             base_object;    /* the entry's own (top) object */
+					vm_object_t             last_object;
+					vm_object_offset_t      offset;         /* offset within "object" */
+					vm_object_offset_t      base_offset;    /* offset within "base_object" */
+					vm_map_size_t           range;
+					range = sub_size;
+					offset = (start - entry->vme_start)
+					    + VME_OFFSET(entry);
+					base_offset = offset;
+					object = VME_OBJECT(entry);
+					base_object = object;
+					last_object = NULL;
+
+					vm_object_lock(object);
+
+					while (range) {
+						m = vm_page_lookup(
+							object, offset);
+
+						if (m && !m->vmp_fictitious) {
+							ret =
+							    pmap_attribute_cache_sync(
+								VM_PAGE_GET_PHYS_PAGE(m),
+								PAGE_SIZE,
+								attribute, value);      /* replaces any earlier result */
+						} else if (object->shadow) {    /* no usable page here: look one level down */
+							offset = offset + object->vo_shadow_offset;
+							last_object = object;
+							object = object->shadow;
+							vm_object_lock(last_object->shadow);    /* lock the shadow before releasing its parent */
+							vm_object_unlock(last_object);
+							continue;
+						}
+						range -= PAGE_SIZE;
+
+						if (base_object != object) {    /* we descended: return to the top object */
+							vm_object_unlock(object);
+							vm_object_lock(base_object);
+							object = base_object;
+						}
+						/* Bump to the next page */
+						base_offset += PAGE_SIZE;
+						offset = base_offset;
+					}
+					vm_object_unlock(object);
+				}
+			}
+			start += sub_size;
+		} else {        /* nothing is mapped at "start" */
+			vm_map_unlock(map);
+			return KERN_FAILURE;
+		}
+	}
+
+	vm_map_unlock(map);
+
+	return ret;
+}
+
+/*
+ *	vm_map_behavior_set:
+ *
+ *	Sets the paging reference behavior of the specified address
+ *	range in the target map.  Paging reference behavior affects
+ *	how pagein operations resulting from faults on the map will be
+ *	clustered.
+ *
+ *	Returns KERN_NO_SPACE if "start" > "end" or the range is not
+ *	within [vm_map_min(map), vm_map_max(map)], KERN_INVALID_ARGUMENT
+ *	for an unrecognized "new_behavior", KERN_INVALID_ADDRESS if a
+ *	persistent behavior is requested on a range that fails
+ *	vm_map_range_check(), and otherwise KERN_SUCCESS or whatever the
+ *	helper implementing an immediate-action behavior returns.
+ */
+kern_return_t
+vm_map_behavior_set(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end,
+	vm_behavior_t   new_behavior)
+{
+	vm_map_entry_t  entry;
+	vm_map_entry_t  temp_entry;
+
+	if (start > end ||
+	    start < vm_map_min(map) ||
+	    end > vm_map_max(map)) {
+		return KERN_NO_SPACE;
+	}
+
+	switch (new_behavior) {
+	/*
+	 * This first block of behaviors all set a persistent state on the specified
+	 * memory range.  All we have to do here is to record the desired behavior
+	 * in the vm_map_entry_t's.
+	 *
+	 * VM_BEHAVIOR_ZERO_WIRED_PAGES is recorded in the entry's
+	 * "zero_wired_pages" flag and leaves "behavior" untouched; all the
+	 * others overwrite "behavior".
+	 */
+
+	case VM_BEHAVIOR_DEFAULT:
+	case VM_BEHAVIOR_RANDOM:
+	case VM_BEHAVIOR_SEQUENTIAL:
+	case VM_BEHAVIOR_RSEQNTL:
+	case VM_BEHAVIOR_ZERO_WIRED_PAGES:
+		vm_map_lock(map);
+
+		/*
+		 *	The entire address range must be valid for the map.
+		 *      Note that vm_map_range_check() does a
+		 *	vm_map_lookup_entry() internally and returns the
+		 *	entry containing the start of the address range if
+		 *	the entire range is valid.
+		 */
+		if (vm_map_range_check(map, start, end, &temp_entry)) {
+			entry = temp_entry;
+			vm_map_clip_start(map, entry, start);
+		} else {
+			vm_map_unlock(map);
+			return KERN_INVALID_ADDRESS;
+		}
+
+		while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
+			vm_map_clip_end(map, entry, end);
+			if (entry->is_sub_map) {
+				assert(!entry->use_pmap);
+			}
+
+			if (new_behavior == VM_BEHAVIOR_ZERO_WIRED_PAGES) {
+				entry->zero_wired_pages = TRUE; /* nothing in this routine clears it again */
+			} else {
+				entry->behavior = new_behavior;
+			}
+			entry = entry->vme_next;
+		}
+
+		vm_map_unlock(map);
+		break;          /* falls out to the KERN_SUCCESS return below */
+
+	/*
+	 * The rest of these are different from the above in that they cause
+	 * an immediate action to take place as opposed to setting a behavior that
+	 * affects future actions.
+	 *
+	 * Each one is delegated to a helper that is called with the map
+	 * unlocked; the helper's return value is returned unchanged.
+	 */
+
+	case VM_BEHAVIOR_WILLNEED:
+		return vm_map_willneed(map, start, end);
+
+	case VM_BEHAVIOR_DONTNEED:
+		return vm_map_msync(map, start, end - start, VM_SYNC_DEACTIVATE | VM_SYNC_CONTIGUOUS);
+
+	case VM_BEHAVIOR_FREE:
+		return vm_map_msync(map, start, end - start, VM_SYNC_KILLPAGES | VM_SYNC_CONTIGUOUS);
+
+	case VM_BEHAVIOR_REUSABLE:
+		return vm_map_reusable_pages(map, start, end);
+
+	case VM_BEHAVIOR_REUSE:
+		return vm_map_reuse_pages(map, start, end);
+
+	case VM_BEHAVIOR_CAN_REUSE:
+		return vm_map_can_reuse(map, start, end);
+
+#if MACH_ASSERT
+	case VM_BEHAVIOR_PAGEOUT:
+		return vm_map_pageout(map, start, end);
+#endif /* MACH_ASSERT */
+
+	default:
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	return KERN_SUCCESS;
+}
+
+
+/*
+ * Internals for madvise(MADV_WILLNEED) system call.
+ *
+ * The implementation is to do:-
+ * a) read-ahead if the mapping corresponds to a mapped regular file
+ * b) or, fault in the pages (zero-fill, decompress etc) if it's an anonymous mapping
+ *
+ * Entries that are submaps or that lack read permission are skipped.
+ *
+ * The map read lock is dropped while an entry is being processed and the
+ * entry covering the next address is looked up again afterwards, so a hole
+ * that appears in the meantime is detected.
+ *
+ * Returns:
+ *	KERN_INVALID_ADDRESS	the range has a hole, either on entry or when
+ *				looking up the next entry after the lock was
+ *				dropped.
+ *	KERN_SUCCESS		otherwise, including when the pager request
+ *				fails (the advice is then simply abandoned).
+ */
+static kern_return_t
+vm_map_willneed(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end
+	)
+{
+	vm_map_entry_t                  entry;
+	vm_object_t                     object;
+	memory_object_t                 pager;
+	struct vm_object_fault_info     fault_info = {};
+	kern_return_t                   kr;
+	vm_object_size_t                len;
+	vm_object_offset_t              offset;
+
+	fault_info.interruptible = THREAD_UNINT;        /* ignored value */
+	fault_info.behavior      = VM_BEHAVIOR_SEQUENTIAL;
+	fault_info.stealth       = TRUE;
+
+	/*
+	 * The MADV_WILLNEED operation doesn't require any changes to the
+	 * vm_map_entry_t's, so the read lock is sufficient.
+	 */
+
+	vm_map_lock_read(map);
+
+	/*
+	 * The madvise semantics require that the address range be fully
+	 * allocated with no holes.  Otherwise, we're required to return
+	 * an error.
+	 */
+
+	if (!vm_map_range_check(map, start, end, &entry)) {
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/*
+	 * Examine each vm_map_entry_t in the range.
+	 */
+	for (; entry != vm_map_to_entry(map) && start < end;) {
+		/*
+		 * The first time through, the start address could be anywhere
+		 * within the vm_map_entry we found.  So adjust the offset to
+		 * correspond.  After that, the offset will always be zero to
+		 * correspond to the beginning of the current vm_map_entry.
+		 */
+		offset = (start - entry->vme_start) + VME_OFFSET(entry);
+
+		/*
+		 * Set the length so we don't go beyond the end of the
+		 * map_entry or beyond the end of the range we were given.
+		 * This range could span also multiple map entries all of which
+		 * map different files, so make sure we only do the right amount
+		 * of I/O for each object.  Note that it's possible for there
+		 * to be multiple map entries all referring to the same object
+		 * but with different page permissions, but it's not worth
+		 * trying to optimize that case.
+		 */
+		len = MIN(entry->vme_end - start, end - start);
+
+		if ((vm_size_t) len != len) {
+			/* 32-bit overflow */
+			len = (vm_size_t) (0 - PAGE_SIZE);
+		}
+		fault_info.cluster_size = (vm_size_t) len;
+		fault_info.lo_offset    = offset;
+		fault_info.hi_offset    = offset + len;
+		fault_info.user_tag     = VME_ALIAS(entry);
+		fault_info.pmap_options = 0;
+		if (entry->iokit_acct ||
+		    (!entry->is_sub_map && !entry->use_pmap)) {
+			fault_info.pmap_options |= PMAP_OPTIONS_ALT_ACCT;
+		}
+
+		/*
+		 * If the entry is a submap OR there's no read permission
+		 * to this mapping, then just skip it.
+		 */
+		if ((entry->is_sub_map) || (entry->protection & VM_PROT_READ) == 0) {
+			entry = entry->vme_next;
+			start = entry->vme_start;
+			continue;
+		}
+
+		object = VME_OBJECT(entry);
+
+		if (object == NULL || object->internal) {
+			/*
+			 * Memory range backed by anonymous memory.
+			 */
+			vm_size_t region_size = 0, effective_page_size = 0;
+			vm_map_offset_t addr = 0, effective_page_mask = 0;
+
+			region_size = len;
+			addr = start;
+
+			effective_page_mask = MAX(vm_map_page_mask(current_map()), PAGE_MASK);
+			effective_page_size = effective_page_mask + 1;
+
+			vm_map_unlock_read(map);
+
+			while (region_size) {
+				vm_pre_fault(
+					vm_map_trunc_page(addr, effective_page_mask),
+					VM_PROT_READ | VM_PROT_WRITE);
+
+				/*
+				 * "region_size" is unsigned and need not be a
+				 * multiple of "effective_page_size": stop on
+				 * the last (possibly partial) page instead of
+				 * letting the subtraction wrap around, which
+				 * would keep this loop pre-faulting far
+				 * beyond the requested range.
+				 */
+				if (region_size <= effective_page_size) {
+					break;
+				}
+				region_size -= effective_page_size;
+				addr += effective_page_size;
+			}
+		} else {
+			/*
+			 * Find the file object backing this map entry.  If there is
+			 * none, then we simply ignore the "will need" advice for this
+			 * entry and go on to the next one.
+			 */
+			if ((object = find_vnode_object(entry)) == VM_OBJECT_NULL) {
+				entry = entry->vme_next;
+				start = entry->vme_start;
+				continue;
+			}
+
+			vm_object_paging_begin(object);
+			pager = object->pager;
+			vm_object_unlock(object);
+
+			/*
+			 * The data_request() could take a long time, so let's
+			 * release the map lock to avoid blocking other threads.
+			 */
+			vm_map_unlock_read(map);
+
+			/*
+			 * Get the data from the object asynchronously.
+			 *
+			 * Note that memory_object_data_request() places limits on the
+			 * amount of I/O it will do.  Regardless of the len we
+			 * specified, it won't do more than MAX_UPL_TRANSFER_BYTES and it
+			 * silently truncates the len to that size.  This isn't
+			 * necessarily bad since madvise shouldn't really be used to
+			 * page in unlimited amounts of data.  Other Unix variants
+			 * limit the willneed case as well.  If this turns out to be an
+			 * issue for developers, then we can always adjust the policy
+			 * here and still be backwards compatible since this is all
+			 * just "advice".
+			 */
+			kr = memory_object_data_request(
+				pager,
+				offset + object->paging_offset,
+				0,      /* ignored */
+				VM_PROT_READ,
+				(memory_object_fault_info_t)&fault_info);
+
+			vm_object_lock(object);
+			vm_object_paging_end(object);
+			vm_object_unlock(object);
+
+			/*
+			 * If we couldn't do the I/O for some reason, just give up on
+			 * the madvise.  We still return success to the user since
+			 * madvise isn't supposed to fail when the advice can't be
+			 * taken.
+			 */
+
+			if (kr != KERN_SUCCESS) {
+				/* the map lock was already dropped above */
+				return KERN_SUCCESS;
+			}
+		}
+
+		/* both branches above leave the map unlocked */
+		start += len;
+		if (start >= end) {
+			/* done */
+			return KERN_SUCCESS;
+		}
+
+		/* look up next entry */
+		vm_map_lock_read(map);
+		if (!vm_map_lookup_entry(map, start, &entry)) {
+			/*
+			 * There's a new hole in the address range.
+			 */
+			vm_map_unlock_read(map);
+			return KERN_INVALID_ADDRESS;
+		}
+	}
+
+	vm_map_unlock_read(map);
+	return KERN_SUCCESS;
+}
+
+/*
+ *	vm_map_entry_is_reusable:
+ *
+ *	Tells whether a map entry is acceptable for the "reuse" family of
+ *	behaviors.
+ *
+ *	Submap entries never are.  Entries whose alias is not one of the
+ *	malloc() tags are always accepted (the caller decides).  Entries
+ *	tagged as malloc() memory are accepted only if the entry, and its
+ *	VM object when it has one, pass the attribute checks below.
+ */
+static boolean_t
+vm_map_entry_is_reusable(
+	vm_map_entry_t entry)
+{
+	/* Only user map entries */
+
+	vm_object_t backing;
+
+	if (entry->is_sub_map) {
+		return FALSE;
+	}
+
+	switch (VME_ALIAS(entry)) {
+	case VM_MEMORY_MALLOC:
+	case VM_MEMORY_MALLOC_SMALL:
+	case VM_MEMORY_MALLOC_LARGE:
+	case VM_MEMORY_REALLOC:
+	case VM_MEMORY_MALLOC_TINY:
+	case VM_MEMORY_MALLOC_LARGE_REUSABLE:
+	case VM_MEMORY_MALLOC_LARGE_REUSED:
+		/*
+		 * malloc() memory: go on and verify that the region is
+		 * still in its original state and can be re-used for more
+		 * malloc() allocations.
+		 */
+		break;
+	default:
+		/*
+		 * Anything else: it is up to the caller to decide whether
+		 * the region is re-usable.
+		 */
+		return TRUE;
+	}
+
+	/*
+	 * Entry-level attributes.  "is_shared" is not part of the test and
+	 * "is_sub_map" has already been ruled out above.
+	 */
+	if (entry->in_transition ||
+	    entry->protection != VM_PROT_DEFAULT ||
+	    entry->max_protection != VM_PROT_ALL ||
+	    entry->inheritance != VM_INHERIT_DEFAULT) {
+		return FALSE;
+	}
+	if (entry->no_cache ||
+	    entry->permanent ||
+	    entry->superpage_size != FALSE ||
+	    entry->zero_wired_pages) {
+		return FALSE;
+	}
+	if (entry->wired_count != 0 ||
+	    entry->user_wired_count != 0) {
+		return FALSE;
+	}
+
+	backing = VME_OBJECT(entry);
+	if (backing == VM_OBJECT_NULL) {
+		/* no VM object yet: nothing more to check */
+		return TRUE;
+	}
+
+	/*
+	 * Object-level attributes.
+	 *
+	 * The object's reference count is intentionally not examined:
+	 * we proceed even if the VM object is potentially shared.
+	 * That is checked later, when processing the actual VM pages, so
+	 * the contents will be safe if shared.  Meanwhile the memory
+	 * region can still be marked as "reusable" to acknowledge that
+	 * the caller did let us know that the memory could be re-used
+	 * and should not be penalized for holding on to it.  This allows
+	 * its "resident size" to not include the reusable range.
+	 */
+	if (backing->wired_page_count != 0 ||
+	    backing->copy != VM_OBJECT_NULL ||
+	    backing->shadow != VM_OBJECT_NULL ||
+	    !backing->internal ||
+	    backing->purgable != VM_PURGABLE_DENY ||
+	    backing->copy_strategy == MEMORY_OBJECT_COPY_DELAY ||
+	    backing->true_share ||
+	    backing->wimg_bits != VM_WIMG_USE_DEFAULT ||
+	    backing->code_signed) {
+		return FALSE;
+	}
+	return TRUE;
+}
+
+/*
+ *	vm_map_reuse_pages:
+ *
+ *	Backs VM_BEHAVIOR_REUSE.  Every entry overlapping [start, end) must
+ *	pass vm_map_entry_is_reusable(); for each one that has a VM object,
+ *	vm_object_reuse_pages() is called on the matching object range.
+ *	Entries tagged VM_MEMORY_MALLOC_LARGE_REUSABLE are re-tagged
+ *	VM_MEMORY_MALLOC_LARGE_REUSED.
+ *
+ *	Returns KERN_INVALID_ADDRESS if the range has a hole or contains an
+ *	entry that is not reusable (entries processed before the offending
+ *	one are not undone), KERN_SUCCESS otherwise.  The matching
+ *	vm_page_stats_reusable counter is bumped either way.
+ */
+static kern_return_t
+vm_map_reuse_pages(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end)
+{
+	vm_map_entry_t                  cur;
+	vm_object_t                     obj;
+	vm_object_offset_t              first_off, last_off;
+
+	/*
+	 * No vm_map_entry_t needs to be changed for MADV_REUSE, so the
+	 * map is only locked for reading.
+	 */
+	vm_map_lock_read(map);
+	assert(map->pmap != kernel_pmap);       /* protect alias access */
+
+	/*
+	 * madvise semantics: the whole address range must be allocated,
+	 * without holes, or the call fails.
+	 */
+	if (!vm_map_range_check(map, start, end, &cur)) {
+		goto bad_range;
+	}
+
+	/*
+	 * Walk the entries of the range.
+	 */
+	while (cur != vm_map_to_entry(map) && cur->vme_start < end) {
+		/*
+		 * Sanity check on the VM map entry.
+		 */
+		if (!vm_map_entry_is_reusable(cur)) {
+			goto bad_range;
+		}
+
+		/*
+		 * Object range covered by this entry.  Only the first
+		 * entry can begin before "start", in which case the
+		 * range starts part-way into the entry.
+		 */
+		first_off = VME_OFFSET(cur);
+		if (cur->vme_start < start) {
+			first_off += start - cur->vme_start;
+		}
+		last_off = VME_OFFSET(cur) +
+		    (MIN(end, cur->vme_end) - cur->vme_start);
+
+		assert(!cur->is_sub_map);
+		obj = VME_OBJECT(cur);
+		if (obj != VM_OBJECT_NULL) {
+			vm_object_lock(obj);
+			vm_object_reuse_pages(obj, first_off, last_off,
+			    TRUE);
+			vm_object_unlock(obj);
+		}
+
+		if (VME_ALIAS(cur) == VM_MEMORY_MALLOC_LARGE_REUSABLE) {
+			/*
+			 * XXX
+			 * We do not hold the VM map exclusively here.
+			 * The "alias" field is not that critical, so it's
+			 * safe to update it here, as long as it is the only
+			 * one that can be modified while holding the VM map
+			 * "shared".
+			 */
+			VME_ALIAS_SET(cur, VM_MEMORY_MALLOC_LARGE_REUSED);
+		}
+
+		cur = cur->vme_next;
+	}
+
+	vm_map_unlock_read(map);
+	vm_page_stats_reusable.reuse_pages_success++;
+	return KERN_SUCCESS;
+
+bad_range:
+	vm_map_unlock_read(map);
+	vm_page_stats_reusable.reuse_pages_failure++;
+	return KERN_INVALID_ADDRESS;
+}
+
+
+static kern_return_t
+vm_map_reusable_pages(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end)
+{
+	vm_map_entry_t                  entry;
+	vm_object_t                     object;
+	vm_object_offset_t              start_offset, end_offset;       /* object range covered by the current entry */
+	vm_map_offset_t                 pmap_offset;                    /* map address matching start_offset */
+
+	/*
+	 * Backs VM_BEHAVIOR_REUSABLE: for every entry overlapping
+	 * [start, end), hands the matching object range to
+	 * vm_object_deactivate_pages() with "reusable_pages" set, provided
+	 * the object passes the eligibility test further down.
+	 *
+	 * Returns KERN_INVALID_ADDRESS if the range has a hole or contains
+	 * an entry rejected by vm_map_entry_is_reusable(),
+	 * KERN_PROTECTION_FAILURE if an entry is neither writable nor
+	 * "used_for_jit", KERN_SUCCESS otherwise.  Entries processed before
+	 * a failing one are not undone.
+	 *
+	 * The MADV_REUSABLE operation doesn't require any changes to the
+	 * vm_map_entry_t's, so the read lock is sufficient.
+	 */
+
+	vm_map_lock_read(map);
+	assert(map->pmap != kernel_pmap);       /* protect alias access */
+
+	/*
+	 * The madvise semantics require that the address range be fully
+	 * allocated with no holes.  Otherwise, we're required to return
+	 * an error.
+	 */
+
+	if (!vm_map_range_check(map, start, end, &entry)) {
+		vm_map_unlock_read(map);
+		vm_page_stats_reusable.reusable_pages_failure++;
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/*
+	 * Examine each vm_map_entry_t in the range.
+	 */
+	for (; entry != vm_map_to_entry(map) && entry->vme_start < end;
+	    entry = entry->vme_next) {
+		int kill_pages = 0;     /* becomes 1 (eligible) or -1 (leave the pages alone) below */
+
+		/*
+		 * Sanity check on the VM map entry.
+		 */
+		if (!vm_map_entry_is_reusable(entry)) {
+			vm_map_unlock_read(map);
+			vm_page_stats_reusable.reusable_pages_failure++;
+			return KERN_INVALID_ADDRESS;
+		}
+
+		if (!(entry->protection & VM_PROT_WRITE) && !entry->used_for_jit) {
+			/* not writable: can't discard contents */
+			vm_map_unlock_read(map);
+			vm_page_stats_reusable.reusable_nonwritable++;
+			vm_page_stats_reusable.reusable_pages_failure++;
+			return KERN_PROTECTION_FAILURE;
+		}
+
+		/*
+		 * The first time through, the start address could be anywhere
+		 * within the vm_map_entry we found.  So adjust the offset to
+		 * correspond.
+		 */
+		if (entry->vme_start < start) {
+			start_offset = start - entry->vme_start;
+			pmap_offset = start;
+		} else {
+			start_offset = 0;
+			pmap_offset = entry->vme_start;
+		}
+		end_offset = MIN(end, entry->vme_end) - entry->vme_start;
+		start_offset += VME_OFFSET(entry);
+		end_offset += VME_OFFSET(entry);
+
+		assert(!entry->is_sub_map);
+		object = VME_OBJECT(entry);
+		if (object == VM_OBJECT_NULL) {
+			continue;       /* nothing to deactivate; the alias is left unchanged too */
+		}
+
+
+		vm_object_lock(object);
+		if (((object->ref_count == 1) ||
+		    (object->copy_strategy != MEMORY_OBJECT_COPY_SYMMETRIC &&
+		    object->copy == VM_OBJECT_NULL)) &&
+		    object->shadow == VM_OBJECT_NULL &&
+		    /*
+		     * "iokit_acct" entries are billed for their virtual size
+		     * (rather than for their resident pages only), so they
+		     * wouldn't benefit from making pages reusable, and it
+		     * would be hard to keep track of pages that are both
+		     * "iokit_acct" and "reusable" in the pmap stats and
+		     * ledgers.
+		     * The same exclusion applies to non-submap entries that
+		     * do not have "use_pmap" set.
+		     */
+		    !(entry->iokit_acct ||
+		    (!entry->is_sub_map && !entry->use_pmap))) {
+			if (object->ref_count != 1) {
+				vm_page_stats_reusable.reusable_shared++;
+			}
+			kill_pages = 1;
+		} else {
+			kill_pages = -1;
+		}
+		if (kill_pages != -1) {
+			vm_object_deactivate_pages(object,
+			    start_offset,
+			    end_offset - start_offset,
+			    kill_pages,
+			    TRUE /*reusable_pages*/,
+			    map->pmap,
+			    pmap_offset);
+		} else {
+			vm_page_stats_reusable.reusable_pages_shared++; /* only counted; the pages are left as they are */
+		}
+		vm_object_unlock(object);
+
+		if (VME_ALIAS(entry) == VM_MEMORY_MALLOC_LARGE ||
+		    VME_ALIAS(entry) == VM_MEMORY_MALLOC_LARGE_REUSED) {
+			/*
+			 * XXX
+			 * We do not hold the VM map exclusively here.
+			 * The "alias" field is not that critical, so it's
+			 * safe to update it here, as long as it is the only
+			 * one that can be modified while holding the VM map
+			 * "shared".
+			 */
+			VME_ALIAS_SET(entry, VM_MEMORY_MALLOC_LARGE_REUSABLE);
+		}
+	}
+
+	vm_map_unlock_read(map);
+	vm_page_stats_reusable.reusable_pages_success++;
+	return KERN_SUCCESS;
+}
+
+
+/*
+ *	vm_map_can_reuse:
+ *
+ *	Backs VM_BEHAVIOR_CAN_REUSE.  Pure query: reports whether the whole
+ *	range [start, end) is mapped without holes and made only of entries
+ *	accepted by vm_map_entry_is_reusable().  Nothing is changed besides
+ *	the vm_page_stats_reusable success/failure counters.
+ *
+ *	Returns KERN_SUCCESS if so, KERN_INVALID_ADDRESS otherwise.
+ */
+static kern_return_t
+vm_map_can_reuse(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end)
+{
+	vm_map_entry_t                  cur;
+	kern_return_t                   verdict;
+
+	/*
+	 * The entries are only inspected, never modified, so the map is
+	 * only locked for reading.
+	 */
+	vm_map_lock_read(map);
+	assert(map->pmap != kernel_pmap);       /* protect alias access */
+
+	/*
+	 * madvise semantics: the whole address range must be allocated,
+	 * without holes, or the call fails.
+	 */
+	verdict = KERN_INVALID_ADDRESS;
+	if (vm_map_range_check(map, start, end, &cur)) {
+		verdict = KERN_SUCCESS;
+
+		/*
+		 * Walk the entries of the range; stop at the first one
+		 * that fails the sanity check.
+		 */
+		while (cur != vm_map_to_entry(map) && cur->vme_start < end) {
+			if (!vm_map_entry_is_reusable(cur)) {
+				verdict = KERN_INVALID_ADDRESS;
+				break;
+			}
+			cur = cur->vme_next;
+		}
+	}
+
+	vm_map_unlock_read(map);
+	if (verdict == KERN_SUCCESS) {
+		vm_page_stats_reusable.can_reuse_success++;
+	} else {
+		vm_page_stats_reusable.can_reuse_failure++;
+	}
+	return verdict;
+}
+
+
+#if MACH_ASSERT
+static kern_return_t
+vm_map_pageout(
+	vm_map_t        map,
+	vm_map_offset_t start,
+	vm_map_offset_t end)
+{
+	vm_map_entry_t                  entry;
+
+	/*
+	 * Backs VM_BEHAVIOR_PAGEOUT (only compiled when MACH_ASSERT is
+	 * set): calls vm_object_pageout() on the internal VM object of
+	 * each entry overlapping [start, end).  The call is made on the
+	 * whole object, not just on the part mapped by the range.
+	 *
+	 * Returns KERN_INVALID_ADDRESS if the range, or the range a submap
+	 * entry maps within its submap, fails vm_map_range_check();
+	 * KERN_SUCCESS otherwise.
+	 *
+	 * The MADV_PAGEOUT operation doesn't require any changes to the
+	 * vm_map_entry_t's, so the read lock is sufficient.
+	 */
+
+	vm_map_lock_read(map);
+
+	/*
+	 * The madvise semantics require that the address range be fully
+	 * allocated with no holes.  Otherwise, we're required to return
+	 * an error.
+	 */
+
+	if (!vm_map_range_check(map, start, end, &entry)) {
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ADDRESS;
+	}
+
+	/*
+	 * Examine each vm_map_entry_t in the range.
+	 */
+	for (; entry != vm_map_to_entry(map) && entry->vme_start < end;
+	    entry = entry->vme_next) {
+		vm_object_t     object;
+
+		/*
+		 * Submap entry: look one level down, in the submap, at the
+		 * range this entry maps.  The submap is read-locked while
+		 * the parent map's read lock is still held.
+		 */
+		if (entry->is_sub_map) {
+			vm_map_t submap;
+			vm_map_offset_t submap_start;
+			vm_map_offset_t submap_end;
+			vm_map_entry_t submap_entry;
+
+			submap = VME_SUBMAP(entry);
+			submap_start = VME_OFFSET(entry);
+			submap_end = submap_start + (entry->vme_end -
+			    entry->vme_start);
+
+			vm_map_lock_read(submap);
+
+			if (!vm_map_range_check(submap,
+			    submap_start,
+			    submap_end,
+			    &submap_entry)) {
+				vm_map_unlock_read(submap);
+				vm_map_unlock_read(map);
+				return KERN_INVALID_ADDRESS;
+			}
+
+			object = VME_OBJECT(submap_entry);      /* only this one submap entry is examined; the rest of the submap range is not walked */
+			if (submap_entry->is_sub_map ||
+			    object == VM_OBJECT_NULL ||
+			    !object->internal) {
+				vm_map_unlock_read(submap);
+				continue;
+			}
+
+			vm_object_pageout(object);
+
+			vm_map_unlock_read(submap);
+			submap = VM_MAP_NULL;
+			submap_entry = VM_MAP_ENTRY_NULL;
+			continue;
+		}
+
+		object = VME_OBJECT(entry);
+		if (entry->is_sub_map ||        /* cannot be true here: submaps were handled above */
+		    object == VM_OBJECT_NULL ||
+		    !object->internal) {
+			continue;
+		}
+
+		vm_object_pageout(object);
+	}
+
+	vm_map_unlock_read(map);
+	return KERN_SUCCESS;
+}
+#endif /* MACH_ASSERT */
+
+
+/*
+ *	Routine:	vm_map_entry_insert
+ *
+ *	Description:	This routine inserts a new vm_entry in a locked map.
+ *
+ *	The map must be locked exclusively (asserted).  A new entry is
+ *	created, every one of its attributes is filled in from the
+ *	arguments or set to a fixed default, it is linked into the map
+ *	after "insp_entry", "map->size" grows by "end - start" and the
+ *	map's lookup hint is pointed at the new entry.
+ *
+ *	"start" and "end" must be page aligned and "start" < "end"
+ *	(asserted).  "clear_map_aligned" drops the entry's "map_aligned"
+ *	attribute when "start" or "end" is not aligned to the map's own
+ *	page size.  "superpage_size" is only recorded as a boolean.
+ *	"user_wired_count" always starts at 0.
+ *
+ *	"used_for_jit": on CONFIG_EMBEDDED the request is honored only if
+ *	the map has no JIT entry yet; otherwise the new entry is created
+ *	as a regular (non-JIT) entry.
+ *
+ *	Returns the new entry.
+ */
+vm_map_entry_t
+vm_map_entry_insert(
+	vm_map_t                map,
+	vm_map_entry_t          insp_entry,
+	vm_map_offset_t         start,
+	vm_map_offset_t         end,
+	vm_object_t             object,
+	vm_object_offset_t      offset,
+	boolean_t               needs_copy,
+	boolean_t               is_shared,
+	boolean_t               in_transition,
+	vm_prot_t               cur_protection,
+	vm_prot_t               max_protection,
+	vm_behavior_t           behavior,
+	vm_inherit_t            inheritance,
+	unsigned                wired_count,
+	boolean_t               no_cache,
+	boolean_t               permanent,
+	boolean_t               no_copy_on_read,
+	unsigned int            superpage_size,
+	boolean_t               clear_map_aligned,
+	boolean_t               is_submap,
+	boolean_t               used_for_jit,
+	int                     alias)
+{
+	vm_map_entry_t  new_entry;
+
+	assert(insp_entry != (vm_map_entry_t)0);
+	vm_map_lock_assert_exclusive(map);
+
+#if DEVELOPMENT || DEBUG
+	vm_object_offset_t      end_offset = 0;
+	assertf(!os_add_overflow(end - start, offset, &end_offset), "size 0x%llx, offset 0x%llx caused overflow", (uint64_t)(end - start), offset);
+#endif /* DEVELOPMENT || DEBUG */
+
+	new_entry = vm_map_entry_create(map, !map->hdr.entries_pageable);
+
+	/*
+	 * Entries are "map aligned" when the map's page size differs from
+	 * the kernel's, unless the caller asked to clear that attribute
+	 * for a range that is not aligned to the map's page size.
+	 */
+	if (VM_MAP_PAGE_SHIFT(map) != PAGE_SHIFT) {
+		new_entry->map_aligned = TRUE;
+	} else {
+		new_entry->map_aligned = FALSE;
+	}
+	if (clear_map_aligned &&
+	    (!VM_MAP_PAGE_ALIGNED(start, VM_MAP_PAGE_MASK(map)) ||
+	    !VM_MAP_PAGE_ALIGNED(end, VM_MAP_PAGE_MASK(map)))) {
+		new_entry->map_aligned = FALSE;
+	}
+
+	new_entry->vme_start = start;
+	new_entry->vme_end = end;
+	assert(page_aligned(new_entry->vme_start));
+	assert(page_aligned(new_entry->vme_end));
+	if (new_entry->map_aligned) {
+		assert(VM_MAP_PAGE_ALIGNED(new_entry->vme_start,
+		    VM_MAP_PAGE_MASK(map)));
+		assert(VM_MAP_PAGE_ALIGNED(new_entry->vme_end,
+		    VM_MAP_PAGE_MASK(map)));
+	}
+	assert(new_entry->vme_start < new_entry->vme_end);
+
+	VME_OBJECT_SET(new_entry, object);
+	VME_OFFSET_SET(new_entry, offset);
+	new_entry->is_shared = is_shared;
+	new_entry->is_sub_map = is_submap;
+	new_entry->needs_copy = needs_copy;
+	new_entry->in_transition = in_transition;
+	new_entry->needs_wakeup = FALSE;
+	new_entry->inheritance = inheritance;
+	new_entry->protection = cur_protection;
+	new_entry->max_protection = max_protection;
+	new_entry->behavior = behavior;
+	new_entry->wired_count = wired_count;
+	new_entry->user_wired_count = 0;
+	if (is_submap) {
+		/*
+		 * submap: "use_pmap" means "nested".
+		 * default: false.
+		 */
+		new_entry->use_pmap = FALSE;
+	} else {
+		/*
+		 * object: "use_pmap" means "use pmap accounting" for footprint.
+		 * default: true.
+		 */
+		new_entry->use_pmap = TRUE;
+	}
+	VME_ALIAS_SET(new_entry, alias);
+	new_entry->zero_wired_pages = FALSE;
+	new_entry->no_cache = no_cache;
+	new_entry->permanent = permanent;
+	if (superpage_size) {
+		new_entry->superpage_size = TRUE;
+	} else {
+		new_entry->superpage_size = FALSE;
+	}
+
+	/*
+	 * Start from "not JIT" so that the field is written on every
+	 * path, including the CONFIG_EMBEDDED case where a JIT entry was
+	 * requested but the map already has one.  Like every other field
+	 * here, this does not count on vm_map_entry_create() having
+	 * cleared the entry.
+	 */
+	new_entry->used_for_jit = FALSE;
+	if (used_for_jit) {
+#if CONFIG_EMBEDDED
+		if (!(map->jit_entry_exists))
+#endif /* CONFIG_EMBEDDED */
+		{
+			new_entry->used_for_jit = TRUE;
+			map->jit_entry_exists = TRUE;
+		}
+	}
+	new_entry->pmap_cs_associated = FALSE;
+	new_entry->iokit_acct = FALSE;
+	new_entry->vme_resilient_codesign = FALSE;
+	new_entry->vme_resilient_media = FALSE;
+	new_entry->vme_atomic = FALSE;
+	new_entry->vme_no_copy_on_read = no_copy_on_read;
+
+	/*
+	 *	Insert the new entry into the list.
+	 */
+
+	vm_map_store_entry_link(map, insp_entry, new_entry,
+	    VM_MAP_KERNEL_FLAGS_NONE);
+	map->size += end - start;
+
+	/*
+	 *	Update the free space hint and the lookup hint.
+	 */
+
+	SAVE_HINT_MAP_WRITE(map, new_entry);
+	return new_entry;
+}
+
+/*
+ *	Routine:	vm_map_remap_extract
+ *
+ *	Description:	This routine returns a vm_entry list from a map.
+ */
+static kern_return_t
+vm_map_remap_extract(
+	vm_map_t                map,
+	vm_map_offset_t         addr,
+	vm_map_size_t           size,
+	boolean_t               copy,
+	struct vm_map_header    *map_header,
+	vm_prot_t               *cur_protection,
+	vm_prot_t               *max_protection,
+	/* What, no behavior? */
+	vm_inherit_t            inheritance,
+	boolean_t               pageable,
+	boolean_t               same_map,
+	vm_map_kernel_flags_t   vmk_flags)
+{
+	kern_return_t           result;
+	vm_map_size_t           mapped_size;
+	vm_map_size_t           tmp_size;
+	vm_map_entry_t          src_entry;     /* result of last map lookup */
+	vm_map_entry_t          new_entry;
+	vm_object_offset_t      offset;
+	vm_map_offset_t         map_address;
+	vm_map_offset_t         src_start;     /* start of entry to map */
+	vm_map_offset_t         src_end;       /* end of region to be mapped */
+	vm_object_t             object;
+	vm_map_version_t        version;
+	boolean_t               src_needs_copy;
+	boolean_t               new_entry_needs_copy;
+	vm_map_entry_t          saved_src_entry;
+	boolean_t               src_entry_was_wired;
+	vm_prot_t               max_prot_for_prot_copy;
+
+	assert(map != VM_MAP_NULL);
+	assert(size != 0);
+	assert(size == vm_map_round_page(size, PAGE_MASK));
+	assert(inheritance == VM_INHERIT_NONE ||
+	    inheritance == VM_INHERIT_COPY ||
+	    inheritance == VM_INHERIT_SHARE);
+
+	/*
+	 *	Compute start and end of region.
+	 */
+	src_start = vm_map_trunc_page(addr, PAGE_MASK);
+	src_end = vm_map_round_page(src_start + size, PAGE_MASK);
+
+
+	/*
+	 *	Initialize map_header.
+	 */
+	map_header->links.next = CAST_TO_VM_MAP_ENTRY(&map_header->links);
+	map_header->links.prev = CAST_TO_VM_MAP_ENTRY(&map_header->links);
+	map_header->nentries = 0;
+	map_header->entries_pageable = pageable;
+	map_header->page_shift = PAGE_SHIFT;
+
+	vm_map_store_init( map_header );
+
+	if (copy && vmk_flags.vmkf_remap_prot_copy) {
+		max_prot_for_prot_copy = *max_protection & VM_PROT_ALL;
+	} else {
+		max_prot_for_prot_copy = VM_PROT_NONE;
+	}
+	*cur_protection = VM_PROT_ALL;
+	*max_protection = VM_PROT_ALL;
+
+	map_address = 0;
+	mapped_size = 0;
+	result = KERN_SUCCESS;
+
+	/*
+	 *	The specified source virtual space might correspond to
+	 *	multiple map entries, need to loop on them.
+	 */
+	vm_map_lock(map);
+	while (mapped_size != size) {
+		vm_map_size_t   entry_size;
+
+		/*
+		 *	Find the beginning of the region.
+		 */
+		if (!vm_map_lookup_entry(map, src_start, &src_entry)) {
+			result = KERN_INVALID_ADDRESS;
+			break;
+		}
+
+		if (src_start < src_entry->vme_start ||
+		    (mapped_size && src_start != src_entry->vme_start)) {
+			result = KERN_INVALID_ADDRESS;
+			break;
+		}
+
+		tmp_size = size - mapped_size;
+		if (src_end > src_entry->vme_end) {
+			tmp_size -= (src_end - src_entry->vme_end);
+		}
+
+		entry_size = (vm_map_size_t)(src_entry->vme_end -
+		    src_entry->vme_start);
+
+		if (src_entry->is_sub_map) {
+			vm_map_reference(VME_SUBMAP(src_entry));
+			object = VM_OBJECT_NULL;
+		} else {
+			object = VME_OBJECT(src_entry);
+			if (src_entry->iokit_acct) {
+				/*
+				 * This entry uses "IOKit accounting".
+				 */
+			} else if (object != VM_OBJECT_NULL &&
+			    (object->purgable != VM_PURGABLE_DENY ||
+			    object->vo_ledger_tag != VM_LEDGER_TAG_NONE)) {
+				/*
+				 * Purgeable objects have their own accounting:
+				 * no pmap accounting for them.
+				 */
+				assertf(!src_entry->use_pmap,
+				    "map=%p src_entry=%p [0x%llx:0x%llx] 0x%x/0x%x %d",
+				    map,
+				    src_entry,
+				    (uint64_t)src_entry->vme_start,
+				    (uint64_t)src_entry->vme_end,
+				    src_entry->protection,
+				    src_entry->max_protection,
+				    VME_ALIAS(src_entry));
+			} else {
+				/*
+				 * Not IOKit or purgeable:
+				 * must be accounted by pmap stats.
+				 */
+				assertf(src_entry->use_pmap,
+				    "map=%p src_entry=%p [0x%llx:0x%llx] 0x%x/0x%x %d",
+				    map,
+				    src_entry,
+				    (uint64_t)src_entry->vme_start,
+				    (uint64_t)src_entry->vme_end,
+				    src_entry->protection,
+				    src_entry->max_protection,
+				    VME_ALIAS(src_entry));
+			}
+
+			if (object == VM_OBJECT_NULL) {
+				object = vm_object_allocate(entry_size);
+				VME_OFFSET_SET(src_entry, 0);
+				VME_OBJECT_SET(src_entry, object);
+				assert(src_entry->use_pmap);
+			} else if (object->copy_strategy !=
+			    MEMORY_OBJECT_COPY_SYMMETRIC) {
+				/*
+				 *	We are already using an asymmetric
+				 *	copy, and therefore we already have
+				 *	the right object.
+				 */
+				assert(!src_entry->needs_copy);
+			} else if (src_entry->needs_copy || object->shadowed ||
+			    (object->internal && !object->true_share &&
+			    !src_entry->is_shared &&
+			    object->vo_size > entry_size)) {
+				VME_OBJECT_SHADOW(src_entry, entry_size);
+				assert(src_entry->use_pmap);
+
+				if (!src_entry->needs_copy &&
+				    (src_entry->protection & VM_PROT_WRITE)) {
+					vm_prot_t prot;
+
+					assert(!pmap_has_prot_policy(src_entry->protection));
+
+					prot = src_entry->protection & ~VM_PROT_WRITE;
+
+					if (override_nx(map,
+					    VME_ALIAS(src_entry))
+					    && prot) {
+						prot |= VM_PROT_EXECUTE;
+					}
+
+					assert(!pmap_has_prot_policy(prot));
+
+					if (map->mapped_in_other_pmaps) {
+						vm_object_pmap_protect(
+							VME_OBJECT(src_entry),
+							VME_OFFSET(src_entry),
+							entry_size,
+							PMAP_NULL,
+							src_entry->vme_start,
+							prot);
+					} else {
+						pmap_protect(vm_map_pmap(map),
+						    src_entry->vme_start,
+						    src_entry->vme_end,
+						    prot);
+					}
+				}
+
+				object = VME_OBJECT(src_entry);
+				src_entry->needs_copy = FALSE;
+			}
+
+
+			vm_object_lock(object);
+			vm_object_reference_locked(object); /* object ref. for new entry */
+			if (object->copy_strategy ==
+			    MEMORY_OBJECT_COPY_SYMMETRIC) {
+				object->copy_strategy =
+				    MEMORY_OBJECT_COPY_DELAY;
+			}
+			vm_object_unlock(object);
+		}
+
+		offset = (VME_OFFSET(src_entry) +
+		    (src_start - src_entry->vme_start));
+
+		new_entry = _vm_map_entry_create(map_header, !map_header->entries_pageable);
+		vm_map_entry_copy(new_entry, src_entry);
+		if (new_entry->is_sub_map) {
+			/* clr address space specifics */
+			new_entry->use_pmap = FALSE;
+		} else if (copy) {
+			/*
+			 * We're dealing with a copy-on-write operation,
+			 * so the resulting mapping should not inherit the
+			 * original mapping's accounting settings.
+			 * "use_pmap" should be reset to its default (TRUE)
+			 * so that the new mapping gets accounted for in
+			 * the task's memory footprint.
+			 */
+			new_entry->use_pmap = TRUE;
+		}
+		/* "iokit_acct" was cleared in vm_map_entry_copy() */
+		assert(!new_entry->iokit_acct);
+
+		new_entry->map_aligned = FALSE;
+
+		new_entry->vme_start = map_address;
+		new_entry->vme_end = map_address + tmp_size;
+		assert(new_entry->vme_start < new_entry->vme_end);
+		if (copy && vmk_flags.vmkf_remap_prot_copy) {
+			/*
+			 * Remapping for vm_map_protect(VM_PROT_COPY)
+			 * to convert a read-only mapping into a
+			 * copy-on-write version of itself but
+			 * with write access:
+			 * keep the original inheritance and add
+			 * VM_PROT_WRITE to the max protection.
+			 */
+			new_entry->inheritance = src_entry->inheritance;
+			new_entry->protection &= max_prot_for_prot_copy;
+			new_entry->max_protection |= VM_PROT_WRITE;
+		} else {
+			new_entry->inheritance = inheritance;
+		}
+		VME_OFFSET_SET(new_entry, offset);
+
+		/*
+		 * The new region has to be copied now if required.
+		 */
+RestartCopy:
+		if (!copy) {
+			if (src_entry->used_for_jit == TRUE) {
+				if (same_map) {
+				} else {
+#if CONFIG_EMBEDDED
+					/*
+					 * Cannot allow an entry describing a JIT
+					 * region to be shared across address spaces.
+					 */
+					result = KERN_INVALID_ARGUMENT;
+					break;
+#endif /* CONFIG_EMBEDDED */
+				}
+			}
+
+			src_entry->is_shared = TRUE;
+			new_entry->is_shared = TRUE;
+			if (!(new_entry->is_sub_map)) {
+				new_entry->needs_copy = FALSE;
+			}
+		} else if (src_entry->is_sub_map) {
+			/* make this a COW sub_map if not already */
+			assert(new_entry->wired_count == 0);
+			new_entry->needs_copy = TRUE;
+			object = VM_OBJECT_NULL;
+		} else if (src_entry->wired_count == 0 &&
+		    vm_object_copy_quickly(VME_OBJECT_PTR(new_entry),
+		    VME_OFFSET(new_entry),
+		    (new_entry->vme_end -
+		    new_entry->vme_start),
+		    &src_needs_copy,
+		    &new_entry_needs_copy)) {
+			new_entry->needs_copy = new_entry_needs_copy;
+			new_entry->is_shared = FALSE;
+			assertf(new_entry->use_pmap, "map %p new_entry %p\n", map, new_entry);
+
+			/*
+			 * Handle copy_on_write semantics.
+			 */
+			if (src_needs_copy && !src_entry->needs_copy) {
+				vm_prot_t prot;
+
+				assert(!pmap_has_prot_policy(src_entry->protection));
+
+				prot = src_entry->protection & ~VM_PROT_WRITE;
+
+				if (override_nx(map,
+				    VME_ALIAS(src_entry))
+				    && prot) {
+					prot |= VM_PROT_EXECUTE;
+				}
+
+				assert(!pmap_has_prot_policy(prot));
+
+				vm_object_pmap_protect(object,
+				    offset,
+				    entry_size,
+				    ((src_entry->is_shared
+				    || map->mapped_in_other_pmaps) ?
+				    PMAP_NULL : map->pmap),
+				    src_entry->vme_start,
+				    prot);
+
+				assert(src_entry->wired_count == 0);
+				src_entry->needs_copy = TRUE;
+			}
+			/*
+			 * Throw away the old object reference of the new entry.
+			 */
+			vm_object_deallocate(object);
+		} else {
+			new_entry->is_shared = FALSE;
+			assertf(new_entry->use_pmap, "map %p new_entry %p\n", map, new_entry);
+
+			src_entry_was_wired = (src_entry->wired_count > 0);
+			saved_src_entry = src_entry;
+			src_entry = VM_MAP_ENTRY_NULL;
+
+			/*
+			 * The map can be safely unlocked since we
+			 * already hold a reference on the object.
+			 *
+			 * Record the timestamp of the map for later
+			 * verification, and unlock the map.
+			 */
+			version.main_timestamp = map->timestamp;
+			vm_map_unlock(map);     /* Increments timestamp once! */
+
+			/*
+			 * Perform the copy.
+			 */
+			if (src_entry_was_wired > 0) {
+				vm_object_lock(object);
+				result = vm_object_copy_slowly(
+					object,
+					offset,
+					(new_entry->vme_end -
+					new_entry->vme_start),
+					THREAD_UNINT,
+					VME_OBJECT_PTR(new_entry));
+
+				VME_OFFSET_SET(new_entry, 0);
+				new_entry->needs_copy = FALSE;
+			} else {
+				vm_object_offset_t new_offset;
+
+				new_offset = VME_OFFSET(new_entry);
+				result = vm_object_copy_strategically(
+					object,
+					offset,
+					(new_entry->vme_end -
+					new_entry->vme_start),
+					VME_OBJECT_PTR(new_entry),
+					&new_offset,
+					&new_entry_needs_copy);
+				if (new_offset != VME_OFFSET(new_entry)) {
+					VME_OFFSET_SET(new_entry, new_offset);
+				}
+
+				new_entry->needs_copy = new_entry_needs_copy;
+			}
+
+			/*
+			 * Throw away the old object reference of the new entry.
+			 */
+			vm_object_deallocate(object);
+
+			if (result != KERN_SUCCESS &&
+			    result != KERN_MEMORY_RESTART_COPY) {
+				_vm_map_entry_dispose(map_header, new_entry);
+				vm_map_lock(map);
+				break;
+			}
+
+			/*
+			 * Verify that the map has not substantially
+			 * changed while the copy was being made.
+			 */
+
+			vm_map_lock(map);
+			if (version.main_timestamp + 1 != map->timestamp) {
+				/*
+				 * Simple version comparison failed.
+				 *
+				 * Retry the lookup and verify that the
+				 * same object/offset are still present.
+				 */
+				saved_src_entry = VM_MAP_ENTRY_NULL;
+				vm_object_deallocate(VME_OBJECT(new_entry));
+				_vm_map_entry_dispose(map_header, new_entry);
+				if (result == KERN_MEMORY_RESTART_COPY) {
+					result = KERN_SUCCESS;
+				}
+				continue;
+			}
+			/* map hasn't changed: src_entry is still valid */
+			src_entry = saved_src_entry;
+			saved_src_entry = VM_MAP_ENTRY_NULL;
+
+			if (result == KERN_MEMORY_RESTART_COPY) {
+				vm_object_reference(object);
+				goto RestartCopy;
+			}
+		}
+
+		_vm_map_store_entry_link(map_header,
+		    map_header->links.prev, new_entry);
+
+		/*Protections for submap mapping are irrelevant here*/
+		if (!src_entry->is_sub_map) {
+			*cur_protection &= src_entry->protection;
+			*max_protection &= src_entry->max_protection;
+		}
+		map_address += tmp_size;
+		mapped_size += tmp_size;
+		src_start += tmp_size;
+	} /* end while */
+
+	vm_map_unlock(map);
+	if (result != KERN_SUCCESS) {
+		/*
+		 * Free all allocated elements.
+		 */
+		for (src_entry = map_header->links.next;
+		    src_entry != CAST_TO_VM_MAP_ENTRY(&map_header->links);
+		    src_entry = new_entry) {
+			new_entry = src_entry->vme_next;
+			_vm_map_store_entry_unlink(map_header, src_entry);
+			if (src_entry->is_sub_map) {
+				vm_map_deallocate(VME_SUBMAP(src_entry));
+			} else {
+				vm_object_deallocate(VME_OBJECT(src_entry));
+			}
+			_vm_map_entry_dispose(map_header, src_entry);
+		}
+	}
+	return result;
+}
+
+/*
+ *	Routine:	vm_map_remap
+ *
+ *			Map a portion of src_map's address space into
+ *			target_map, sharing it or (if "copy") copying it.
+ *			The source range may span several map entries.
+ *			cur_protection and max_protection return the
+ *			intersection of the source entries' protections.
+ *			Source and target maps can be identical.
+ *			On success, *address is the new mapping's address.
+ */
+kern_return_t
+vm_map_remap(
+	vm_map_t                target_map,
+	vm_map_address_t        *address,       /* IN/OUT */
+	vm_map_size_t           size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	vm_tag_t                tag,
+	vm_map_t                src_map,
+	vm_map_offset_t         memory_address,
+	boolean_t               copy,
+	vm_prot_t               *cur_protection,        /* OUT */
+	vm_prot_t               *max_protection,        /* IN/OUT */
+	vm_inherit_t            inheritance)
+{
+	kern_return_t           result;
+	vm_map_entry_t          entry;
+	vm_map_entry_t          insp_entry = VM_MAP_ENTRY_NULL; /* set by range_allocate on success */
+	vm_map_entry_t          new_entry;
+	struct vm_map_header    map_header;     /* temporary list of extracted entries */
+	vm_map_offset_t         offset_in_mapping = 0;
+
+	if (target_map == VM_MAP_NULL) {
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	switch (inheritance) {
+	case VM_INHERIT_NONE:
+	case VM_INHERIT_COPY:
+	case VM_INHERIT_SHARE:
+		if (size != 0 && src_map != VM_MAP_NULL) {
+			break;
+		}
+	/*FALL THRU*/
+	default:
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	/*
+	 * If the user is requesting that we return the address of the
+	 * first byte of the data (rather than the base of the page),
+	 * then we use different rounding semantics: specifically,
+	 * we assume that (memory_address, size) describes a region
+	 * all of whose pages we must cover, rather than a base to be truncated
+	 * down and a size to be added to that base.  So we figure out
+	 * the highest page that the requested region includes and make
+	 * sure that the size will cover it.
+	 *
+	 * The key example we're worried about is of the form:
+	 *
+	 *              memory_address = 0x1ff0, size = 0x20
+	 *
+	 * With the old semantics, we round down the memory_address to 0x1000
+	 * and round up the size to 0x1000, resulting in our covering *only*
+	 * page 0x1000.  With the new semantics, we'd realize that the region covers
+	 * 0x1ff0-0x2010, and compute a size of 0x2000.  Thus, we cover both page
+	 * 0x1000 and page 0x2000 in the region we remap.
+	 */
+	if ((flags & VM_FLAGS_RETURN_DATA_ADDR) != 0) {
+		offset_in_mapping = memory_address - vm_map_trunc_page(memory_address, PAGE_MASK);
+		size = vm_map_round_page(memory_address + size - vm_map_trunc_page(memory_address, PAGE_MASK), PAGE_MASK);
+	} else {
+		size = vm_map_round_page(size, PAGE_MASK);
+	}
+	if (size == 0) {        /* rounding wrapped around to zero */
+		return KERN_INVALID_ARGUMENT;
+	}
+
+	if (flags & VM_FLAGS_RESILIENT_MEDIA) {
+		/* must be copy-on-write to be "media resilient" */
+		if (!copy) {
+			return KERN_INVALID_ARGUMENT;
+		}
+	}
+
+	result = vm_map_remap_extract(src_map, memory_address,
+	    size, copy, &map_header,
+	    cur_protection,
+	    max_protection,
+	    inheritance,
+	    target_map->hdr.entries_pageable,
+	    src_map == target_map,
+	    vmk_flags);
+
+	if (result != KERN_SUCCESS) {
+		return result;
+	}
+
+	/*
+	 * Allocate/check a range of free virtual address
+	 * space for the target
+	 */
+	*address = vm_map_trunc_page(*address,
+	    VM_MAP_PAGE_MASK(target_map));
+	vm_map_lock(target_map);
+	result = vm_map_remap_range_allocate(target_map, address, size,
+	    mask, flags, vmk_flags, tag,
+	    &insp_entry);
+
+	for (entry = map_header.links.next;
+	    entry != CAST_TO_VM_MAP_ENTRY(&map_header.links);
+	    entry = new_entry) {
+		new_entry = entry->vme_next;    /* fetch successor before unlinking */
+		_vm_map_store_entry_unlink(&map_header, entry);
+		if (result == KERN_SUCCESS) {
+			if (flags & VM_FLAGS_RESILIENT_CODESIGN) {
+				/* no codesigning -> read-only access */
+				entry->max_protection = VM_PROT_READ;
+				entry->protection = VM_PROT_READ;
+				entry->vme_resilient_codesign = TRUE;
+			}
+			entry->vme_start += *address;   /* extracted entries start at 0: rebase */
+			entry->vme_end += *address;
+			assert(!entry->map_aligned);
+			if ((flags & VM_FLAGS_RESILIENT_MEDIA) &&
+			    !entry->is_sub_map &&
+			    (VME_OBJECT(entry) == VM_OBJECT_NULL ||
+			    VME_OBJECT(entry)->internal)) {
+				entry->vme_resilient_media = TRUE;
+			}
+			vm_map_store_entry_link(target_map, insp_entry, entry,
+			    vmk_flags);
+			insp_entry = entry;     /* next entry is linked after this one */
+		} else {
+			/* allocation failed: drop the references taken by the extract */
+			if (!entry->is_sub_map) {
+				vm_object_deallocate(VME_OBJECT(entry));
+			} else {
+				vm_map_deallocate(VME_SUBMAP(entry));
+			}
+			_vm_map_entry_dispose(&map_header, entry);
+		}
+	}
+
+	if (flags & VM_FLAGS_RESILIENT_CODESIGN) {
+		*cur_protection = VM_PROT_READ;
+		*max_protection = VM_PROT_READ;
+	}
+	/* insp_entry is still VM_MAP_ENTRY_NULL if the range allocation failed */
+	if (result == KERN_SUCCESS && target_map->disable_vmentry_reuse == TRUE) {
+		assert(!target_map->is_nested_map);
+		if (target_map->highest_entry_end < insp_entry->vme_end) {
+			target_map->highest_entry_end = insp_entry->vme_end;
+		}
+	}
+
+	if (result == KERN_SUCCESS) {
+		target_map->size += size;
+		SAVE_HINT_MAP_WRITE(target_map, insp_entry);
+
+#if PMAP_CS
+		if (*max_protection & VM_PROT_EXECUTE) {
+			vm_map_address_t region_start = 0, region_size = 0;
+			struct pmap_cs_code_directory *region_cd = NULL;
+			vm_map_address_t base = 0;
+			struct pmap_cs_lookup_results results = {};
+			vm_map_size_t page_addr = vm_map_trunc_page(memory_address, PAGE_MASK);
+			vm_map_size_t assoc_size = vm_map_round_page(memory_address + size - page_addr, PAGE_MASK);
+
+			pmap_cs_lookup(src_map->pmap, memory_address, &results);
+			region_size = results.region_size;
+			region_start = results.region_start;
+			region_cd = results.region_cd_entry;
+			base = results.base;
+
+			if (region_cd != NULL && (page_addr != region_start || assoc_size != region_size)) {
+				*cur_protection = VM_PROT_READ;
+				*max_protection = VM_PROT_READ;
+				printf("mismatched remap of executable range 0x%llx-0x%llx to 0x%llx, "
+				    "region_start 0x%llx, region_size 0x%llx, cd_entry %sNULL, making non-executable.\n",
+				    page_addr, page_addr + assoc_size, *address,
+				    region_start, region_size,
+				    region_cd != NULL ? "not " : ""                     // Don't leak kernel slide
+				    );
+			}
+		}
+#endif
+	}
+	vm_map_unlock(target_map);
+
+	if (result == KERN_SUCCESS && target_map->wiring_required) {
+		result = vm_map_wire_kernel(target_map, *address,
+		    *address + size, *cur_protection, VM_KERN_MEMORY_MLOCK,
+		    TRUE);
+	}
+
+	/*
+	 * If requested, return the address of the data pointed to by the
+	 * request, rather than the base of the resulting page.
+	 */
+	if ((flags & VM_FLAGS_RETURN_DATA_ADDR) != 0) {
+		*address += offset_in_mapping;
+	}
+
+	return result;
+}
+
+/*
+ *	Routine:	vm_map_remap_range_allocate
+ *
+ *	Description:
+ *		Allocate a range in the specified virtual address map.
+ *		Returns the address (in *address) and the map entry just
+ *		before the allocated range (in *map_entry).
+ *
+ *	Map must be locked.
+ */
+
+static kern_return_t
+vm_map_remap_range_allocate(
+	vm_map_t                map,
+	vm_map_address_t        *address,       /* IN/OUT */
+	vm_map_size_t           size,
+	vm_map_offset_t         mask,
+	int                     flags,
+	vm_map_kernel_flags_t   vmk_flags,
+	__unused vm_tag_t       tag,
+	vm_map_entry_t          *map_entry)     /* OUT */
+{
+	vm_map_entry_t  entry;
+	vm_map_offset_t start;
+	vm_map_offset_t end;
+	vm_map_offset_t desired_empty_end;
+	kern_return_t   kr;
+	vm_map_entry_t          hole_entry;
+
+StartAgain:;    /* retried from here after waiting for space */
+
+	start = *address;       /* caller-supplied address (a starting point if ANYWHERE) */
+
+	if (flags & VM_FLAGS_ANYWHERE) {
+		if (flags & VM_FLAGS_RANDOM_ADDR) {
+			/*
+			 * Get a random start address.
+			 */
+			kr = vm_map_random_address_for_size(map, address, size);
+			if (kr != KERN_SUCCESS) {
+				return kr;
+			}
+			start = *address;
+		}
+
+		/*
+		 *	Calculate the first possible address.
 		 */
-		
-		assert(!(object->shadowed && old_entry->is_shared));
-		vm_object_shadow(&old_entry->object.vm_object,
-				 &old_entry->offset,
-				 (vm_size_t) (old_entry->vme_end -
-					      old_entry->vme_start));
-		
+
+		if (start < map->min_offset) {
+			start = map->min_offset;        /* clamp up to the map's lower bound */
+		}
+		if (start > map->max_offset) {
+			return KERN_NO_SPACE;
+		}
+
 		/*
-		 *	If we're making a shadow for other than
-		 *	copy on write reasons, then we have
-		 *	to remove write permission.
+		 *	Look for the first possible address;
+		 *	if there's already something at this
+		 *	address, we have to start after it.
 		 */
 
-/* CDY FIX this! page_protect! */
-		if (!old_entry->needs_copy &&
-		    (old_entry->protection & VM_PROT_WRITE)) {
-			if(old_entry->is_sub_map && old_entry->use_pmap) {
-				pmap_protect(old_entry->object.sub_map->pmap,
-				     old_entry->vme_start,
-				     old_entry->vme_end,
-				     old_entry->protection & ~VM_PROT_WRITE);
+		if (map->disable_vmentry_reuse == TRUE) {
+			VM_MAP_HIGHEST_ENTRY(map, entry, start);
+		} else {
+			if (map->holelistenabled) {
+				hole_entry = CAST_TO_VM_MAP_ENTRY(map->holes_list);
+
+				if (hole_entry == NULL) {
+					/*
+					 * No more space in the map?
+					 */
+					return KERN_NO_SPACE;
+				} else {
+					boolean_t found_hole = FALSE;
+
+					do {    /* walk the circular hole list once */
+						if (hole_entry->vme_start >= start) {
+							start = hole_entry->vme_start;  /* hole lies at or above start */
+							found_hole = TRUE;
+							break;
+						}
+
+						if (hole_entry->vme_end > start) {      /* start falls inside this hole */
+							found_hole = TRUE;
+							break;
+						}
+						hole_entry = hole_entry->vme_next;
+					} while (hole_entry != CAST_TO_VM_MAP_ENTRY(map->holes_list));
+
+					if (found_hole == FALSE) {
+						return KERN_NO_SPACE;
+					}
+
+					entry = hole_entry;     /* here "entry" is a hole, not a mapping */
+				}
 			} else {
-				pmap_protect(vm_map_pmap(old_map),
-				     old_entry->vme_start,
-				     old_entry->vme_end,
-				     old_entry->protection & ~VM_PROT_WRITE);
+				assert(first_free_is_valid(map));
+				if (start == map->min_offset) {
+					if ((entry = map->first_free) != vm_map_to_entry(map)) {
+						start = entry->vme_end;
+					}
+				} else {
+					vm_map_entry_t  tmp_entry;
+					if (vm_map_lookup_entry(map, start, &tmp_entry)) {
+						start = tmp_entry->vme_end;     /* address in use: begin after it */
+					}
+					entry = tmp_entry;
+				}
 			}
+			start = vm_map_round_page(start,
+			    VM_MAP_PAGE_MASK(map));
 		}
-		
-		old_entry->needs_copy = FALSE;
-		object = old_entry->object.vm_object;
-	}
-	
-	/*
-	 *	If object was using a symmetric copy strategy,
-	 *	change its copy strategy to the default
-	 *	asymmetric copy strategy, which is copy_delay
-	 *	in the non-norma case and copy_call in the
-	 *	norma case. Bump the reference count for the
-	 *	new entry.
-	 */
-	
-	if(old_entry->is_sub_map) {
-		vm_map_lock(old_entry->object.sub_map);
-		vm_map_reference(old_entry->object.sub_map);
-		vm_map_unlock(old_entry->object.sub_map);
-	} else {
-		vm_object_lock(object);
-		object->ref_count++;
-		vm_object_res_reference(object);
-		if (object->copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC) {
-			object->copy_strategy = MEMORY_OBJECT_COPY_DELAY;
+
+		/*
+		 *	In any case, the "entry" always precedes
+		 *	the proposed new region throughout the
+		 *	loop:
+		 */
+
+		while (TRUE) {
+			vm_map_entry_t  next;
+
+			/*
+			 *	Find the end of the proposed new region.
+			 *	Be sure we didn't go beyond the end, or
+			 *	wrap around the address.
+			 */
+
+			end = ((start + mask) & ~mask); /* align start upward per mask */
+			end = vm_map_round_page(end,
+			    VM_MAP_PAGE_MASK(map));
+			if (end < start) {      /* alignment wrapped around */
+				return KERN_NO_SPACE;
+			}
+			start = end;
+			end += size;
+
+			/* We want an entire page of empty space, but don't increase the allocation size. */
+			desired_empty_end = vm_map_round_page(end, VM_MAP_PAGE_MASK(map));
+
+			if ((desired_empty_end > map->max_offset) || (desired_empty_end < start)) {
+				if (map->wait_for_space) {
+					if (size <= (map->max_offset -
+					    map->min_offset)) {
+						assert_wait((event_t) map, THREAD_INTERRUPTIBLE);
+						vm_map_unlock(map);     /* map is unlocked while blocked */
+						thread_block(THREAD_CONTINUE_NULL);
+						vm_map_lock(map);
+						goto StartAgain;
+					}
+				}
+
+				return KERN_NO_SPACE;
+			}
+
+			next = entry->vme_next;
+
+			if (map->holelistenabled) {
+				if (entry->vme_end >= desired_empty_end) {      /* current hole is big enough */
+					break;
+				}
+			} else {
+				/*
+				 *	If there are no more entries, we must win.
+				 *
+				 *	OR
+				 *
+				 *	If there is another entry, it must be
+				 *	after the end of the potential new region.
+				 */
+
+				if (next == vm_map_to_entry(map)) {
+					break;
+				}
+
+				if (next->vme_start >= desired_empty_end) {
+					break;
+				}
+			}
+
+			/*
+			 *	Didn't fit -- move to the next entry.
+			 */
+
+			entry = next;
+
+			if (map->holelistenabled) {
+				if (entry == CAST_TO_VM_MAP_ENTRY(map->holes_list)) {
+					/*
+					 * Wrapped around
+					 */
+					return KERN_NO_SPACE;
+				}
+				start = entry->vme_start;       /* try from the start of the next hole */
+			} else {
+				start = entry->vme_end; /* try right after the next mapping */
+			}
 		}
-		vm_object_unlock(object);
-	}
-	
-	/*
-	 *	Clone the entry, using object ref from above.
-	 *	Mark both entries as shared.
-	 */
-	
-	new_entry = vm_map_entry_create(new_map);
-	vm_map_entry_copy(new_entry, old_entry);
-	old_entry->is_shared = TRUE;
-	new_entry->is_shared = TRUE;
-	
-	/*
-	 *	Insert the entry into the new map -- we
-	 *	know we're inserting at the end of the new
-	 *	map.
-	 */
-	
-	vm_map_entry_link(new_map, vm_map_last_entry(new_map), new_entry);
-	
-	/*
-	 *	Update the physical map
-	 */
-	
-	if (old_entry->is_sub_map) {
-		/* Bill Angell pmap support goes here */
+
+		if (map->holelistenabled) {
+			/* the lookup is expected to miss; presumably it leaves "entry" at the preceding mapping -- confirm */
+			if (vm_map_lookup_entry(map, entry->vme_start, &entry)) {
+				panic("Found an existing entry (%p) instead of potential hole at address: 0x%llx.\n", entry, (unsigned long long)entry->vme_start);
+			}
+		}
+
+		*address = start;
 	} else {
-		pmap_copy(new_map->pmap, old_map->pmap, new_entry->vme_start,
-		  old_entry->vme_end - old_entry->vme_start,
-		  old_entry->vme_start);
-	}
-}
+		vm_map_entry_t          temp_entry;
+
+		/*
+		 *	Verify that:
+		 *		the address doesn't itself violate
+		 *		the mask requirement.
+		 */
+
+		if ((start & mask) != 0) {
+			return KERN_NO_SPACE;
+		}
 
-boolean_t
-vm_map_fork_copy(
-	vm_map_t	old_map,
-	vm_map_entry_t	*old_entry_p,
-	vm_map_t	new_map)
-{
-	vm_map_entry_t old_entry = *old_entry_p;
-	vm_size_t entry_size = old_entry->vme_end - old_entry->vme_start;
-	vm_offset_t start = old_entry->vme_start;
-	vm_map_copy_t copy;
-	vm_map_entry_t last = vm_map_last_entry(new_map);
 
-	vm_map_unlock(old_map);
-	/*
-	 *	Use maxprot version of copyin because we
-	 *	care about whether this memory can ever
-	 *	be accessed, not just whether it's accessible
-	 *	right now.
-	 */
-	if (vm_map_copyin_maxprot(old_map, start, entry_size, FALSE, &copy)
-	    != KERN_SUCCESS) {
 		/*
-		 *	The map might have changed while it
-		 *	was unlocked, check it again.  Skip
-		 *	any blank space or permanently
-		 *	unreadable region.
+		 *	...	the address is within bounds
 		 */
-		vm_map_lock(old_map);
-		if (!vm_map_lookup_entry(old_map, start, &last) ||
-		    last->max_protection & VM_PROT_READ ==
-					 VM_PROT_NONE) {
-			last = last->vme_next;
+
+		end = start + size;
+
+		if ((start < map->min_offset) ||
+		    (end > map->max_offset) ||
+		    (start >= end)) {   /* also rejects start + size wrapping */
+			return KERN_INVALID_ADDRESS;
 		}
-		*old_entry_p = last;
 
 		/*
-		 * XXX	For some error returns, want to
-		 * XXX	skip to the next element.  Note
-		 *	that INVALID_ADDRESS and
-		 *	PROTECTION_FAILURE are handled above.
+		 * If we're asked to overwrite whatever was mapped in that
+		 * range, first deallocate that range.
 		 */
-		
-		return FALSE;
+		if (flags & VM_FLAGS_OVERWRITE) {
+			vm_map_t zap_map;
+			int remove_flags = VM_MAP_REMOVE_SAVE_ENTRIES | VM_MAP_REMOVE_NO_MAP_ALIGN;
+
+			/*
+			 * We use a "zap_map" to avoid having to unlock
+			 * the "map" in vm_map_delete(), which would compromise
+			 * the atomicity of the "deallocate" and then "remap"
+			 * combination.
+			 */
+			zap_map = vm_map_create(PMAP_NULL,
+			    start,
+			    end,
+			    map->hdr.entries_pageable);
+			if (zap_map == VM_MAP_NULL) {
+				return KERN_RESOURCE_SHORTAGE;
+			}
+			vm_map_set_page_shift(zap_map, VM_MAP_PAGE_SHIFT(map));
+			vm_map_disable_hole_optimization(zap_map);
+
+			if (vmk_flags.vmkf_overwrite_immutable) {
+				remove_flags |= VM_MAP_REMOVE_IMMUTABLE;
+			}
+			kr = vm_map_delete(map, start, end,
+			    remove_flags,
+			    zap_map);
+			if (kr == KERN_SUCCESS) {       /* NOTE(review): zap_map is not destroyed when the delete fails -- confirm intended */
+				vm_map_destroy(zap_map,
+				    VM_MAP_REMOVE_NO_PMAP_CLEANUP);
+				zap_map = VM_MAP_NULL;
+			}
+		}
+
+		/*
+		 *	...	the starting address isn't allocated
+		 */
+
+		if (vm_map_lookup_entry(map, start, &temp_entry)) {
+			return KERN_NO_SPACE;
+		}
+
+		entry = temp_entry;
+
+		/*
+		 *	...	the next region doesn't overlap the
+		 *		end point.
+		 */
+
+		if ((entry->vme_next != vm_map_to_entry(map)) &&
+		    (entry->vme_next->vme_start < end)) {
+			return KERN_NO_SPACE;
+		}
 	}
-	
-	/*
-	 *	Insert the copy into the new map
-	 */
-	
-	vm_map_copy_insert(new_map, last, copy);
-	
+	*map_entry = entry;     /* only written on the success path */
+	return KERN_SUCCESS;
+}
+
+/*
+ *	vm_map_switch:
+ *	Set the address map for the current thread to the specified map.
+ *	Returns the map found in thread->map on entry.
+ */
+
+vm_map_t
+vm_map_switch(
+	vm_map_t        map)
+{
+	int             mycpu;
+	thread_t        thread = current_thread();
+	vm_map_t        oldmap = thread->map;   /* captured before the switch; returned to the caller */
+
+	mp_disable_preemption();        /* preemption stays off from cpu_number() through the switch */
+	mycpu = cpu_number();
+
 	/*
-	 *	Pick up the traversal at the end of
-	 *	the copied region.
+	 *	Deactivate the current map and activate the requested map
 	 */
-	
-	vm_map_lock(old_map);
-	start += entry_size;
-	if (! vm_map_lookup_entry(old_map, start, &last)) {
-		last = last->vme_next;
+	PMAP_SWITCH_USER(thread, map, mycpu);
+
+	mp_enable_preemption();
+	return oldmap;
+}
+
+
+/*
+ *	Routine:	vm_map_write_user
+ *
+ *	Description:
+ *		Copy out data from kernel space into space in the
+ *		destination map. The space must already exist in the
+ *		destination map.
+ *		NOTE:  This routine should only be called by threads
+ *		which can block on a page fault. i.e. kernel mode user
+ *		threads.
+ *		Returns KERN_INVALID_ADDRESS if copyout() fails.
+ */
+kern_return_t
+vm_map_write_user(
+	vm_map_t                map,
+	void                    *src_p,
+	vm_map_address_t        dst_addr,
+	vm_size_t               size)
+{
+	kern_return_t   kr = KERN_SUCCESS;
+
+	if (current_map() == map) {     /* already running on the destination map */
+		if (copyout(src_p, dst_addr, size)) {
+			kr = KERN_INVALID_ADDRESS;
+		}
 	} else {
-		vm_map_clip_start(old_map, last, start);
+		vm_map_t        oldmap;
+
+		/* take on the identity of the target map while doing */
+		/* the transfer */
+
+		vm_map_reference(map);  /* hold a reference for the duration of the switch */
+		oldmap = vm_map_switch(map);
+		if (copyout(src_p, dst_addr, size)) {
+			kr = KERN_INVALID_ADDRESS;
+		}
+		vm_map_switch(oldmap);  /* switch back to the original map */
+		vm_map_deallocate(map); /* drop the reference taken above */
 	}
-	*old_entry_p = last;
-
-	return TRUE;
+	return kr;
 }
 
 /*
- *	vm_map_fork:
+ *	Routine:	vm_map_read_user
  *
- *	Create and return a new map based on the old
- *	map, according to the inheritance values on the
- *	regions in that map.
+ *	Description:
+ *		Copy in data from a user space source map into the
+ *		kernel map. The space must already exist in the
+ *		kernel map.
+ *		NOTE:  This routine should only be called by threads
+ *		which can block on a page fault. i.e. kernel mode user
+ *		threads.
  *
- *	The source map must not be locked.
  */
-vm_map_t
-vm_map_fork(
-	vm_map_t	old_map)
+kern_return_t
+vm_map_read_user(
+	vm_map_t                map,
+	vm_map_address_t        src_addr,
+	void                    *dst_p,
+	vm_size_t               size)
 {
-	pmap_t		new_pmap = pmap_create((vm_size_t) 0);
-	vm_map_t	new_map;
-	vm_map_entry_t	old_entry;
-	vm_size_t	new_size = 0, entry_size;
-	vm_map_entry_t	new_entry;
-	boolean_t	src_needs_copy;
-	boolean_t	new_entry_needs_copy;
-
-	vm_map_reference_swap(old_map);
-	vm_map_lock(old_map);
-
-	new_map = vm_map_create(new_pmap,
-			old_map->min_offset,
-			old_map->max_offset,
-			old_map->hdr.entries_pageable);
-
-	for (
-	    old_entry = vm_map_first_entry(old_map);
-	    old_entry != vm_map_to_entry(old_map);
-	    ) {
-
-		entry_size = old_entry->vme_end - old_entry->vme_start;
-
-		switch (old_entry->inheritance) {
-		case VM_INHERIT_NONE:
-			break;
-
-		case VM_INHERIT_SHARE:
-			vm_map_fork_share(old_map, old_entry, new_map);
-			new_size += entry_size;
-			break;
-
-		case VM_INHERIT_COPY:
-
-			/*
-			 *	Inline the copy_quickly case;
-			 *	upon failure, fall back on call
-			 *	to vm_map_fork_copy.
-			 */
-
-			if(old_entry->is_sub_map)
-				break;
-			if (old_entry->wired_count != 0) {
-				goto slow_vm_map_fork_copy;
-			}
-
-			new_entry = vm_map_entry_create(new_map);
-			vm_map_entry_copy(new_entry, old_entry);
-			/* clear address space specifics */
-			new_entry->use_pmap = FALSE;
+	kern_return_t   kr = KERN_SUCCESS;      /* becomes KERN_INVALID_ADDRESS if copyin() fails */
 
-			if (! vm_object_copy_quickly(
-						&new_entry->object.vm_object,
-						old_entry->offset,
-						(old_entry->vme_end -
-							old_entry->vme_start),
-						&src_needs_copy,
-						&new_entry_needs_copy)) {
-				vm_map_entry_dispose(new_map, new_entry);
-				goto slow_vm_map_fork_copy;
-			}
-
-			/*
-			 *	Handle copy-on-write obligations
-			 */
-			
-			if (src_needs_copy && !old_entry->needs_copy) {
-				vm_object_pmap_protect(
-					old_entry->object.vm_object,
-					old_entry->offset,
-					(old_entry->vme_end -
-							old_entry->vme_start),
-					((old_entry->is_shared 
-						|| old_entry->is_sub_map)
-							? PMAP_NULL :
-							old_map->pmap),
-					old_entry->vme_start,
-					old_entry->protection & ~VM_PROT_WRITE);
+	if (current_map() == map) {     /* already running on the source map */
+		if (copyin(src_addr, dst_p, size)) {
+			kr = KERN_INVALID_ADDRESS;
+		}
+	} else {
+		vm_map_t        oldmap;
 
-				old_entry->needs_copy = TRUE;
-			}
-			new_entry->needs_copy = new_entry_needs_copy;
-			
-			/*
-			 *	Insert the entry at the end
-			 *	of the map.
-			 */
-			
-			vm_map_entry_link(new_map, vm_map_last_entry(new_map),
-					  new_entry);
-			new_size += entry_size;
-			break;
+		/* take on the identity of the target map while doing */
+		/* the transfer */
 
-		slow_vm_map_fork_copy:
-			if (vm_map_fork_copy(old_map, &old_entry, new_map)) {
-				new_size += entry_size;
-			}
-			continue;
+		vm_map_reference(map);  /* hold a reference for the duration of the switch */
+		oldmap = vm_map_switch(map);
+		if (copyin(src_addr, dst_p, size)) {
+			kr = KERN_INVALID_ADDRESS;
 		}
-		old_entry = old_entry->vme_next;
+		vm_map_switch(oldmap);  /* switch back to the original map */
+		vm_map_deallocate(map); /* drop the reference taken above */
 	}
-
-	new_map->size = new_size;
-	vm_map_unlock(old_map);
-	vm_map_deallocate(old_map);
-
-	return(new_map);
+	return kr;
 }
 
 
 /*
- *	vm_map_lookup_locked:
- *
- *	Finds the VM object, offset, and
- *	protection for a given virtual address in the
- *	specified map, assuming a page fault of the
- *	type specified.
- *
- *	Returns the (object, offset, protection) for
- *	this address, whether it is wired down, and whether
- *	this map has the only reference to the data in question.
- *	In order to later verify this lookup, a "version"
- *	is returned.
- *
- *	The map MUST be locked by the caller and WILL be
- *	locked on exit.  In order to guarantee the
- *	existence of the returned object, it is returned
- *	locked.
+ *	vm_map_check_protection:
  *
- *	If a lookup is requested with "write protection"
- *	specified, the map may be changed to perform virtual
- *	copying operations, although the data referenced will
- *	remain the same.
+ *	Assert that the target map allows the specified
+ *	privilege on the entire address region given.
+ *	The entire region must be allocated.
  */
-kern_return_t
-vm_map_lookup_locked(
-	vm_map_t		*var_map,	/* IN/OUT */
-	register vm_offset_t	vaddr,
-	register vm_prot_t	fault_type,
-	vm_map_version_t	*out_version,	/* OUT */
-	vm_object_t		*object,	/* OUT */
-	vm_object_offset_t	*offset,	/* OUT */
-	vm_prot_t		*out_prot,	/* OUT */
-	boolean_t		*wired,		/* OUT */
-	int			*behavior,	/* OUT */
-	vm_object_offset_t	*lo_offset,	/* OUT */
-	vm_object_offset_t	*hi_offset,	/* OUT */
-	vm_map_t		*pmap_map)
-{
-	vm_map_entry_t			entry;
-	register vm_map_t		map = *var_map;
-	vm_map_t			old_map = *var_map;
-	vm_map_t			cow_sub_map_parent = VM_MAP_NULL;
-	vm_offset_t			cow_parent_vaddr;
-	vm_offset_t			old_start;
-	vm_offset_t			old_end;
-	register vm_prot_t		prot;
-
-	*pmap_map = map;
-	RetryLookup: ;
+boolean_t
+vm_map_check_protection(vm_map_t map, vm_map_offset_t start,
+    vm_map_offset_t end, vm_prot_t protection)
+{
+	vm_map_entry_t entry;
+	vm_map_entry_t tmp_entry;
 
-	/*
-	 *	If the map has an interesting hint, try it before calling
-	 *	full blown lookup routine.
-	 */
+	vm_map_lock(map); /* held for the whole walk; every return below unlocks first */
 
-	mutex_lock(&map->s_lock);
-	entry = map->hint;
-	mutex_unlock(&map->s_lock);
+	if (start < vm_map_min(map) || end > vm_map_max(map) || start > end) { /* range must be ordered and inside the map */
+		vm_map_unlock(map);
+		return FALSE;
+	}
 
-	if ((entry == vm_map_to_entry(map)) ||
-	    (vaddr < entry->vme_start) || (vaddr >= entry->vme_end)) {
-		vm_map_entry_t	tmp_entry;
+	if (!vm_map_lookup_entry(map, start, &tmp_entry)) { /* "start" itself is not covered by any entry */
+		vm_map_unlock(map);
+		return FALSE;
+	}
+
+	entry = tmp_entry;
+
+	while (start < end) {
+		if (entry == vm_map_to_entry(map)) { /* ran off the end of the entry list before reaching "end" */
+			vm_map_unlock(map);
+			return FALSE;
+		}
 
 		/*
-		 *	Entry was either not a valid hint, or the vaddr
-		 *	was not contained in the entry, so do a full lookup.
+		 *	No holes allowed: the entry must begin at or before "start".
 		 */
-		if (!vm_map_lookup_entry(map, vaddr, &tmp_entry)) {
-			if((cow_sub_map_parent) && (cow_sub_map_parent != map))
-				vm_map_unlock(cow_sub_map_parent);
-			if((*pmap_map != map) 
-					&& (*pmap_map != cow_sub_map_parent))
-				vm_map_unlock(*pmap_map);
-			return KERN_INVALID_ADDRESS;
-		}
 
-		entry = tmp_entry;
-	}
-	if(map == old_map) {
-		old_start = entry->vme_start;
-		old_end = entry->vme_end;
-	}
+		if (start < entry->vme_start) {
+			vm_map_unlock(map);
+			return FALSE;
+		}
 
-	/*
-	 *	Handle submaps.  Drop lock on upper map, submap is
-	 *	returned locked.
-	 */
+		/*
+		 * Entry must grant every bit requested in "protection".
+		 */
 
-submap_recurse:
-	if (entry->is_sub_map) {
-		vm_offset_t		local_vaddr;
-		vm_offset_t		end_delta;
-		vm_offset_t		start_delta; 
-		vm_offset_t		object_start_delta; 
-		vm_map_entry_t		submap_entry;
-		boolean_t		mapped_needs_copy=FALSE;
+		if ((entry->protection & protection) != protection) {
+			vm_map_unlock(map);
+			return FALSE;
+		}
 
-		local_vaddr = vaddr;
+		/* resume at this entry's end and go to next entry */
 
-		if ((!entry->needs_copy) && (entry->use_pmap)) {
-			/* if pmap_map equals map we unlock below */
-			if ((*pmap_map != map) && 
-					(*pmap_map != cow_sub_map_parent))
-				vm_map_unlock(*pmap_map);
-			*pmap_map = entry->object.sub_map;
-		}
+		start = entry->vme_end;
+		entry = entry->vme_next;
+	}
+	vm_map_unlock(map);
+	return TRUE;
+}
 
-		if(entry->needs_copy) {
-			if (!mapped_needs_copy) {
-				if (vm_map_lock_read_to_write(map)) {
-					vm_map_lock_read(map);
-					if(*pmap_map == entry->object.sub_map)
-						*pmap_map = map;
-					goto RetryLookup;
-				}
-				vm_map_lock_read(entry->object.sub_map);
-				cow_sub_map_parent = map;
-				/* reset base to map before cow object */
-				/* this is the map which will accept   */
-				/* the new cow object */
-				old_start = entry->vme_start;
-				old_end = entry->vme_end;
-				cow_parent_vaddr = vaddr;
-				mapped_needs_copy = TRUE;
-			} else {
-				vm_map_lock_read(entry->object.sub_map);
-				if((cow_sub_map_parent != map) &&
-							(*pmap_map != map))
-					vm_map_unlock(map);
-			}
-		} else {
-			vm_map_lock_read(entry->object.sub_map);
-			/* leave map locked if it is a target */
-			/* cow sub_map above otherwise, just  */
-			/* follow the maps down to the object */
-			/* here we unlock knowing we are not  */
-			/* revisiting the map.  */
-			if((*pmap_map != map) && (map != cow_sub_map_parent))
-				vm_map_unlock_read(map);
-		}
+kern_return_t
+vm_map_purgable_control(
+	vm_map_t                map,
+	vm_map_offset_t         address,
+	vm_purgable_t           control,
+	int                     *state) /* read for the SET_STATE controls; passed on to vm_object_purgable_control() */
+{
+	vm_map_entry_t          entry;
+	vm_object_t             object;
+	kern_return_t           kr;
+	boolean_t               was_nonvolatile;
 
-		*var_map = map = entry->object.sub_map;
+	/*
+	 * Vet all the input parameters and current type and state of the
+	 * underlying object.  Return with an error if anything is amiss.
+	 */
+	if (map == VM_MAP_NULL) {
+		return KERN_INVALID_ARGUMENT;
+	}
 
-		/* calculate the offset in the submap for vaddr */
-		local_vaddr = (local_vaddr - entry->vme_start) + entry->offset;
+	if (control != VM_PURGABLE_SET_STATE &&
+	    control != VM_PURGABLE_GET_STATE &&
+	    control != VM_PURGABLE_PURGE_ALL &&
+	    control != VM_PURGABLE_SET_STATE_FROM_KERNEL) {
+		return KERN_INVALID_ARGUMENT;
+	}
 
-RetrySubMap:
-		if(!vm_map_lookup_entry(map, local_vaddr, &submap_entry)) {
-			if((cow_sub_map_parent) && (cow_sub_map_parent != map)){
-				vm_map_unlock(cow_sub_map_parent);
-			}
-			if((*pmap_map != map) 
-					&& (*pmap_map != cow_sub_map_parent)) {
-				vm_map_unlock(*pmap_map);
-			}
-			*pmap_map = map;
-			return KERN_INVALID_ADDRESS;
-		}
-		/* find the attenuated shadow of the underlying object */
-		/* on our target map */
+	if (control == VM_PURGABLE_PURGE_ALL) { /* acts globally: "address" and "state" are never examined */
+		vm_purgeable_object_purge_all();
+		return KERN_SUCCESS;
+	}
 
-		/* in english the submap object may extend beyond the     */
-		/* region mapped by the entry or, may only fill a portion */
-		/* of it.  For our purposes, we only care if the object   */
-		/* doesn't fill.  In this case the area which will        */
-		/* ultimately be clipped in the top map will only need    */
-		/* to be as big as the portion of the underlying entry    */
-		/* which is mapped */
-		start_delta = submap_entry->vme_start > entry->offset ?
-	  	            submap_entry->vme_start - entry->offset : 0;
+	if ((control == VM_PURGABLE_SET_STATE ||
+	    control == VM_PURGABLE_SET_STATE_FROM_KERNEL) &&
+	    (((*state & ~(VM_PURGABLE_ALL_MASKS)) != 0) || /* reject bits outside the known masks */
+	    ((*state & VM_PURGABLE_STATE_MASK) > VM_PURGABLE_STATE_MASK))) { /* NOTE(review): a value masked with STATE_MASK cannot exceed it, so this test looks always false - confirm intent */
+		return KERN_INVALID_ARGUMENT;
+	}
 
-		end_delta = 
-		   (entry->offset + start_delta + (old_end - old_start)) <=
-			submap_entry->vme_end ?
-				0 : (entry->offset + 
-					(old_end - old_start))
-					- submap_entry->vme_end; 
+	vm_map_lock_read(map); /* read lock covers the entry lookup and checks below */
 
-		old_start += start_delta;
-		old_end -= end_delta;
+	if (!vm_map_lookup_entry(map, address, &entry) || entry->is_sub_map) {
+		/*
+		 * Must pass a valid non-submap address.
+		 */
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ADDRESS;
+	}
 
-		if(submap_entry->is_sub_map) {
-			entry = submap_entry;
-			vaddr = local_vaddr;
-			goto submap_recurse;
-		}
+	if ((entry->protection & VM_PROT_WRITE) == 0) {
+		/*
+		 * Can't apply purgable controls to something you can't write.
+		 */
+		vm_map_unlock_read(map);
+		return KERN_PROTECTION_FAILURE;
+	}
 
-		if(((fault_type & VM_PROT_WRITE) && cow_sub_map_parent)) {
+	object = VME_OBJECT(entry);
+	if (object == VM_OBJECT_NULL ||
+	    object->purgable == VM_PURGABLE_DENY) {
+		/*
+		 * Object must already be present and be purgeable.
+		 */
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ARGUMENT;
+	}
 
-			vm_object_t	copy_object;
-			vm_offset_t	local_start;
-			vm_offset_t	local_end;
-			boolean_t		copied_slowly = FALSE;
+	vm_object_lock(object); /* taken while the map read lock is still held; the map lock is dropped below */
 
-			if (vm_map_lock_read_to_write(map)) {
-				vm_map_lock_read(map);
-				old_start -= start_delta;
-				old_end += end_delta;
-				goto RetrySubMap;
-			}
+#if 00 /* compiled out: whole-object restriction is not enforced */
+	if (VME_OFFSET(entry) != 0 ||
+	    entry->vme_end - entry->vme_start != object->vo_size) {
+		/*
+		 * Can only apply purgable controls to the whole (existing)
+		 * object at once.
+		 */
+		vm_map_unlock_read(map);
+		vm_object_unlock(object);
+		return KERN_INVALID_ARGUMENT;
+	}
+#endif
 
+	assert(!entry->is_sub_map);
+	assert(!entry->use_pmap); /* purgeable has its own accounting */
 
-			if (submap_entry->object.vm_object == VM_OBJECT_NULL) {
-				submap_entry->object.vm_object = 
-					vm_object_allocate(
-						(vm_size_t)
-						(submap_entry->vme_end 
-						- submap_entry->vme_start));
-					submap_entry->offset = 0;
-			}
-			local_start =  local_vaddr - 
-					(cow_parent_vaddr - old_start);
-			local_end = local_vaddr + 
-					(old_end - cow_parent_vaddr);
-			vm_map_clip_start(map, submap_entry, local_start);
-			vm_map_clip_end(map, submap_entry, local_end);
+	vm_map_unlock_read(map); /* "entry" is not used past this point; only the locked object is */
 
-			/* This is the COW case, lets connect */
-			/* an entry in our space to the underlying */
-			/* object in the submap, bypassing the  */
-			/* submap. */
+	was_nonvolatile = (object->purgable == VM_PURGABLE_NONVOLATILE); /* snapshot before the control call, compared after it */
 
+	kr = vm_object_purgable_control(object, control, state);
 
-			if(submap_entry->wired_count != 0) {
-					vm_object_lock(
-					     submap_entry->object.vm_object);
-					vm_object_copy_slowly(
-						submap_entry->object.vm_object,
-						submap_entry->offset,
-						submap_entry->vme_end -
-							submap_entry->vme_start,
-						FALSE,
-						&copy_object);
-					copied_slowly = TRUE;
-			} else {
-				
-				/* set up shadow object */
-				copy_object = submap_entry->object.vm_object;
-				vm_object_reference(copy_object);
-				submap_entry->object.vm_object->shadowed = TRUE;
-				submap_entry->needs_copy = TRUE;
-				vm_object_pmap_protect(
-					submap_entry->object.vm_object,
-					submap_entry->offset,
-					submap_entry->vme_end - 
-						submap_entry->vme_start,
-					submap_entry->is_shared ?
-						PMAP_NULL : map->pmap,
-					submap_entry->vme_start,
-					submap_entry->protection &
-						~VM_PROT_WRITE);
-			}
-			
+	if (was_nonvolatile &&
+	    object->purgable != VM_PURGABLE_NONVOLATILE &&
+	    map->pmap == kernel_pmap) { /* body is empty unless DEBUG is set */
+#if DEBUG
+		object->vo_purgeable_volatilizer = kernel_task;
+#endif /* DEBUG */
+	}
 
-			/* This works diffently than the   */
-			/* normal submap case. We go back  */
-			/* to the parent of the cow map and*/
-			/* clip out the target portion of  */
-			/* the sub_map, substituting the   */
-			/* new copy object,                */
+	vm_object_unlock(object);
 
-			vm_map_unlock(map);
-			local_start = old_start;
-			local_end = old_end;
-			map = cow_sub_map_parent;
-			*var_map = cow_sub_map_parent;
-			vaddr = cow_parent_vaddr;
-			cow_sub_map_parent = NULL;
+	return kr; /* result of vm_object_purgable_control() */
+}
 
-			if(!vm_map_lookup_entry(map, 
-					vaddr, &entry)) {
-				        vm_object_deallocate(
-							copy_object);
-					vm_map_lock_write_to_read(map);
-					return KERN_INVALID_ADDRESS;
-			}
-					
-			/* clip out the portion of space */
-			/* mapped by the sub map which   */
-			/* corresponds to the underlying */
-			/* object */
-			vm_map_clip_start(map, entry, local_start);
-			vm_map_clip_end(map, entry, local_end);
+kern_return_t
+vm_map_page_query_internal(
+	vm_map_t        target_map,
+	vm_map_offset_t offset,
+	int             *disposition, /* OUT */
+	int             *ref_count) /* OUT */
+{
+	kern_return_t                   kr;
+	vm_page_info_basic_data_t       info;
+	mach_msg_type_number_t          count;
+
+	count = VM_PAGE_INFO_BASIC_COUNT; /* the BASIC flavor accepts only this count (or one less) */
+	kr = vm_map_page_info(target_map, /* BASIC-flavor query for the page at "offset" */
+	    offset,
+	    VM_PAGE_INFO_BASIC,
+	    (vm_page_info_t) &info,
+	    &count);
+	if (kr == KERN_SUCCESS) {
+		*disposition = info.disposition;
+		*ref_count = info.ref_count;
+	} else { /* on failure both outputs are zeroed rather than left unset */
+		*disposition = 0;
+		*ref_count = 0;
+	}
 
+	return kr;
+}
 
-			/* substitute copy object for */
-			/* shared map entry           */
-			vm_map_deallocate(entry->object.sub_map);
-			entry->is_sub_map = FALSE;
-			entry->object.vm_object = copy_object;
+kern_return_t
+vm_map_page_info(
+	vm_map_t                map,
+	vm_map_offset_t         offset,
+	vm_page_info_flavor_t   flavor,
+	vm_page_info_t          info,
+	mach_msg_type_number_t  *count)
+{
+	return vm_map_page_range_info_internal(map, /* single-page case of the range query */
+	           offset,                     /* start of range; the callee truncates it to a page boundary */
+	           (offset + 1),                     /* end of range; the callee rounds it up to a page boundary */
+	           flavor,
+	           info,
+	           count);
+}
 
-			entry->protection |= VM_PROT_WRITE;
-			entry->max_protection |= VM_PROT_WRITE;
-			if(copied_slowly) {
-				entry->offset = 0;
-				entry->needs_copy = FALSE;
-				entry->is_shared = FALSE;
-			} else {
-				entry->offset = submap_entry->offset;
-				entry->needs_copy = TRUE;
-				if(entry->inheritance == VM_INHERIT_SHARE) 
-					entry->inheritance = VM_INHERIT_COPY;
-				if (map != old_map)
-					entry->is_shared = TRUE;
-			}
-			if(entry->inheritance == VM_INHERIT_SHARE) 
-				entry->inheritance = VM_INHERIT_COPY;
+kern_return_t
+vm_map_page_range_info_internal(
+	vm_map_t                map,
+	vm_map_offset_t         start_offset,
+	vm_map_offset_t         end_offset,
+	vm_page_info_flavor_t   flavor,
+	vm_page_info_t          info,
+	mach_msg_type_number_t  *count)
+{
+	vm_map_entry_t          map_entry = VM_MAP_ENTRY_NULL;
+	vm_object_t             object = VM_OBJECT_NULL, curr_object = VM_OBJECT_NULL;
+	vm_page_t               m = VM_PAGE_NULL;
+	kern_return_t           retval = KERN_SUCCESS;
+	int                     disposition = 0;
+	int                     ref_count = 0;
+	int                     depth = 0, info_idx = 0;
+	vm_page_info_basic_t    basic_info = 0;
+	vm_map_offset_t         offset_in_page = 0, offset_in_object = 0, curr_offset_in_object = 0;
+	vm_map_offset_t         start = 0, end = 0, curr_s_offset = 0, curr_e_offset = 0;
+	boolean_t               do_region_footprint;
+	ledger_amount_t         ledger_resident, ledger_compressed;
 
-			vm_map_lock_write_to_read(map);
-		} else {
-			if((cow_sub_map_parent)
-					&& (cow_sub_map_parent != *pmap_map)
-					&& (cow_sub_map_parent != map)) {
-				vm_map_unlock(cow_sub_map_parent);
+	switch (flavor) {
+	case VM_PAGE_INFO_BASIC:
+		if (*count != VM_PAGE_INFO_BASIC_COUNT) {
+			/*
+			 * The "vm_page_info_basic_data" structure was not
+			 * properly padded, so allow the size to be off by
+			 * one to maintain backwards binary compatibility...
+			 */
+			if (*count != VM_PAGE_INFO_BASIC_COUNT - 1) {
+				return KERN_INVALID_ARGUMENT;
 			}
-			entry = submap_entry;
-			vaddr = local_vaddr;
 		}
+		break;
+	default:
+		return KERN_INVALID_ARGUMENT;
 	}
-		
-	/*
-	 *	Check whether this task is allowed to have
-	 *	this page.
-	 */
 
-	prot = entry->protection;
-	if ((fault_type & (prot)) != fault_type) {
-	  if (*pmap_map != map) {
-		vm_map_unlock(*pmap_map);
-	  }
-	  *pmap_map = map;
-	  return KERN_PROTECTION_FAILURE;
+	do_region_footprint = task_self_region_footprint();
+	disposition = 0;
+	ref_count = 0;
+	depth = 0;
+	info_idx = 0; /* Tracks the next index within the info structure to be filled.*/
+	retval = KERN_SUCCESS;
+
+	offset_in_page = start_offset & PAGE_MASK;
+	start = vm_map_trunc_page(start_offset, PAGE_MASK);
+	end = vm_map_round_page(end_offset, PAGE_MASK);
+
+	if (end < start) {
+		return KERN_INVALID_ARGUMENT;
 	}
 
-	/*
-	 *	If this page is not pageable, we have to get
-	 *	it for all possible accesses.
-	 */
+	assert((end - start) <= MAX_PAGE_RANGE_QUERY);
 
-	if (*wired = (entry->wired_count != 0))
-		prot = fault_type = entry->protection;
+	vm_map_lock_read(map);
 
-	/*
-	 *	If the entry was copy-on-write, we either ...
-	 */
+	task_ledgers_footprint(map->pmap->ledger, &ledger_resident, &ledger_compressed);
 
-	if (entry->needs_copy) {
-	    	/*
-		 *	If we want to write the page, we may as well
-		 *	handle that now since we've got the map locked.
-		 *
-		 *	If we don't need to write the page, we just
-		 *	demote the permissions allowed.
+	for (curr_s_offset = start; curr_s_offset < end;) {
+		/*
+		 * New lookup needs reset of these variables.
 		 */
+		curr_object = object = VM_OBJECT_NULL;
+		offset_in_object = 0;
+		ref_count = 0;
+		depth = 0;
 
-		if (fault_type & VM_PROT_WRITE || *wired) {
+		if (do_region_footprint &&
+		    curr_s_offset >= vm_map_last_entry(map)->vme_end) {
 			/*
-			 *	Make a new object, and place it in the
-			 *	object chain.  Note that no new references
-			 *	have appeared -- one just moved from the
-			 *	map to the new object.
+			 * Request for "footprint" info about a page beyond
+			 * the end of address space: this must be for
+			 * the fake region vm_map_region_recurse_64()
+			 * reported to account for non-volatile purgeable
+			 * memory owned by this task.
 			 */
+			disposition = 0;
 
-			if (vm_map_lock_read_to_write(map)) {
-				vm_map_lock_read(map);
-				goto RetryLookup;
+			if (curr_s_offset - vm_map_last_entry(map)->vme_end <=
+			    (unsigned) ledger_compressed) {
+				/*
+				 * We haven't reported all the "non-volatile
+				 * compressed" pages yet, so report this fake
+				 * page as "compressed".
+				 */
+				disposition |= VM_PAGE_QUERY_PAGE_PAGED_OUT;
+			} else {
+				/*
+				 * We've reported all the non-volatile
+				 * compressed page but not all the non-volatile
+				 * pages , so report this fake page as
+				 * "resident dirty".
+				 */
+				disposition |= VM_PAGE_QUERY_PAGE_PRESENT;
+				disposition |= VM_PAGE_QUERY_PAGE_DIRTY;
+				disposition |= VM_PAGE_QUERY_PAGE_REF;
 			}
-			vm_object_shadow(&entry->object.vm_object,
-					 &entry->offset,
-					 (vm_size_t) (entry->vme_end -
-						      entry->vme_start));
-
-			entry->object.vm_object->shadowed = TRUE;
-			entry->needs_copy = FALSE;
-			vm_map_lock_write_to_read(map);
-		}
-		else {
-			/*
-			 *	We're attempting to read a copy-on-write
-			 *	page -- don't allow writes.
-			 */
-
-			prot &= (~VM_PROT_WRITE);
+			switch (flavor) {
+			case VM_PAGE_INFO_BASIC:
+				basic_info = (vm_page_info_basic_t) (((uintptr_t) info) + (info_idx * sizeof(struct vm_page_info_basic)));
+				basic_info->disposition = disposition;
+				basic_info->ref_count = 1;
+				basic_info->object_id = INFO_MAKE_FAKE_OBJECT_ID(map, task_ledgers.purgeable_nonvolatile);
+				basic_info->offset = 0;
+				basic_info->depth = 0;
+
+				info_idx++;
+				break;
+			}
+			curr_s_offset += PAGE_SIZE;
+			continue;
 		}
-	}
 
-	/*
-	 *	Create an object if necessary.
-	 */
-	if (entry->object.vm_object == VM_OBJECT_NULL) {
+		/*
+		 * First, find the map entry covering "curr_s_offset", going down
+		 * submaps if necessary.
+		 */
+		if (!vm_map_lookup_entry(map, curr_s_offset, &map_entry)) {
+			/* no entry -> no object -> no page */
 
-		if (vm_map_lock_read_to_write(map)) {
-			vm_map_lock_read(map);
-			goto RetryLookup;
-		}
+			if (curr_s_offset < vm_map_min(map)) {
+				/*
+				 * Illegal address that falls below map min.
+				 */
+				curr_e_offset = MIN(end, vm_map_min(map));
+			} else if (curr_s_offset >= vm_map_max(map)) {
+				/*
+				 * Illegal address that falls on/after map max.
+				 */
+				curr_e_offset = end;
+			} else if (map_entry == vm_map_to_entry(map)) {
+				/*
+				 * Hit a hole.
+				 */
+				if (map_entry->vme_next == vm_map_to_entry(map)) {
+					/*
+					 * Empty map.
+					 */
+					curr_e_offset = MIN(map->max_offset, end);
+				} else {
+					/*
+					 * Hole at start of the map.
+					 */
+					curr_e_offset = MIN(map_entry->vme_next->vme_start, end);
+				}
+			} else {
+				if (map_entry->vme_next == vm_map_to_entry(map)) {
+					/*
+					 * Hole at the end of the map.
+					 */
+					curr_e_offset = MIN(map->max_offset, end);
+				} else {
+					curr_e_offset = MIN(map_entry->vme_next->vme_start, end);
+				}
+			}
 
-		entry->object.vm_object = vm_object_allocate(
-			(vm_size_t)(entry->vme_end - entry->vme_start));
-		entry->offset = 0;
-		vm_map_lock_write_to_read(map);
-	}
+			assert(curr_e_offset >= curr_s_offset);
 
-	/*
-	 *	Return the object/offset from this entry.  If the entry
-	 *	was copy-on-write or empty, it has been fixed up.  Also
-	 *	return the protection.
-	 */
+			uint64_t num_pages = (curr_e_offset - curr_s_offset) >> PAGE_SHIFT;
 
-        *offset = (vaddr - entry->vme_start) + entry->offset;
-        *object = entry->object.vm_object;
-	*out_prot = prot;
-	*behavior = entry->behavior;
-	*lo_offset = entry->offset;
-	*hi_offset = (entry->vme_end - entry->vme_start) + entry->offset;
+			void *info_ptr = (void*) (((uintptr_t) info) + (info_idx * sizeof(struct vm_page_info_basic)));
 
-	/*
-	 *	Lock the object to prevent it from disappearing
-	 */
+			bzero(info_ptr, num_pages * sizeof(struct vm_page_info_basic));
 
-	vm_object_lock(*object);
+			curr_s_offset = curr_e_offset;
 
-	/*
-	 *	Save the version number
-	 */
+			info_idx += num_pages;
 
-	out_version->main_timestamp = map->timestamp;
+			continue;
+		}
 
-	return KERN_SUCCESS;
-}
+		/* compute offset from this map entry's start */
+		offset_in_object = curr_s_offset - map_entry->vme_start;
 
+		/* compute offset into this map entry's object (or submap) */
+		offset_in_object += VME_OFFSET(map_entry);
 
-/*
- *	vm_map_verify:
- *
- *	Verifies that the map in question has not changed
- *	since the given version.  If successful, the map
- *	will not change until vm_map_verify_done() is called.
- */
-boolean_t
-vm_map_verify(
-	register vm_map_t		map,
-	register vm_map_version_t	*version)	/* REF */
-{
-	boolean_t	result;
+		if (map_entry->is_sub_map) {
+			vm_map_t sub_map = VM_MAP_NULL;
+			vm_page_info_t submap_info = 0;
+			vm_map_offset_t submap_s_offset = 0, submap_e_offset = 0, range_len = 0;
 
-	vm_map_lock_read(map);
-	result = (map->timestamp == version->main_timestamp);
+			range_len = MIN(map_entry->vme_end, end) - curr_s_offset;
 
-	if (!result)
-		vm_map_unlock_read(map);
+			submap_s_offset = offset_in_object;
+			submap_e_offset = submap_s_offset + range_len;
 
-	return(result);
-}
+			sub_map = VME_SUBMAP(map_entry);
 
-/*
- *	vm_map_verify_done:
- *
- *	Releases locks acquired by a vm_map_verify.
- *
- *	This is now a macro in vm/vm_map.h.  It does a
- *	vm_map_unlock_read on the map.
- */
+			vm_map_reference(sub_map);
+			vm_map_unlock_read(map);
 
+			submap_info = (vm_page_info_t) (((uintptr_t) info) + (info_idx * sizeof(struct vm_page_info_basic)));
 
-/*
- *	vm_region:
- *
- *	User call to obtain information about a region in
- *	a task's address map. Currently, only one flavor is
- *	supported.
- *
- *	XXX The reserved and behavior fields cannot be filled
- *	    in until the vm merge from the IK is completed, and
- *	    vm_reserve is implemented.
- *
- *	XXX Dependency: syscall_vm_region() also supports only one flavor.
- */
+			retval = vm_map_page_range_info_internal(sub_map,
+			    submap_s_offset,
+			    submap_e_offset,
+			    VM_PAGE_INFO_BASIC,
+			    (vm_page_info_t) submap_info,
+			    count);
 
-kern_return_t
-vm_region(
-	vm_map_t		 map,
-	vm_offset_t	        *address,		/* IN/OUT */
-	vm_size_t		*size,			/* OUT */
-	vm_region_flavor_t	 flavor,		/* IN */
-	vm_region_info_t	 info,			/* OUT */
-	mach_msg_type_number_t	*count,			/* IN/OUT */
-	ipc_port_t		*object_name)		/* OUT */
-{
-	vm_map_entry_t		tmp_entry;
-	register
-	vm_map_entry_t		entry;
-	register
-	vm_offset_t		start;
-	vm_region_basic_info_t	basic;
-	vm_region_extended_info_t	extended;
-	vm_region_top_info_t	top;
-
-	if (map == VM_MAP_NULL) 
-		return(KERN_INVALID_ARGUMENT);
+			assert(retval == KERN_SUCCESS);
 
-	switch (flavor) {
-	
-	case VM_REGION_BASIC_INFO:
-	{
-	    if (*count < VM_REGION_BASIC_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+			vm_map_lock_read(map);
+			vm_map_deallocate(sub_map);
 
-	    basic = (vm_region_basic_info_t) info;
-	    *count = VM_REGION_BASIC_INFO_COUNT;
+			/* Move the "info" index by the number of pages we inspected.*/
+			info_idx += range_len >> PAGE_SHIFT;
 
-	    vm_map_lock_read(map);
+			/* Move our current offset by the size of the range we inspected.*/
+			curr_s_offset += range_len;
 
-	    start = *address;
-	    if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-		   	return(KERN_INVALID_ADDRESS);
+			continue;
 		}
-	    } else {
-		entry = tmp_entry;
-	    }
-
-	    start = entry->vme_start;
-
-	    basic->offset = entry->offset;
-	    basic->protection = entry->protection;
-	    basic->inheritance = entry->inheritance;
-	    basic->max_protection = entry->max_protection;
-	    basic->behavior = entry->behavior;
-	    basic->user_wired_count = entry->user_wired_count;
-	    basic->reserved = entry->is_sub_map;
-	    *address = start;
-	    *size = (entry->vme_end - start);
-
-	    if (object_name) *object_name = IP_NULL;
-	    if (entry->is_sub_map) {
-	        basic->shared = FALSE;
-	    } else {
-	        basic->shared = entry->is_shared;
-	    }
-
-	    vm_map_unlock_read(map);
-	    return(KERN_SUCCESS);
-	}
-	case VM_REGION_EXTENDED_INFO:
-	{
 
-	    if (*count < VM_REGION_EXTENDED_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+		object = VME_OBJECT(map_entry);
+		if (object == VM_OBJECT_NULL) {
+			/*
+			 * We don't have an object here and, hence,
+			 * no pages to inspect. We'll fill up the
+			 * info structure appropriately.
+			 */
 
-	    extended = (vm_region_extended_info_t) info;
-	    *count = VM_REGION_EXTENDED_INFO_COUNT;
+			curr_e_offset = MIN(map_entry->vme_end, end);
 
-	    vm_map_lock_read(map);
+			uint64_t num_pages = (curr_e_offset - curr_s_offset) >> PAGE_SHIFT;
 
-	    start = *address;
-	    if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-		   	return(KERN_INVALID_ADDRESS);
+			void *info_ptr = (void*) (((uintptr_t) info) + (info_idx * sizeof(struct vm_page_info_basic)));
+
+			bzero(info_ptr, num_pages * sizeof(struct vm_page_info_basic));
+
+			curr_s_offset = curr_e_offset;
+
+			info_idx += num_pages;
+
+			continue;
+		}
+
+		if (do_region_footprint) {
+			int pmap_disp;
+
+			disposition = 0;
+			pmap_disp = 0;
+			if (map->has_corpse_footprint) {
+				/*
+				 * Query the page info data we saved
+				 * while forking the corpse.
+				 */
+				vm_map_corpse_footprint_query_page_info(
+					map,
+					curr_s_offset,
+					&pmap_disp);
+			} else {
+				/*
+				 * Query the pmap.
+				 */
+				pmap_query_page_info(map->pmap,
+				    curr_s_offset,
+				    &pmap_disp);
+			}
+			if (object->purgable == VM_PURGABLE_NONVOLATILE &&
+			    /* && not tagged as no-footprint? */
+			    VM_OBJECT_OWNER(object) != NULL &&
+			    VM_OBJECT_OWNER(object)->map == map) {
+				if ((((curr_s_offset
+				    - map_entry->vme_start
+				    + VME_OFFSET(map_entry))
+				    / PAGE_SIZE) <
+				    (object->resident_page_count +
+				    vm_compressor_pager_get_count(object->pager)))) {
+					/*
+					 * Non-volatile purgeable object owned
+					 * by this task: report the first
+					 * "#resident + #compressed" pages as
+					 * "resident" (to show that they
+					 * contribute to the footprint) but not
+					 * "dirty" (to avoid double-counting
+					 * with the fake "non-volatile" region
+					 * we'll report at the end of the
+					 * address space to account for all
+					 * (mapped or not) non-volatile memory
+					 * owned by this task.
+					 */
+					disposition |= VM_PAGE_QUERY_PAGE_PRESENT;
+				}
+			} else if ((object->purgable == VM_PURGABLE_VOLATILE ||
+			    object->purgable == VM_PURGABLE_EMPTY) &&
+			    /* && not tagged as no-footprint? */
+			    VM_OBJECT_OWNER(object) != NULL &&
+			    VM_OBJECT_OWNER(object)->map == map) {
+				if ((((curr_s_offset
+				    - map_entry->vme_start
+				    + VME_OFFSET(map_entry))
+				    / PAGE_SIZE) <
+				    object->wired_page_count)) {
+					/*
+					 * Volatile|empty purgeable object owned
+					 * by this task: report the first
+					 * "#wired" pages as "resident" (to
+					 * show that they contribute to the
+					 * footprint) but not "dirty" (to avoid
+					 * double-counting with the fake
+					 * "non-volatile" region we'll report
+					 * at the end of the address space to
+					 * account for all (mapped or not)
+					 * non-volatile memory owned by this
+					 * task.
+					 */
+					disposition |= VM_PAGE_QUERY_PAGE_PRESENT;
+				}
+			} else if (map_entry->iokit_acct &&
+			    object->internal &&
+			    object->purgable == VM_PURGABLE_DENY) {
+				/*
+				 * Non-purgeable IOKit memory: phys_footprint
+				 * includes the entire virtual mapping.
+				 */
+				assertf(!map_entry->use_pmap, "offset 0x%llx map_entry %p", (uint64_t) curr_s_offset, map_entry);
+				disposition |= VM_PAGE_QUERY_PAGE_PRESENT;
+				disposition |= VM_PAGE_QUERY_PAGE_DIRTY;
+			} else if (pmap_disp & (PMAP_QUERY_PAGE_ALTACCT |
+			    PMAP_QUERY_PAGE_COMPRESSED_ALTACCT)) {
+				/* alternate accounting */
+#if CONFIG_EMBEDDED && (DEVELOPMENT || DEBUG)
+				if (map->pmap->footprint_was_suspended ||
+				    /*
+				     * XXX corpse does not know if original
+				     * pmap had its footprint suspended...
+				     */
+				    map->has_corpse_footprint) {
+					/*
+					 * The assertion below can fail if dyld
+					 * suspended footprint accounting
+					 * while doing some adjustments to
+					 * this page;  the mapping would say
+					 * "use pmap accounting" but the page
+					 * would be marked "alternate
+					 * accounting".
+					 */
+				} else
+#endif /* CONFIG_EMBEDDED && (DEVELOPMENT || DEBUG) */
+				assertf(!map_entry->use_pmap, "offset 0x%llx map_entry %p", (uint64_t) curr_s_offset, map_entry);
+				pmap_disp = 0;
+			} else {
+				if (pmap_disp & PMAP_QUERY_PAGE_PRESENT) {
+					assertf(map_entry->use_pmap, "offset 0x%llx map_entry %p", (uint64_t) curr_s_offset, map_entry);
+					disposition |= VM_PAGE_QUERY_PAGE_PRESENT;
+					disposition |= VM_PAGE_QUERY_PAGE_REF;
+					if (pmap_disp & PMAP_QUERY_PAGE_INTERNAL) {
+						disposition |= VM_PAGE_QUERY_PAGE_DIRTY;
+					} else {
+						disposition |= VM_PAGE_QUERY_PAGE_EXTERNAL;
+					}
+					if (pmap_disp & PMAP_QUERY_PAGE_REUSABLE) {
+						disposition |= VM_PAGE_QUERY_PAGE_REUSABLE;
+					}
+				} else if (pmap_disp & PMAP_QUERY_PAGE_COMPRESSED) {
+					assertf(map_entry->use_pmap, "offset 0x%llx map_entry %p", (uint64_t) curr_s_offset, map_entry);
+					disposition |= VM_PAGE_QUERY_PAGE_PAGED_OUT;
+				}
+			}
+			switch (flavor) {
+			case VM_PAGE_INFO_BASIC:
+				basic_info = (vm_page_info_basic_t) (((uintptr_t) info) + (info_idx * sizeof(struct vm_page_info_basic)));
+				basic_info->disposition = disposition;
+				basic_info->ref_count = 1;
+				basic_info->object_id = INFO_MAKE_FAKE_OBJECT_ID(map, task_ledgers.purgeable_nonvolatile);
+				basic_info->offset = 0;
+				basic_info->depth = 0;
+
+				info_idx++;
+				break;
+			}
+			curr_s_offset += PAGE_SIZE;
+			continue;
 		}
-	    } else {
-		entry = tmp_entry;
-	    }
-	    start = entry->vme_start;
-
-	    extended->protection = entry->protection;
-	    extended->user_tag = entry->alias;
-	    extended->pages_resident = 0;
-	    extended->pages_swapped_out = 0;
-	    extended->pages_shared_now_private = 0;
-	    extended->pages_dirtied = 0;
-	    extended->external_pager = 0;
-	    extended->shadow_depth = 0;
-
-	    vm_region_walk(entry, extended, entry->offset, entry->vme_end - start, map, start);
 
-	    if (extended->external_pager && extended->ref_count == 2 && extended->share_mode == SM_SHARED)
-	            extended->share_mode = SM_PRIVATE;
+		vm_object_reference(object);
+		/*
+		 * Shared mode -- so we can allow other readers
+		 * to grab the lock too.
+		 */
+		vm_object_lock_shared(object);
 
-	    if (object_name)
-	        *object_name = IP_NULL;
-	    *address = start;
-	    *size = (entry->vme_end - start);
+		curr_e_offset = MIN(map_entry->vme_end, end);
 
-	    vm_map_unlock_read(map);
-	    return(KERN_SUCCESS);
-	}
-	case VM_REGION_TOP_INFO:
-	{   
+		vm_map_unlock_read(map);
 
-	    if (*count < VM_REGION_TOP_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+		map_entry = NULL; /* map is unlocked, the entry is no longer valid. */
 
-	    top = (vm_region_top_info_t) info;
-	    *count = VM_REGION_TOP_INFO_COUNT;
+		curr_object = object;
 
-	    vm_map_lock_read(map);
+		for (; curr_s_offset < curr_e_offset;) {
+			if (object == curr_object) {
+				ref_count = curr_object->ref_count - 1; /* account for our object reference above. */
+			} else {
+				ref_count = curr_object->ref_count;
+			}
 
-	    start = *address;
-	    if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-		   	return(KERN_INVALID_ADDRESS);
-		}
-	    } else {
-		entry = tmp_entry;
+			curr_offset_in_object = offset_in_object;
 
-	    }
-	    start = entry->vme_start;
+			for (;;) {
+				m = vm_page_lookup(curr_object, curr_offset_in_object);
 
-	    top->private_pages_resident = 0;
-	    top->shared_pages_resident = 0;
+				if (m != VM_PAGE_NULL) {
+					disposition |= VM_PAGE_QUERY_PAGE_PRESENT;
+					break;
+				} else {
+					if (curr_object->internal &&
+					    curr_object->alive &&
+					    !curr_object->terminating &&
+					    curr_object->pager_ready) {
+						if (VM_COMPRESSOR_PAGER_STATE_GET(curr_object, curr_offset_in_object)
+						    == VM_EXTERNAL_STATE_EXISTS) {
+							/* the pager has that page */
+							disposition |= VM_PAGE_QUERY_PAGE_PAGED_OUT;
+							break;
+						}
+					}
 
-	    vm_region_top_walk(entry, top);
+					/*
+					 * Go down the VM object shadow chain until we find the page
+					 * we're looking for.
+					 */
 
-	    if (object_name)
-	        *object_name = IP_NULL;
-	    *address = start;
-	    *size = (entry->vme_end - start);
+					if (curr_object->shadow != VM_OBJECT_NULL) {
+						vm_object_t shadow = VM_OBJECT_NULL;
 
-	    vm_map_unlock_read(map);
-	    return(KERN_SUCCESS);
-	}
-	default:
-	    return(KERN_INVALID_ARGUMENT);
-	}
-}
+						curr_offset_in_object += curr_object->vo_shadow_offset;
+						shadow = curr_object->shadow;
 
-/*
- *	vm_region_recurse: A form of vm_region which follows the
- *	submaps in a target map
- *
- */
+						vm_object_lock_shared(shadow);
+						vm_object_unlock(curr_object);
 
-kern_return_t
-vm_region_recurse(
-	vm_map_t		 map,
-	vm_offset_t	        *address,		/* IN/OUT */
-	vm_size_t		*size,			/* OUT */
-	natural_t	 	*nesting_depth,		/* IN/OUT */
-	vm_region_recurse_info_t info,			/* IN/OUT */
-	mach_msg_type_number_t	*count)			/* IN/OUT */
-{
-	vm_map_entry_t		tmp_entry;
-	register
-	vm_map_entry_t		entry;
-	register
-	vm_offset_t		start;
-
-	unsigned int			recurse_count;
-	vm_map_t			submap;
-	vm_map_t			base_map;
-	vm_map_entry_t			base_entry;
-	vm_offset_t			base_next;
-	vm_offset_t			base_addr;
-	vm_offset_t			baddr_start_delta;
-	vm_region_submap_info_t		submap_info;
-	vm_region_extended_info_data_t	extended;
-
-	if (map == VM_MAP_NULL) 
-		return(KERN_INVALID_ARGUMENT);
-
-	submap_info = (vm_region_submap_info_t) info;
-	*count = VM_REGION_SUBMAP_INFO_COUNT;
-
-	if (*count < VM_REGION_SUBMAP_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+						curr_object = shadow;
+						depth++;
+						continue;
+					} else {
+						break;
+					}
+				}
+			}
 
-	start = *address;
-	base_map = map;
-	recurse_count = *nesting_depth;
+			/* The ref_count is not strictly accurate, it measures the number   */
+			/* of entities holding a ref on the object, they may not be mapping */
+			/* the object or may not be mapping the section holding the         */
+			/* target page but it's still a ballpark number and though an over- */
+			/* count, it picks up the copy-on-write cases                       */
 
-LOOKUP_NEXT_BASE_ENTRY:
-	vm_map_lock_read(map);
-        if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-			return(KERN_INVALID_ADDRESS);
-		}
-	} else {
-		entry = tmp_entry;
-	}
-	*size = entry->vme_end - entry->vme_start;
-	start = entry->vme_start;
-	base_addr = start;
-	baddr_start_delta = *address - start;
-	base_next = entry->vme_end;
-	base_entry = entry;
+			/* We could also get a picture of page sharing from pmap_attributes */
+			/* but this would undercount as only faulted-in mappings would      */
+			/* show up.							    */
 
-	while(entry->is_sub_map && recurse_count) {
-		recurse_count--;
-		vm_map_lock_read(entry->object.sub_map);
+			if ((curr_object == object) && curr_object->shadow) {
+				disposition |= VM_PAGE_QUERY_PAGE_COPIED;
+			}
 
+			if (!curr_object->internal) {
+				disposition |= VM_PAGE_QUERY_PAGE_EXTERNAL;
+			}
 
-		if(entry == base_entry) {
-			start = entry->offset;
-		start += *address - entry->vme_start;
-		}
+			if (m != VM_PAGE_NULL) {
+				if (m->vmp_fictitious) {
+					disposition |= VM_PAGE_QUERY_PAGE_FICTITIOUS;
+				} else {
+					if (m->vmp_dirty || pmap_is_modified(VM_PAGE_GET_PHYS_PAGE(m))) {
+						disposition |= VM_PAGE_QUERY_PAGE_DIRTY;
+					}
 
-		submap = entry->object.sub_map;
-		vm_map_unlock_read(map);
-		map = submap;
+					if (m->vmp_reference || pmap_is_referenced(VM_PAGE_GET_PHYS_PAGE(m))) {
+						disposition |= VM_PAGE_QUERY_PAGE_REF;
+					}
 
-		if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-			if ((entry = tmp_entry->vme_next) 
-						== vm_map_to_entry(map)) {
-				vm_map_unlock_read(map);
-		        	map = base_map;
-	                	start = base_next;
-				recurse_count = 0;
-				*nesting_depth = 0;
-				goto LOOKUP_NEXT_BASE_ENTRY;
-			}
-		} else {
-			entry = tmp_entry;
+					if (m->vmp_q_state == VM_PAGE_ON_SPECULATIVE_Q) {
+						disposition |= VM_PAGE_QUERY_PAGE_SPECULATIVE;
+					}
 
-		}
-		if(start <= entry->vme_start) {
-			vm_offset_t	old_start = start;
-			if(baddr_start_delta) {
-				base_addr += (baddr_start_delta);
-				*size -= baddr_start_delta;
-				baddr_start_delta = 0;
-			}
-			if(base_next <= 
-				(base_addr += (entry->vme_start - start))) {
-				vm_map_unlock_read(map);
-				map = base_map;
-				start = base_next;
-				recurse_count = 0;
-				*nesting_depth = 0;
-				goto LOOKUP_NEXT_BASE_ENTRY;
-			}
-			*size -= entry->vme_start - start;
-			if (*size > (entry->vme_end - entry->vme_start)) {
-				*size = entry->vme_end - entry->vme_start;
-			}
-			start = 0;
-		} else {
-			if(baddr_start_delta) {
-				if((start - entry->vme_start) 
-						< baddr_start_delta) {
-					base_addr += start - entry->vme_start;
-					*size -= start - entry->vme_start;
-				} else {
-					base_addr += baddr_start_delta;
-					*size += baddr_start_delta;
+					if (m->vmp_cs_validated) {
+						disposition |= VM_PAGE_QUERY_PAGE_CS_VALIDATED;
+					}
+					if (m->vmp_cs_tainted) {
+						disposition |= VM_PAGE_QUERY_PAGE_CS_TAINTED;
+					}
+					if (m->vmp_cs_nx) {
+						disposition |= VM_PAGE_QUERY_PAGE_CS_NX;
+					}
+					if (m->vmp_reusable || curr_object->all_reusable) {
+						disposition |= VM_PAGE_QUERY_PAGE_REUSABLE;
+					}
 				}
-				baddr_start_delta = 0;
-			}
-			base_addr += entry->vme_start;
-			if(base_addr >= base_next) {
-				vm_map_unlock_read(map);
-				map = base_map;
-				start = base_next;
-				recurse_count = 0;
-				*nesting_depth = 0;
-				goto LOOKUP_NEXT_BASE_ENTRY;
 			}
-			if (*size > (entry->vme_end - start))
-				*size = entry->vme_end - start;
 
-			start = entry->vme_start - start;
-		}
+			switch (flavor) {
+			case VM_PAGE_INFO_BASIC:
+				basic_info = (vm_page_info_basic_t) (((uintptr_t) info) + (info_idx * sizeof(struct vm_page_info_basic)));
+				basic_info->disposition = disposition;
+				basic_info->ref_count = ref_count;
+				basic_info->object_id = (vm_object_id_t) (uintptr_t)
+				    VM_KERNEL_ADDRPERM(curr_object);
+				basic_info->offset =
+				    (memory_object_offset_t) curr_offset_in_object + offset_in_page;
+				basic_info->depth = depth;
+
+				info_idx++;
+				break;
+			}
 
-		start += entry->offset;
+			disposition = 0;
+			offset_in_page = 0; // This doesn't really make sense for any offset other than the starting offset.
 
-	}
-	*nesting_depth -= recurse_count;
-	if(entry != base_entry) {
-		start = entry->vme_start + (start - entry->offset);
-	}
+			/*
+			 * Move to next offset in the range and in our object.
+			 */
+			curr_s_offset += PAGE_SIZE;
+			offset_in_object += PAGE_SIZE;
+			curr_offset_in_object = offset_in_object;
 
+			if (curr_object != object) {
+				vm_object_unlock(curr_object);
 
-	submap_info->user_tag = entry->alias;
-	submap_info->offset = entry->offset;
-	submap_info->protection = entry->protection;
-	submap_info->inheritance = entry->inheritance;
-	submap_info->max_protection = entry->max_protection;
-	submap_info->behavior = entry->behavior;
-	submap_info->user_wired_count = entry->user_wired_count;
-	submap_info->is_submap = entry->is_sub_map;
-	submap_info->object_id = (vm_offset_t)entry->object.vm_object;
-	*address = base_addr;
+				curr_object = object;
 
+				vm_object_lock_shared(curr_object);
+			} else {
+				vm_object_lock_yield_shared(curr_object);
+			}
+		}
 
-	extended.pages_resident = 0;
-	extended.pages_swapped_out = 0;
-	extended.pages_shared_now_private = 0;
-	extended.pages_dirtied = 0;
-	extended.external_pager = 0;
-	extended.shadow_depth = 0;
+		vm_object_unlock(curr_object);
+		vm_object_deallocate(curr_object);
 
-	if(!entry->is_sub_map) {
-		vm_region_walk(entry, &extended, entry->offset, 
-				entry->vme_end - start, map, start);
-		submap_info->share_mode = extended.share_mode;
-		if (extended.external_pager && extended.ref_count == 2 
-					&& extended.share_mode == SM_SHARED)
-			submap_info->share_mode = SM_PRIVATE;
-		submap_info->ref_count = extended.ref_count;
-	} else {
-		if(entry->use_pmap) 
-			submap_info->share_mode =  SM_TRUESHARED;
-		else
-			submap_info->share_mode = SM_PRIVATE;
-		submap_info->ref_count = entry->object.sub_map->ref_count;
+		vm_map_lock_read(map);
 	}
 
-	submap_info->pages_resident = extended.pages_resident;
-	submap_info->pages_swapped_out = extended.pages_swapped_out;
-	submap_info->pages_shared_now_private = 
-				extended.pages_shared_now_private;
-	submap_info->pages_dirtied = extended.pages_dirtied;
-	submap_info->external_pager = extended.external_pager;
-	submap_info->shadow_depth = extended.shadow_depth;
-
 	vm_map_unlock_read(map);
-	return(KERN_SUCCESS);
+	return retval;
 }
 
 /*
- *	TEMPORARYTEMPORARYTEMPORARYTEMPORARYTEMPORARYTEMPORARY
- *	Goes away after regular vm_region_recurse function migrates to
- *	64 bits
- *	vm_region_recurse: A form of vm_region which follows the
- *	submaps in a target map
+ *	vm_map_msync
+ *
+ *	Synchronises the specified memory range with its backing store
+ *	image by either flushing or cleaning the contents to the appropriate
+ *	memory manager, engaging in a memory object synchronize dialog with
+ *	the manager.  The client doesn't return until the manager issues an
+ *	m_o_s_completed message.  MIG magically converts the user task
+ *	parameter to the task's address map.
+ *
+ *	interpretation of sync_flags
+ *	VM_SYNC_INVALIDATE	- discard pages, only return precious
+ *				  pages to manager.
+ *
+ *	VM_SYNC_INVALIDATE & (VM_SYNC_SYNCHRONOUS | VM_SYNC_ASYNCHRONOUS)
+ *				- discard pages, write dirty or precious
+ *				  pages back to memory manager.
+ *
+ *	VM_SYNC_SYNCHRONOUS | VM_SYNC_ASYNCHRONOUS
+ *				- write dirty or precious pages back to
+ *				  the memory manager.
  *
+ *	VM_SYNC_CONTIGUOUS	- does everything normally, but if there
+ *				  is a hole in the region, and we would
+ *				  have returned KERN_SUCCESS, return
+ *				  KERN_INVALID_ADDRESS instead.
+ *
+ *	NOTE
+ *	The memory object attributes have not yet been implemented; this
+ *	function will have to deal with the invalidate attribute.
+ *
+ *	RETURNS
+ *	KERN_INVALID_TASK		Bad task parameter
+ *	KERN_INVALID_ARGUMENT		Both sync and async were specified.
+ *	KERN_SUCCESS			The usual.
+ *	KERN_INVALID_ADDRESS		Hole in the region (VM_SYNC_CONTIGUOUS only).
  */
 
 kern_return_t
-vm_region_recurse_64(
-	vm_map_t		 map,
-	vm_offset_t	        *address,		/* IN/OUT */
-	vm_size_t		*size,			/* OUT */
-	natural_t	 	*nesting_depth,		/* IN/OUT */
-	vm_region_recurse_info_t info,			/* IN/OUT */
-	mach_msg_type_number_t	*count)			/* IN/OUT */
-{
-	vm_map_entry_t		tmp_entry;
-	register
-	vm_map_entry_t		entry;
-	register
-	vm_offset_t		start;
-
-	unsigned int			recurse_count;
-	vm_map_t			submap;
-	vm_map_t			base_map;
-	vm_map_entry_t			base_entry;
-	vm_offset_t			base_next;
-	vm_offset_t			base_addr;
-	vm_offset_t			baddr_start_delta;
-	vm_region_submap_info_64_t	submap_info;
-	vm_region_extended_info_data_t	extended;
-
-	if (map == VM_MAP_NULL) 
-		return(KERN_INVALID_ARGUMENT);
-
-	submap_info = (vm_region_submap_info_64_t) info;
-	*count = VM_REGION_SUBMAP_INFO_COUNT;
-
-	if (*count < VM_REGION_SUBMAP_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+vm_map_msync(
+	vm_map_t                map,
+	vm_map_address_t        address,
+	vm_map_size_t           size,
+	vm_sync_t               sync_flags)
+{
+	vm_map_entry_t          entry;
+	vm_map_size_t           amount_left;
+	vm_object_offset_t      offset;
+	boolean_t               do_sync_req;
+	boolean_t               had_hole = FALSE;
+	vm_map_offset_t         pmap_offset;
+
+	if ((sync_flags & VM_SYNC_ASYNCHRONOUS) &&
+	    (sync_flags & VM_SYNC_SYNCHRONOUS)) {
+		return KERN_INVALID_ARGUMENT;
+	}
 
-	start = *address;
-	base_map = map;
-	recurse_count = *nesting_depth;
+	/*
+	 * align address and size on page boundaries
+	 */
+	size = (vm_map_round_page(address + size,
+	    VM_MAP_PAGE_MASK(map)) -
+	    vm_map_trunc_page(address,
+	    VM_MAP_PAGE_MASK(map)));
+	address = vm_map_trunc_page(address,
+	    VM_MAP_PAGE_MASK(map));
+
+	if (map == VM_MAP_NULL) {
+		return KERN_INVALID_TASK;
+	}
 
-LOOKUP_NEXT_BASE_ENTRY:
-	vm_map_lock_read(map);
-        if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-			return(KERN_INVALID_ADDRESS);
-		}
-	} else {
-		entry = tmp_entry;
+	if (size == 0) {
+		return KERN_SUCCESS;
 	}
-	*size = entry->vme_end - entry->vme_start;
-	start = entry->vme_start;
-	base_addr = start;
-	baddr_start_delta = *address - start;
-	base_next = entry->vme_end;
-	base_entry = entry;
 
-	while(entry->is_sub_map && recurse_count) {
-		recurse_count--;
-		vm_map_lock_read(entry->object.sub_map);
+	amount_left = size;
 
+	while (amount_left > 0) {
+		vm_object_size_t        flush_size;
+		vm_object_t             object;
 
-		if(entry == base_entry) {
-			start = entry->offset;
-		start += *address - entry->vme_start;
-		}
+		vm_map_lock(map);
+		if (!vm_map_lookup_entry(map,
+		    address,
+		    &entry)) {
+			vm_map_size_t   skip;
 
-		submap = entry->object.sub_map;
-		vm_map_unlock_read(map);
-		map = submap;
+			/*
+			 * hole in the address map.
+			 */
+			had_hole = TRUE;
 
-		if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-			if ((entry = tmp_entry->vme_next) 
-						== vm_map_to_entry(map)) {
-				vm_map_unlock_read(map);
-		        	map = base_map;
-	                	start = base_next;
-				recurse_count = 0;
-				*nesting_depth = 0;
-				goto LOOKUP_NEXT_BASE_ENTRY;
+			if (sync_flags & VM_SYNC_KILLPAGES) {
+				/*
+				 * For VM_SYNC_KILLPAGES, there should be
+				 * no holes in the range, since we couldn't
+				 * prevent someone else from allocating in
+				 * that hole and we wouldn't want to "kill"
+				 * their pages.
+				 */
+				vm_map_unlock(map);
+				break;
 			}
-		} else {
-			entry = tmp_entry;
 
-		}
-		if(start <= entry->vme_start) {
-			vm_offset_t	old_start = start;
-			if(baddr_start_delta) {
-				base_addr += (baddr_start_delta);
-				*size -= baddr_start_delta;
-				baddr_start_delta = 0;
+			/*
+			 * Check for empty map.
+			 */
+			if (entry == vm_map_to_entry(map) &&
+			    entry->vme_next == entry) {
+				vm_map_unlock(map);
+				break;
 			}
-			if(base_next <= 
-				(base_addr += (entry->vme_start - start))) {
-				vm_map_unlock_read(map);
-				map = base_map;
-				start = base_next;
-				recurse_count = 0;
-				*nesting_depth = 0;
-				goto LOOKUP_NEXT_BASE_ENTRY;
+			/*
+			 * Check that we don't wrap and that
+			 * we have at least one real map entry.
+			 */
+			if ((map->hdr.nentries == 0) ||
+			    (entry->vme_next->vme_start < address)) {
+				vm_map_unlock(map);
+				break;
 			}
-			*size -= entry->vme_start - start;
-			if (*size > (entry->vme_end - entry->vme_start)) {
-				*size = entry->vme_end - entry->vme_start;
+			/*
+			 * Move up to the next entry if needed
+			 */
+			skip = (entry->vme_next->vme_start - address);
+			if (skip >= amount_left) {
+				amount_left = 0;
+			} else {
+				amount_left -= skip;
 			}
-			start = 0;
+			address = entry->vme_next->vme_start;
+			vm_map_unlock(map);
+			continue;
+		}
+
+		offset = address - entry->vme_start;
+		pmap_offset = address;
+
+		/*
+		 * do we have more to flush than is contained in this
+		 * entry ?
+		 */
+		if (amount_left + entry->vme_start + offset > entry->vme_end) {
+			flush_size = entry->vme_end -
+			    (entry->vme_start + offset);
 		} else {
-			if(baddr_start_delta) {
-				if((start - entry->vme_start) 
-						< baddr_start_delta) {
-					base_addr += start - entry->vme_start;
-					*size -= start - entry->vme_start;
+			flush_size = amount_left;
+		}
+		amount_left -= flush_size;
+		address += flush_size;
+
+		if (entry->is_sub_map == TRUE) {
+			vm_map_t        local_map;
+			vm_map_offset_t local_offset;
+
+			local_map = VME_SUBMAP(entry);
+			local_offset = VME_OFFSET(entry);
+			vm_map_reference(local_map);
+			vm_map_unlock(map);
+			if (vm_map_msync(
+				    local_map,
+				    local_offset,
+				    flush_size,
+				    sync_flags) == KERN_INVALID_ADDRESS) {
+				had_hole = TRUE;
+			}
+			vm_map_deallocate(local_map);
+			continue;
+		}
+		object = VME_OBJECT(entry);
+
+		/*
+		 * We can't sync this object if the object has not been
+		 * created yet
+		 */
+		if (object == VM_OBJECT_NULL) {
+			vm_map_unlock(map);
+			continue;
+		}
+		offset += VME_OFFSET(entry);
+
+		vm_object_lock(object);
+
+		if (sync_flags & (VM_SYNC_KILLPAGES | VM_SYNC_DEACTIVATE)) {
+			int kill_pages = 0;
+			boolean_t reusable_pages = FALSE;
+
+			if (sync_flags & VM_SYNC_KILLPAGES) {
+				if (((object->ref_count == 1) ||
+				    ((object->copy_strategy !=
+				    MEMORY_OBJECT_COPY_SYMMETRIC) &&
+				    (object->copy == VM_OBJECT_NULL))) &&
+				    (object->shadow == VM_OBJECT_NULL)) {
+					if (object->ref_count != 1) {
+						vm_page_stats_reusable.free_shared++;
+					}
+					kill_pages = 1;
 				} else {
-					base_addr += baddr_start_delta;
-					*size += baddr_start_delta;
+					kill_pages = -1;
 				}
-				baddr_start_delta = 0;
 			}
-			base_addr += entry->vme_start;
-			if(base_addr >= base_next) {
-				vm_map_unlock_read(map);
-				map = base_map;
-				start = base_next;
-				recurse_count = 0;
-				*nesting_depth = 0;
-				goto LOOKUP_NEXT_BASE_ENTRY;
+			if (kill_pages != -1) {
+				vm_object_deactivate_pages(
+					object,
+					offset,
+					(vm_object_size_t) flush_size,
+					kill_pages,
+					reusable_pages,
+					map->pmap,
+					pmap_offset);
 			}
-			if (*size > (entry->vme_end - start))
-				*size = entry->vme_end - start;
-
-			start = entry->vme_start - start;
+			vm_object_unlock(object);
+			vm_map_unlock(map);
+			continue;
 		}
+		/*
+		 * We can't sync this object if there isn't a pager.
+		 * Don't bother to sync internal objects, since there can't
+		 * be any "permanent" storage for these objects anyway.
+		 */
+		if ((object->pager == MEMORY_OBJECT_NULL) ||
+		    (object->internal) || (object->private)) {
+			vm_object_unlock(object);
+			vm_map_unlock(map);
+			continue;
+		}
+		/*
+		 * keep reference on the object until syncing is done
+		 */
+		vm_object_reference_locked(object);
+		vm_object_unlock(object);
 
-		start += entry->offset;
-
-	}
-	*nesting_depth -= recurse_count;
-	if(entry != base_entry) {
-		start = entry->vme_start + (start - entry->offset);
-	}
+		vm_map_unlock(map);
 
+		do_sync_req = vm_object_sync(object,
+		    offset,
+		    flush_size,
+		    sync_flags & VM_SYNC_INVALIDATE,
+		    ((sync_flags & VM_SYNC_SYNCHRONOUS) ||
+		    (sync_flags & VM_SYNC_ASYNCHRONOUS)),
+		    sync_flags & VM_SYNC_SYNCHRONOUS);
 
-	submap_info->user_tag = entry->alias;
-	submap_info->offset = entry->offset;
-	submap_info->protection = entry->protection;
-	submap_info->inheritance = entry->inheritance;
-	submap_info->max_protection = entry->max_protection;
-	submap_info->behavior = entry->behavior;
-	submap_info->user_wired_count = entry->user_wired_count;
-	submap_info->is_submap = entry->is_sub_map;
-	submap_info->object_id = (vm_offset_t)entry->object.vm_object;
-	*address = base_addr;
+		if ((sync_flags & VM_SYNC_INVALIDATE) && object->resident_page_count == 0) {
+			/*
+			 * clear out the clustering and read-ahead hints
+			 */
+			vm_object_lock(object);
 
+			object->pages_created = 0;
+			object->pages_used = 0;
+			object->sequential = 0;
+			object->last_alloc = 0;
 
-	extended.pages_resident = 0;
-	extended.pages_swapped_out = 0;
-	extended.pages_shared_now_private = 0;
-	extended.pages_dirtied = 0;
-	extended.external_pager = 0;
-	extended.shadow_depth = 0;
+			vm_object_unlock(object);
+		}
+		vm_object_deallocate(object);
+	} /* while */
 
-	if(!entry->is_sub_map) {
-		vm_region_walk(entry, &extended, entry->offset, 
-				entry->vme_end - start, map, start);
-		submap_info->share_mode = extended.share_mode;
-		if (extended.external_pager && extended.ref_count == 2 
-					&& extended.share_mode == SM_SHARED)
-			submap_info->share_mode = SM_PRIVATE;
-		submap_info->ref_count = extended.ref_count;
-	} else {
-		if(entry->use_pmap) 
-			submap_info->share_mode =  SM_TRUESHARED;
-		else
-			submap_info->share_mode = SM_PRIVATE;
-		submap_info->ref_count = entry->object.sub_map->ref_count;
+	/* for proper msync() behaviour */
+	if (had_hole == TRUE && (sync_flags & VM_SYNC_CONTIGUOUS)) {
+		return KERN_INVALID_ADDRESS;
 	}
 
-	submap_info->pages_resident = extended.pages_resident;
-	submap_info->pages_swapped_out = extended.pages_swapped_out;
-	submap_info->pages_shared_now_private = 
-				extended.pages_shared_now_private;
-	submap_info->pages_dirtied = extended.pages_dirtied;
-	submap_info->external_pager = extended.external_pager;
-	submap_info->shadow_depth = extended.shadow_depth;
-
-	vm_map_unlock_read(map);
-	return(KERN_SUCCESS);
-}
-
+	return KERN_SUCCESS;
+} /* vm_map_msync */
 
 /*
- *	TEMPORARYTEMPORARYTEMPORARYTEMPORARYTEMPORARYTEMPORARY
- *	Goes away after regular vm_region function migrates to
- *	64 bits
+ *	Routine:	convert_port_entry_to_map
+ *	Purpose:
+ *		Convert from a port specifying an entry or a task
+ *		to a map. Doesn't consume the port ref; produces a map ref,
+ *		which may be null.  Unlike convert_port_to_map, the
+ *		port may be backed by a task or by a named entry.
+ *	Conditions:
+ *		Nothing locked.
  */
 
 
-kern_return_t
-vm_region_64(
-	vm_map_t		 map,
-	vm_offset_t	        *address,		/* IN/OUT */
-	vm_size_t		*size,			/* OUT */
-	vm_region_flavor_t	 flavor,		/* IN */
-	vm_region_info_t	 info,			/* OUT */
-	mach_msg_type_number_t	*count,			/* IN/OUT */
-	ipc_port_t		*object_name)		/* OUT */
-{
-	vm_map_entry_t		tmp_entry;
-	register
-	vm_map_entry_t		entry;
-	register
-	vm_offset_t		start;
-	vm_region_basic_info_64_t	basic;
-	vm_region_extended_info_t	extended;
-	vm_region_top_info_t	top;
-
-	if (map == VM_MAP_NULL) 
-		return(KERN_INVALID_ARGUMENT);
-
-	switch (flavor) {
-	
-	case VM_REGION_BASIC_INFO:
-	{
-	    if (*count < VM_REGION_BASIC_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
-
-	    basic = (vm_region_basic_info_64_t) info;
-	    *count = VM_REGION_BASIC_INFO_COUNT;
-
-	    vm_map_lock_read(map);
+vm_map_t
+convert_port_entry_to_map(
+	ipc_port_t      port)
+{
+	vm_map_t map;
+	vm_named_entry_t        named_entry;
+	uint32_t        try_failed_count = 0;
 
-	    start = *address;
-	    if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-		   	return(KERN_INVALID_ADDRESS);
+	if (IP_VALID(port) && (ip_kotype(port) == IKOT_NAMED_ENTRY)) {
+		while (TRUE) {
+			ip_lock(port);
+			if (ip_active(port) && (ip_kotype(port)
+			    == IKOT_NAMED_ENTRY)) {
+				named_entry =
+				    (vm_named_entry_t)port->ip_kobject;
+				if (!(lck_mtx_try_lock(&(named_entry)->Lock))) {
+					ip_unlock(port);
+
+					try_failed_count++;
+					mutex_pause(try_failed_count);
+					continue;
+				}
+				named_entry->ref_count++;
+				lck_mtx_unlock(&(named_entry)->Lock);
+				ip_unlock(port);
+				if ((named_entry->is_sub_map) &&
+				    (named_entry->protection
+				    & VM_PROT_WRITE)) {
+					map = named_entry->backing.map;
+				} else {
+					mach_destroy_memory_entry(port);
+					return VM_MAP_NULL;
+				}
+				vm_map_reference_swap(map);
+				mach_destroy_memory_entry(port);
+				break;
+			} else {
+				return VM_MAP_NULL;
+			}
 		}
-	    } else {
-		entry = tmp_entry;
-	    }
-
-	    start = entry->vme_start;
-
-	    basic->offset = entry->offset;
-	    basic->protection = entry->protection;
-	    basic->inheritance = entry->inheritance;
-	    basic->max_protection = entry->max_protection;
-	    basic->behavior = entry->behavior;
-	    basic->user_wired_count = entry->user_wired_count;
-	    basic->reserved = entry->is_sub_map;
-	    *address = start;
-	    *size = (entry->vme_end - start);
-
-	    if (object_name) *object_name = IP_NULL;
-	    if (entry->is_sub_map) {
-	        basic->shared = FALSE;
-	    } else {
-	        basic->shared = entry->is_shared;
-	    }
-
-	    vm_map_unlock_read(map);
-	    return(KERN_SUCCESS);
+	} else {
+		map = convert_port_to_map(port);
 	}
-	case VM_REGION_EXTENDED_INFO:
-	{
 
-	    if (*count < VM_REGION_EXTENDED_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+	return map;
+}
 
-	    extended = (vm_region_extended_info_t) info;
-	    *count = VM_REGION_EXTENDED_INFO_COUNT;
+/*
+ *	Routine:	convert_port_entry_to_object
+ *	Purpose:
+ *		Convert from a port specifying a named entry to an
+ *		object. Doesn't consume the port ref; produces an object ref,
+ *		which may be null.
+ *	Conditions:
+ *		Nothing locked.
+ */
 
-	    vm_map_lock_read(map);
 
-	    start = *address;
-	    if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-		   	return(KERN_INVALID_ADDRESS);
+vm_object_t
+convert_port_entry_to_object(
+	ipc_port_t      port)
+{
+	vm_object_t             object = VM_OBJECT_NULL;
+	vm_named_entry_t        named_entry;
+	uint32_t                try_failed_count = 0;
+
+	if (IP_VALID(port) &&
+	    (ip_kotype(port) == IKOT_NAMED_ENTRY)) {
+try_again:
+		ip_lock(port);
+		if (ip_active(port) &&
+		    (ip_kotype(port) == IKOT_NAMED_ENTRY)) {
+			named_entry = (vm_named_entry_t)port->ip_kobject;
+			if (!(lck_mtx_try_lock(&(named_entry)->Lock))) {
+				ip_unlock(port);
+				try_failed_count++;
+				mutex_pause(try_failed_count);
+				goto try_again;
+			}
+			named_entry->ref_count++;
+			lck_mtx_unlock(&(named_entry)->Lock);
+			ip_unlock(port);
+			if (!(named_entry->is_sub_map) &&
+			    !(named_entry->is_copy) &&
+			    (named_entry->protection & VM_PROT_WRITE)) {
+				object = named_entry->backing.object;
+				vm_object_reference(object);
+			}
+			mach_destroy_memory_entry(port);
 		}
-	    } else {
-		entry = tmp_entry;
-	    }
-	    start = entry->vme_start;
+	}
+
+	return object;
+}
 
-	    extended->protection = entry->protection;
-	    extended->user_tag = entry->alias;
-	    extended->pages_resident = 0;
-	    extended->pages_swapped_out = 0;
-	    extended->pages_shared_now_private = 0;
-	    extended->pages_dirtied = 0;
-	    extended->external_pager = 0;
-	    extended->shadow_depth = 0;
+/*
+ * Out-of-line current_map(), exported to other components for something this
+ * file accesses locally through a macro (hence the #undef just below).
+ */
+#undef current_map
+vm_map_t
+current_map(void)
+{
+	return current_map_fast(); /* forwards directly; no other work is done here */
+}
 
-	    vm_region_walk(entry, extended, entry->offset, entry->vme_end - start, map, start);
+/*
+ *	vm_map_reference:
+ *
+ *	Most code internal to osfmk goes through a macro of
+ *	the same name.  This function is always provided for
+ *	the use of other kernel components.
+ */
+#undef vm_map_reference
+void
+vm_map_reference(
+	vm_map_t        map)
+{
+	if (map == VM_MAP_NULL) {
+		return;
+	}
 
-	    if (extended->external_pager && extended->ref_count == 2 && extended->share_mode == SM_SHARED)
-	            extended->share_mode = SM_PRIVATE;
+	lck_mtx_lock(&map->s_lock);
+#if     TASK_SWAPPER
+	assert(map->res_count > 0);
+	assert(os_ref_get_count(&map->map_refcnt) >= map->res_count);
+	map->res_count++;
+#endif
+	os_ref_retain_locked(&map->map_refcnt);
+	lck_mtx_unlock(&map->s_lock);
+}
 
-	    if (object_name)
-	        *object_name = IP_NULL;
-	    *address = start;
-	    *size = (entry->vme_end - start);
+/*
+ *	vm_map_deallocate:
+ *
+ *	Removes a reference from the specified map,
+ *	destroying it if no references remain.
+ *	The map should not be locked.
+ */
+void
+vm_map_deallocate(
+	vm_map_t        map)
+{
+	unsigned int            ref;
 
-	    vm_map_unlock_read(map);
-	    return(KERN_SUCCESS);
+	if (map == VM_MAP_NULL) {
+		return;
 	}
-	case VM_REGION_TOP_INFO:
-	{   
 
-	    if (*count < VM_REGION_TOP_INFO_COUNT)
-		return(KERN_INVALID_ARGUMENT);
+	lck_mtx_lock(&map->s_lock);
+	ref = os_ref_release_locked(&map->map_refcnt);
+	if (ref > 0) {
+		vm_map_res_deallocate(map);
+		lck_mtx_unlock(&map->s_lock);
+		return;
+	}
+	assert(os_ref_get_count(&map->map_refcnt) == 0);
+	lck_mtx_unlock(&map->s_lock);
 
-	    top = (vm_region_top_info_t) info;
-	    *count = VM_REGION_TOP_INFO_COUNT;
+#if     TASK_SWAPPER
+	/*
+	 * The map residence count isn't decremented here because
+	 * the vm_map_delete below will traverse the entire map,
+	 * deleting entries, and the residence counts on objects
+	 * and sharing maps will go away then.
+	 */
+#endif
 
-	    vm_map_lock_read(map);
+	vm_map_destroy(map, VM_MAP_REMOVE_NO_FLAGS);
+}
 
-	    start = *address;
-	    if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		if ((entry = tmp_entry->vme_next) == vm_map_to_entry(map)) {
-			vm_map_unlock_read(map);
-		   	return(KERN_INVALID_ADDRESS);
-		}
-	    } else {
-		entry = tmp_entry;
 
-	    }
-	    start = entry->vme_start;
+void
+vm_map_disable_NX(vm_map_t map)
+{
+	if (map == NULL) {
+		return;
+	}
+	if (map->pmap == NULL) {
+		return;
+	}
 
-	    top->private_pages_resident = 0;
-	    top->shared_pages_resident = 0;
+	pmap_disable_NX(map->pmap);
+}
 
-	    vm_region_top_walk(entry, top);
+void
+vm_map_disallow_data_exec(vm_map_t map)
+{
+	if (map == NULL) {
+		return;
+	}
 
-	    if (object_name)
-	        *object_name = IP_NULL;
-	    *address = start;
-	    *size = (entry->vme_end - start);
+	map->map_disallow_data_exec = TRUE;
+}
 
-	    vm_map_unlock_read(map);
-	    return(KERN_SUCCESS);
-	}
-	default:
-	    return(KERN_INVALID_ARGUMENT);
-	}
+/* XXX Consider making these constants (VM_MAX_ADDRESS and MACH_VM_MAX_ADDRESS)
+ * more descriptive.
+ */
+void
+vm_map_set_32bit(vm_map_t map)
+{
+#if defined(__arm__) || defined(__arm64__)
+	map->max_offset = pmap_max_offset(FALSE, ARM_PMAP_MAX_OFFSET_DEVICE);
+#else
+	map->max_offset = (vm_map_offset_t)VM_MAX_ADDRESS;
+#endif
 }
 
+
 void
-vm_region_top_walk(
-        vm_map_entry_t		   entry,
-	vm_region_top_info_t       top)
+vm_map_set_64bit(vm_map_t map)
 {
-        register struct vm_object *obj, *tmp_obj;
-	register int    ref_count;
-
-	if (entry->object.vm_object == 0) {
-	    top->share_mode = SM_EMPTY;
-	    top->ref_count = 0;
-	    top->obj_id = 0;
-	    return;
-	}
-        if (entry->is_sub_map)
-	    vm_region_top_walk((vm_map_entry_t)entry->object.sub_map, top);
-	else {
-	    obj = entry->object.vm_object;
-
-	    vm_object_lock(obj);
-
-	    if ((ref_count = obj->ref_count) > 1 && obj->paging_in_progress)
-	        ref_count--;
-
-	    if (obj->shadow) {
-		if (ref_count == 1)
-		    top->private_pages_resident = obj->resident_page_count;
-		else
-		    top->shared_pages_resident = obj->resident_page_count;
-		top->ref_count  = ref_count;
-	        top->share_mode = SM_COW;
-	    
-	        while (tmp_obj = obj->shadow) {
-		    vm_object_lock(tmp_obj);
-		    vm_object_unlock(obj);
-		    obj = tmp_obj;
-
-		    if ((ref_count = obj->ref_count) > 1 && obj->paging_in_progress)
-		        ref_count--;
-
-		    top->shared_pages_resident += obj->resident_page_count;
-		    top->ref_count += ref_count - 1;
-		}
-	    } else {
-	        if (entry->needs_copy) {
-		    top->share_mode = SM_COW;
-		    top->shared_pages_resident = obj->resident_page_count;
-		} else {
-		    if (ref_count == 1 ||
-		       (ref_count == 2 && !(obj->pager_trusted) && !(obj->internal))) {
-		        top->share_mode = SM_PRIVATE;
-			top->private_pages_resident = obj->resident_page_count;
-		    } else {
-		        top->share_mode = SM_SHARED;
-			top->shared_pages_resident = obj->resident_page_count;
-		    }
-		}
-		top->ref_count = ref_count;
-	    }
-	    top->obj_id = (int)obj;
+#if defined(__arm__) || defined(__arm64__)
+	map->max_offset = pmap_max_offset(TRUE, ARM_PMAP_MAX_OFFSET_DEVICE);
+#else
+	map->max_offset = (vm_map_offset_t)MACH_VM_MAX_ADDRESS;
+#endif
+}
 
-	    vm_object_unlock(obj);
-	}
+/*
+ * Expand the maximum size of an existing map to the maximum supported.
+ */
+void
+vm_map_set_jumbo(vm_map_t map)
+{
+#if defined (__arm64__)
+	vm_map_set_max_addr(map, ~0);
+#else /* arm64 */
+	(void) map;
+#endif
 }
 
+/*
+ * This map has a JIT entitlement
+ */
 void
-vm_region_walk(
-        vm_map_entry_t		   entry,
-	vm_region_extended_info_t  extended,
-	vm_object_offset_t	   offset,
-	vm_offset_t		   range,
-	vm_map_t		   map,
-	vm_offset_t                va)
-{
-        register struct vm_object *obj, *tmp_obj;
-	register vm_offset_t       last_offset;
-	register int               i;
-	register int               ref_count;
-	void vm_region_look_for_page();
-
-	if ((entry->object.vm_object == 0) || 
-		(entry->object.vm_object->phys_contiguous)) {
-	    extended->share_mode = SM_EMPTY;
-	    extended->ref_count = 0;
-	    return;
-	}
-        if (entry->is_sub_map)
-	    vm_region_walk((vm_map_entry_t)entry->object.sub_map, extended, offset + entry->offset,
-			   range, map, va);
-	else {
-	    obj = entry->object.vm_object;
-
-	    vm_object_lock(obj);
-
-	    if ((ref_count = obj->ref_count) > 1 && obj->paging_in_progress)
-	        ref_count--;
-
-	    for (last_offset = offset + range; offset < last_offset; offset += PAGE_SIZE_64, va += PAGE_SIZE)
-	        vm_region_look_for_page(obj, extended, offset, ref_count, 0, map, va);
-
-	    if (extended->shadow_depth || entry->needs_copy)
-	        extended->share_mode = SM_COW;
-	    else {
-	        if (ref_count == 1)
-		    extended->share_mode = SM_PRIVATE;
-		else {
-	            if (obj->true_share)
-		        extended->share_mode = SM_TRUESHARED;
-		    else
-		        extended->share_mode = SM_SHARED;
-		}
-	    }
-	    extended->ref_count = ref_count - extended->shadow_depth;
-	    
-	    for (i = 0; i < extended->shadow_depth; i++) {
-	        if ((tmp_obj = obj->shadow) == 0)
-		    break;
-		vm_object_lock(tmp_obj);
-		vm_object_unlock(obj);
+vm_map_set_jit_entitled(vm_map_t map)
+{
+#if defined (__arm64__)
+	pmap_set_jit_entitled(map->pmap);
+#else /* arm64 */
+	(void) map;
+#endif
+}
 
-		if ((ref_count = tmp_obj->ref_count) > 1 && tmp_obj->paging_in_progress)
-		    ref_count--;
+/*
+ * Expand the maximum size of an existing map.
+ */
+void
+vm_map_set_max_addr(vm_map_t map, vm_map_offset_t new_max_offset)
+{
+#if defined(__arm64__)
+	vm_map_offset_t max_supported_offset = 0;
+	vm_map_offset_t old_max_offset = map->max_offset;
+	max_supported_offset = pmap_max_offset(vm_map_is_64bit(map), ARM_PMAP_MAX_OFFSET_JUMBO);
 
-		extended->ref_count += ref_count;
-		obj = tmp_obj;
-	    }
-	    vm_object_unlock(obj);
+	new_max_offset = trunc_page(new_max_offset);
 
-	    if (extended->share_mode == SM_SHARED) {
-	        register vm_map_entry_t	     cur;
-	        register vm_map_entry_t	     last;
-		int      my_refs;
+	/* The address space cannot be shrunk using this routine. */
+	if (old_max_offset >= new_max_offset) {
+		return;
+	}
 
-	        obj = entry->object.vm_object;
-		last = vm_map_to_entry(map);
-		my_refs = 0;
+	if (max_supported_offset < new_max_offset) {
+		new_max_offset = max_supported_offset;
+	}
 
-		if ((ref_count = obj->ref_count) > 1 && obj->paging_in_progress)
-		        ref_count--;
-		for (cur = vm_map_first_entry(map); cur != last; cur = cur->vme_next)
-		    my_refs += vm_region_count_obj_refs(cur, obj);
+	map->max_offset = new_max_offset;
 
-		if (my_refs == ref_count)
-		    extended->share_mode = SM_PRIVATE_ALIASED;
-		else if (my_refs > 1)
-		    extended->share_mode = SM_SHARED_ALIASED;
-	    }
+	if (map->holes_list->prev->vme_end == old_max_offset) {
+		/*
+		 * There is already a hole at the end of the map; simply make it bigger.
+		 */
+		map->holes_list->prev->vme_end = map->max_offset;
+	} else {
+		/*
+		 * There is no hole at the end, so we need to create a new hole
+		 * for the new empty space we're creating.
+		 */
+		struct vm_map_links *new_hole = zalloc(vm_map_holes_zone);
+		new_hole->start = old_max_offset;
+		new_hole->end = map->max_offset;
+		new_hole->prev = map->holes_list->prev;
+		new_hole->next = (struct vm_map_entry *)map->holes_list;
+		map->holes_list->prev->links.next = (struct vm_map_entry *)new_hole;
+		map->holes_list->prev = (struct vm_map_entry *)new_hole;
 	}
+#else
+	(void)map;
+	(void)new_max_offset;
+#endif
 }
 
-
-/* object is locked on entry and locked on return */
-
+vm_map_offset_t
+vm_compute_max_offset(boolean_t is64)
+{
+#if defined(__arm__) || defined(__arm64__)
+	return pmap_max_offset(is64, ARM_PMAP_MAX_OFFSET_DEVICE);
+#else
+	return is64 ? (vm_map_offset_t)MACH_VM_MAX_ADDRESS : (vm_map_offset_t)VM_MAX_ADDRESS;
+#endif
+}
 
 void
-vm_region_look_for_page(
-        vm_object_t		   object,
-	vm_region_extended_info_t  extended,
-	vm_object_offset_t	   offset,
-	int                        max_refcnt,
-        int                        depth,
-	vm_map_t		   map,
-	vm_offset_t                va)
-{
-        register vm_page_t	   p;
-        register vm_object_t	   shadow;
-	register int               ref_count;
-	vm_object_t		   caller_object;
-        
-	shadow = object->shadow;
-	caller_object = object;
+vm_map_get_max_aslr_slide_section(
+	vm_map_t                map __unused,
+	int64_t                 *max_sections,
+	int64_t                 *section_size)
+{
+#if defined(__arm64__)
+	*max_sections = 3;
+	*section_size = ARM_TT_TWIG_SIZE;
+#else
+	*max_sections = 1;
+	*section_size = 0;
+#endif
+}
 
-	
-	while (TRUE) {
+uint64_t
+vm_map_get_max_aslr_slide_pages(vm_map_t map)
+{
+#if defined(__arm64__)
+	/* Limit arm64 slide to 16MB to conserve contiguous VA space in the more
+	 * limited embedded address space; this is also meant to minimize pmap
+	 * memory usage on 16KB page systems.
+	 */
+	return 1 << (24 - VM_MAP_PAGE_SHIFT(map));
+#else
+	return 1 << (vm_map_is_64bit(map) ? 16 : 8);
+#endif
+}
 
-		if ( !(object->pager_trusted) && !(object->internal))
-			    extended->external_pager = 1;
+uint64_t
+vm_map_get_max_loader_aslr_slide_pages(vm_map_t map)
+{
+#if defined(__arm64__)
+	/* We limit the loader slide to 4MB, in order to ensure at least 8 bits
+	 * of independent entropy on 16KB page systems.
+	 */
+	return 1 << (22 - VM_MAP_PAGE_SHIFT(map));
+#else
+	return 1 << (vm_map_is_64bit(map) ? 16 : 8);
+#endif
+}
 
-		if ((p = vm_page_lookup(object, offset)) != VM_PAGE_NULL) {
-	        	if (shadow && (max_refcnt == 1))
-		    		extended->pages_shared_now_private++;
+#ifndef __arm__
+boolean_t
+vm_map_is_64bit(
+	vm_map_t map)
+{
+	return map->max_offset > ((vm_map_offset_t)VM_MAX_ADDRESS);
+}
+#endif
+
+boolean_t
+vm_map_has_hard_pagezero(
+	vm_map_t        map,
+	vm_map_offset_t pagezero_size)
+{
+	/*
+	 * XXX FBDP
+	 * We should lock the VM map (for read) here but we can get away
+	 * with it for now because there can't really be any race condition:
+	 * the VM map's min_offset is changed only when the VM map is created
+	 * and when the zero page is established (when the binary gets loaded),
+	 * and this routine gets called only when the task terminates and the
+	 * VM map is being torn down, and when a new map is created via
+	 * load_machfile()/execve().
+	 */
+	return map->min_offset >= pagezero_size;
+}
 
-			if (p->dirty || pmap_is_modified(p->phys_addr))
-		    		extended->pages_dirtied++;
-	        	extended->pages_resident++;
+/*
+ * Raise a VM map's maximum offset.
+ */
+kern_return_t
+vm_map_raise_max_offset(
+	vm_map_t        map,
+	vm_map_offset_t new_max_offset)
+{
+	kern_return_t   ret;
 
-			if(object != caller_object)
-				vm_object_unlock(object);
+	vm_map_lock(map);
+	ret = KERN_INVALID_ADDRESS;
 
-			return;
+	if (new_max_offset >= map->max_offset) {
+		if (!vm_map_is_64bit(map)) {
+			if (new_max_offset <= (vm_map_offset_t)VM_MAX_ADDRESS) {
+				map->max_offset = new_max_offset;
+				ret = KERN_SUCCESS;
+			}
+		} else {
+			if (new_max_offset <= (vm_map_offset_t)MACH_VM_MAX_ADDRESS) {
+				map->max_offset = new_max_offset;
+				ret = KERN_SUCCESS;
+			}
 		}
-		if (object->existence_map) {
-	    		if (vm_external_state_get(object->existence_map, offset) == VM_EXTERNAL_STATE_EXISTS) {
-
-	        		extended->pages_swapped_out++;
+	}
 
-				if(object != caller_object)
-					vm_object_unlock(object);
+	vm_map_unlock(map);
+	return ret;
+}
 
-				return;
-	    		}
-		}
-		if (shadow) {
-	    		vm_object_lock(shadow);
 
-			if ((ref_count = shadow->ref_count) > 1 && shadow->paging_in_progress)
-			        ref_count--;
+/*
+ * Raise a VM map's minimum offset.
+ * To strictly enforce "page zero" reservation.
+ */
+kern_return_t
+vm_map_raise_min_offset(
+	vm_map_t        map,
+	vm_map_offset_t new_min_offset)
+{
+	vm_map_entry_t  first_entry;
 
-	    		if (++depth > extended->shadow_depth)
-	        		extended->shadow_depth = depth;
+	new_min_offset = vm_map_round_page(new_min_offset,
+	    VM_MAP_PAGE_MASK(map));
 
-	    		if (ref_count > max_refcnt)
-	        		max_refcnt = ref_count;
-			
-			if(object != caller_object)
-				vm_object_unlock(object);
+	vm_map_lock(map);
 
-			object = shadow;
-			shadow = object->shadow;
-			offset = offset + object->shadow_offset;
-			continue;
-		}
-		if(object != caller_object)
-			vm_object_unlock(object);
-		break;
+	if (new_min_offset < map->min_offset) {
+		/*
+		 * Can't move min_offset backwards, as that would expose
+		 * a part of the address space that was previously, and for
+		 * possibly good reasons, inaccessible.
+		 */
+		vm_map_unlock(map);
+		return KERN_INVALID_ADDRESS;
+	}
+	if (new_min_offset >= map->max_offset) {
+		/* can't go beyond the end of the address space */
+		vm_map_unlock(map);
+		return KERN_INVALID_ADDRESS;
 	}
-}
-
 
-vm_region_count_obj_refs(
-        vm_map_entry_t    entry,
-	vm_object_t       object)
-{
-        register int ref_count;
-	register vm_object_t chk_obj;
-	register vm_object_t tmp_obj;
+	first_entry = vm_map_first_entry(map);
+	if (first_entry != vm_map_to_entry(map) &&
+	    first_entry->vme_start < new_min_offset) {
+		/*
+		 * Some memory was already allocated below the new
+		 * minimum offset.  It's too late to change it now...
+		 */
+		vm_map_unlock(map);
+		return KERN_NO_SPACE;
+	}
 
-	if (entry->object.vm_object == 0)
-	    return(0);
+	map->min_offset = new_min_offset;
 
-        if (entry->is_sub_map)
-	    ref_count = vm_region_count_obj_refs((vm_map_entry_t)entry->object.sub_map, object);
-	else {
-	    ref_count = 0;
+	assert(map->holes_list);
+	map->holes_list->start = new_min_offset;
+	assert(new_min_offset < map->holes_list->end);
 
-	    chk_obj = entry->object.vm_object;
-	    vm_object_lock(chk_obj);
+	vm_map_unlock(map);
 
-	    while (chk_obj) {
-	        if (chk_obj == object)
-		    ref_count++;
-		if (tmp_obj = chk_obj->shadow)
-		    vm_object_lock(tmp_obj);
-		vm_object_unlock(chk_obj);
-		
-		chk_obj = tmp_obj;
-	    }
-	}
-	return(ref_count);
+	return KERN_SUCCESS;
 }
 
-
 /*
- *	Routine:	vm_map_simplify
- *
- *	Description:
- *		Attempt to simplify the map representation in
- *		the vicinity of the given starting address.
- *	Note:
- *		This routine is intended primarily to keep the
- *		kernel maps more compact -- they generally don't
- *		benefit from the "expand a map entry" technology
- *		at allocation time because the adjacent entry
- *		is often wired down.
+ * Set the limit on the maximum amount of user wired memory allowed for this map.
+ * This is basically a copy of the MEMLOCK rlimit value maintained by the BSD side of
+ * the kernel.  The limits are checked in the mach VM side, so we keep a copy so we
+ * don't have to reach over to the BSD data structures.
  */
+
 void
-vm_map_simplify(
-	vm_map_t	map,
-	vm_offset_t	start)
+vm_map_set_user_wire_limit(vm_map_t     map,
+    vm_size_t    limit)
 {
-	vm_map_entry_t	this_entry;
-	vm_map_entry_t	prev_entry;
-	vm_map_entry_t	next_entry;
+	map->user_wire_limit = limit;
+}
 
+
+void
+vm_map_switch_protect(vm_map_t     map,
+    boolean_t    val)
+{
 	vm_map_lock(map);
-	if (
-		(vm_map_lookup_entry(map, start, &this_entry)) &&
-		((prev_entry = this_entry->vme_prev) != vm_map_to_entry(map)) &&
-
-		(prev_entry->vme_end == this_entry->vme_start) &&
-
-		(prev_entry->is_shared == FALSE) &&
-		(prev_entry->is_sub_map == FALSE) &&
-
-		(this_entry->is_shared == FALSE) &&
-		(this_entry->is_sub_map == FALSE) &&
-
-		(prev_entry->inheritance == this_entry->inheritance) &&
-		(prev_entry->protection == this_entry->protection) &&
-		(prev_entry->max_protection == this_entry->max_protection) &&
-		(prev_entry->behavior == this_entry->behavior) &&
-		(prev_entry->wired_count == this_entry->wired_count) &&
-		(prev_entry->user_wired_count == this_entry->user_wired_count)&&
-		(prev_entry->in_transition == FALSE) &&
-		(this_entry->in_transition == FALSE) &&
-
-		(prev_entry->needs_copy == this_entry->needs_copy) &&
-
-		(prev_entry->object.vm_object == this_entry->object.vm_object)&&
-		((prev_entry->offset +
-		 (prev_entry->vme_end - prev_entry->vme_start))
-		     == this_entry->offset)
-	) {
-		SAVE_HINT(map, prev_entry);
-		vm_map_entry_unlink(map, this_entry);
-		prev_entry->vme_end = this_entry->vme_end;
-		UPDATE_FIRST_FREE(map, map->first_free);
-	 	vm_object_deallocate(this_entry->object.vm_object);
-		vm_map_entry_dispose(map, this_entry);
-		counter(c_vm_map_simplified_lower++);
-	}
-	if (
-		(vm_map_lookup_entry(map, start, &this_entry)) &&
-		((next_entry = this_entry->vme_next) != vm_map_to_entry(map)) &&
-
-		(next_entry->vme_start == this_entry->vme_end) &&
-
-		(next_entry->is_shared == FALSE) &&
-		(next_entry->is_sub_map == FALSE) &&
-
-		(next_entry->is_shared == FALSE) &&
-		(next_entry->is_sub_map == FALSE) &&
-
-		(next_entry->inheritance == this_entry->inheritance) &&
-		(next_entry->protection == this_entry->protection) &&
-		(next_entry->max_protection == this_entry->max_protection) &&
-		(next_entry->behavior == this_entry->behavior) &&
-		(next_entry->wired_count == this_entry->wired_count) &&
-		(next_entry->user_wired_count == this_entry->user_wired_count)&&
-		(this_entry->in_transition == FALSE) &&
-		(next_entry->in_transition == FALSE) &&
-
-		(next_entry->needs_copy == this_entry->needs_copy) &&
-
-		(next_entry->object.vm_object == this_entry->object.vm_object)&&
-		((this_entry->offset +
-		 (this_entry->vme_end - this_entry->vme_start))
-		     == next_entry->offset)
-	) {
-		vm_map_entry_unlink(map, next_entry);
-		this_entry->vme_end = next_entry->vme_end;
-		UPDATE_FIRST_FREE(map, map->first_free);
-	 	vm_object_deallocate(next_entry->object.vm_object);
-		vm_map_entry_dispose(map, next_entry);
-		counter(c_vm_map_simplified_upper++);
-	}
-	counter(c_vm_map_simplify_called++);
+	map->switch_protect = val;
 	vm_map_unlock(map);
 }
 
-
 /*
- *	Routine:	vm_map_machine_attribute
- *	Purpose:
- *		Provide machine-specific attributes to mappings,
- *		such as cachability etc. for machines that provide
- *		them.  NUMA architectures and machines with big/strange
- *		caches will use this.
- *	Note:
- *		Responsibilities for locking and checking are handled here,
- *		everything else in the pmap module. If any non-volatile
- *		information must be kept, the pmap module should handle
- *		it itself. [This assumes that attributes do not
- *		need to be inherited, which seems ok to me]
+ * IOKit has mapped a region into this map; adjust the pmap's ledgers appropriately.
+ * phys_footprint is a composite limit consisting of iokit + physmem, so we need to
+ * bump both counters.
  */
-kern_return_t
-vm_map_machine_attribute(
-	vm_map_t	map,
-	vm_offset_t	address,
-	vm_size_t	size,
-	vm_machine_attribute_t	attribute,
-	vm_machine_attribute_val_t* value)		/* IN/OUT */
+void
+vm_map_iokit_mapped_region(vm_map_t map, vm_size_t bytes)
 {
-	kern_return_t	ret;
-
-	if (address < vm_map_min(map) ||
-	    (address + size) > vm_map_max(map))
-		return KERN_INVALID_ADDRESS;
+	pmap_t pmap = vm_map_pmap(map);
 
-	vm_map_lock(map);
-
-	ret = pmap_attribute(map->pmap, address, size, attribute, value);
+	ledger_credit(pmap->ledger, task_ledgers.iokit_mapped, bytes);
+	ledger_credit(pmap->ledger, task_ledgers.phys_footprint, bytes);
+}
 
-	vm_map_unlock(map);
+void
+vm_map_iokit_unmapped_region(vm_map_t map, vm_size_t bytes)
+{
+	pmap_t pmap = vm_map_pmap(map);
 
-	return ret;
+	ledger_debit(pmap->ledger, task_ledgers.iokit_mapped, bytes);
+	ledger_debit(pmap->ledger, task_ledgers.phys_footprint, bytes);
 }
 
-/*
- *	vm_map_behavior_set:
- *
- *	Sets the paging reference behavior of the specified address
- *	range in the target map.  Paging reference behavior affects
- *	how pagein operations resulting from faults on the map will be 
- *	clustered.
- */
-kern_return_t 
-vm_map_behavior_set(
-	vm_map_t	map,
-	vm_offset_t	start,
-	vm_offset_t	end,
-	vm_behavior_t	new_behavior)
+/* Add (generate) code signature for memory range */
+#if CONFIG_DYNAMIC_CODE_SIGNING
+kern_return_t
+vm_map_sign(vm_map_t map,
+    vm_map_offset_t start,
+    vm_map_offset_t end)
 {
-	register vm_map_entry_t	entry;
-	vm_map_entry_t	temp_entry;
-
-	XPR(XPR_VM_MAP,
-		"vm_map_behavior_set, 0x%X start 0x%X end 0x%X behavior %d",
-		(integer_t)map, start, end, new_behavior, 0);
+	vm_map_entry_t entry;
+	vm_page_t m;
+	vm_object_t object;
 
-	switch (new_behavior) {
-	case VM_BEHAVIOR_DEFAULT:
-	case VM_BEHAVIOR_RANDOM:
-	case VM_BEHAVIOR_SEQUENTIAL:
-	case VM_BEHAVIOR_RSEQNTL:
-		break;
-	default:
-		return(KERN_INVALID_ARGUMENT);
+	/*
+	 * Vet all the input parameters and current type and state of the
+	 * underlying object.  Return with an error if anything is amiss.
+	 */
+	if (map == VM_MAP_NULL) {
+		return KERN_INVALID_ARGUMENT;
 	}
 
-	vm_map_lock(map);
+	vm_map_lock_read(map);
+
+	if (!vm_map_lookup_entry(map, start, &entry) || entry->is_sub_map) {
+		/*
+		 * Must pass a valid non-submap address.
+		 */
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ADDRESS;
+	}
 
-	/*
-	 *	The entire address range must be valid for the map.
-	 * 	Note that vm_map_range_check() does a 
-	 *	vm_map_lookup_entry() internally and returns the
-	 *	entry containing the start of the address range if
-	 *	the entire range is valid.
-	 */
-	if (vm_map_range_check(map, start, end, &temp_entry)) {
-		entry = temp_entry;
-		vm_map_clip_start(map, entry, start);
+	if ((entry->vme_start > start) || (entry->vme_end < end)) {
+		/*
+		 * Map entry doesn't cover the requested range. Not handling
+		 * this situation currently.
+		 */
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ARGUMENT;
 	}
-	else {
-		vm_map_unlock(map);
-		return(KERN_INVALID_ADDRESS);
+
+	object = VME_OBJECT(entry);
+	if (object == VM_OBJECT_NULL) {
+		/*
+		 * Object must already be present or we can't sign.
+		 */
+		vm_map_unlock_read(map);
+		return KERN_INVALID_ARGUMENT;
 	}
 
-	while ((entry != vm_map_to_entry(map)) && (entry->vme_start < end)) {
-		vm_map_clip_end(map, entry, end);
+	vm_object_lock(object);
+	vm_map_unlock_read(map);
 
-		entry->behavior = new_behavior;
+	while (start < end) {
+		uint32_t refmod;
 
-		entry = entry->vme_next;
+		m = vm_page_lookup(object,
+		    start - entry->vme_start + VME_OFFSET(entry));
+		if (m == VM_PAGE_NULL) {
+			/* should we try to fault a page here? we can probably
+			 * demand it exists and is locked for this request */
+			vm_object_unlock(object);
+			return KERN_FAILURE;
+		}
+		/* deal with special page status */
+		if (m->vmp_busy ||
+		    (m->vmp_unusual && (m->vmp_error || m->vmp_restart || m->vmp_private || m->vmp_absent))) {
+			vm_object_unlock(object);
+			return KERN_FAILURE;
+		}
+
+		/* Page is OK... now "validate" it */
+		/* This is the place where we'll call out to create a code
+		 * directory, later */
+		m->vmp_cs_validated = TRUE;
+
+		/* The page is now "clean" for codesigning purposes. That means
+		 * we don't consider it as modified (wpmapped) anymore. But
+		 * we'll disconnect the page so we note any future modification
+		 * attempts. */
+		m->vmp_wpmapped = FALSE;
+		refmod = pmap_disconnect(VM_PAGE_GET_PHYS_PAGE(m));
+
+		/* Pull the dirty status from the pmap, since we cleared the
+		 * wpmapped bit */
+		if ((refmod & VM_MEM_MODIFIED) && !m->vmp_dirty) {
+			SET_PAGE_DIRTY(m, FALSE);
+		}
+
+		/* On to the next page */
+		start += PAGE_SIZE;
 	}
+	vm_object_unlock(object);
 
-	vm_map_unlock(map);
-	return(KERN_SUCCESS);
+	return KERN_SUCCESS;
 }
+#endif
 
+kern_return_t
+vm_map_partial_reap(vm_map_t map, unsigned int *reclaimed_resident, unsigned int *reclaimed_compressed)
+{
+	vm_map_entry_t  entry = VM_MAP_ENTRY_NULL;
+	vm_map_entry_t next_entry;
+	kern_return_t   kr = KERN_SUCCESS;
+	vm_map_t        zap_map;
 
-#include <mach_kdb.h>
-#if	MACH_KDB
-#include <ddb/db_output.h>
-#include <vm/vm_print.h>
+	vm_map_lock(map);
 
-#define	printf	db_printf
+	/*
+	 * We use a "zap_map" to avoid having to unlock
+	 * the "map" in vm_map_delete().
+	 */
+	zap_map = vm_map_create(PMAP_NULL,
+	    map->min_offset,
+	    map->max_offset,
+	    map->hdr.entries_pageable);
 
-/*
- * Forward declarations for internal functions.
- */
-extern void vm_map_links_print(
-		struct vm_map_links	*links);
+	if (zap_map == VM_MAP_NULL) {
+		vm_map_unlock(map);	/* don't return with the map lock still held */
+		return KERN_RESOURCE_SHORTAGE;
+	}
 
-extern void vm_map_header_print(
-		struct vm_map_header	*header);
+	vm_map_set_page_shift(zap_map, VM_MAP_PAGE_SHIFT(map));
+	vm_map_disable_hole_optimization(zap_map);
 
-extern void vm_map_entry_print(
-		vm_map_entry_t		entry);
+	for (entry = vm_map_first_entry(map);
+	    entry != vm_map_to_entry(map);
+	    entry = next_entry) {
+		next_entry = entry->vme_next;
+
+		if (VME_OBJECT(entry) &&
+		    !entry->is_sub_map &&
+		    (VME_OBJECT(entry)->internal == TRUE) &&
+		    (VME_OBJECT(entry)->ref_count == 1)) {
+			*reclaimed_resident += VME_OBJECT(entry)->resident_page_count;
+			*reclaimed_compressed += vm_compressor_pager_get_count(VME_OBJECT(entry)->pager);
+
+			(void)vm_map_delete(map,
+			    entry->vme_start,
+			    entry->vme_end,
+			    VM_MAP_REMOVE_SAVE_ENTRIES,
+			    zap_map);
+		}
+	}
 
-extern void vm_follow_entry(
-		vm_map_entry_t		entry);
+	vm_map_unlock(map);
 
-extern void vm_follow_map(
-		vm_map_t		map);
+	/*
+	 * Get rid of the "zap_map" and all the map entries that
+	 * it may still contain.
+	 */
+	if (zap_map != VM_MAP_NULL) {
+		vm_map_destroy(zap_map, VM_MAP_REMOVE_NO_PMAP_CLEANUP);
+		zap_map = VM_MAP_NULL;
+	}
 
-/*
- *	vm_map_links_print:	[ debug ]
- */
-void
-vm_map_links_print(
-	struct vm_map_links	*links)
-{
-	iprintf("prev=0x%x, next=0x%x, start=0x%x, end=0x%x\n",
-		links->prev,
-		links->next,
-		links->start,
-		links->end);
+	return kr;
 }
 
-/*
- *	vm_map_header_print:	[ debug ]
- */
-void
-vm_map_header_print(
-	struct vm_map_header	*header)
-{
-	vm_map_links_print(&header->links);
-	iprintf("nentries=0x%x, %sentries_pageable\n",
-		header->nentries,
-		(header->entries_pageable ? "" : "!"));
-}
 
-/*
- *	vm_follow_entry:	[ debug ]
- */
-void
-vm_follow_entry(
-	vm_map_entry_t entry)
-{
-	extern int db_indent;
-	int shadows;
+#if DEVELOPMENT || DEBUG
 
-	iprintf("map entry 0x%x:\n", entry);
+int
+vm_map_disconnect_page_mappings(
+	vm_map_t map,
+	boolean_t do_unnest)
+{
+	vm_map_entry_t entry;
+	int     page_count = 0;
 
-	db_indent += 2;
+	if (do_unnest == TRUE) {
+#ifndef NO_NESTED_PMAP
+		vm_map_lock(map);
 
-	shadows = vm_follow_object(entry->object.vm_object);
-	iprintf("Total objects : %d\n",shadows);
+		for (entry = vm_map_first_entry(map);
+		    entry != vm_map_to_entry(map);
+		    entry = entry->vme_next) {
+			if (entry->is_sub_map && entry->use_pmap) {
+				/*
+				 * Make sure the range between the start of this entry and
+				 * the end of this entry is no longer nested, so that
+				 * we will only remove mappings from the pmap in use by this
+				 * this task
+				 */
+				vm_map_clip_unnest(map, entry, entry->vme_start, entry->vme_end);
+			}
+		}
+		vm_map_unlock(map);
+#endif
+	}
+	vm_map_lock_read(map);
 
-	db_indent -= 2;
-}
+	page_count = map->pmap->stats.resident_count;
 
-/*
- *	vm_map_entry_print:	[ debug ]
- */
-void
-vm_map_entry_print(
-	register vm_map_entry_t	entry)
-{
-	extern int db_indent;
-	static char *inheritance_name[4] = { "share", "copy", "none", "?"};
-	static char *behavior_name[4] = { "dflt", "rand", "seqtl", "rseqntl" };
-	
-	iprintf("map entry 0x%x:\n", entry);
-
-	db_indent += 2;
-
-	vm_map_links_print(&entry->links);
-
-	iprintf("start=0x%x, end=0x%x, prot=%x/%x/%s\n",
-		entry->vme_start,
-		entry->vme_end,
-		entry->protection,
-		entry->max_protection,
-		inheritance_name[(entry->inheritance & 0x3)]);
-
-	iprintf("behavior=%s, wired_count=%d, user_wired_count=%d\n",
-		behavior_name[(entry->behavior & 0x3)],
-		entry->wired_count,
-		entry->user_wired_count);
-	iprintf("%sin_transition, %sneeds_wakeup\n",
-		(entry->in_transition ? "" : "!"),
-		(entry->needs_wakeup ? "" : "!"));
+	for (entry = vm_map_first_entry(map);
+	    entry != vm_map_to_entry(map);
+	    entry = entry->vme_next) {
+		if (!entry->is_sub_map && ((VME_OBJECT(entry) == 0) ||
+		    (VME_OBJECT(entry)->phys_contiguous))) {
+			continue;
+		}
+		if (entry->is_sub_map) {
+			assert(!entry->use_pmap);
+		}
 
-	if (entry->is_sub_map) {
-		iprintf("submap=0x%x, offset=0x%x\n",
-		       entry->object.sub_map,
-		       entry->offset);
-	} else {
-		iprintf("object=0x%x, offset=0x%x, ",
-			entry->object.vm_object,
-			entry->offset);
-		printf("%sis_shared, %sneeds_copy\n",
-		       (entry->is_shared ? "" : "!"),
-		       (entry->needs_copy ? "" : "!"));
+		pmap_remove_options(map->pmap, entry->vme_start, entry->vme_end, 0);
 	}
+	vm_map_unlock_read(map);
 
-	db_indent -= 2;
+	return page_count;
 }
 
-/*
- *	vm_follow_map:	[ debug ]
- */
-void
-vm_follow_map(
-	vm_map_t map)
-{
-	register vm_map_entry_t	entry;
-	extern int db_indent;
+#endif
 
-	iprintf("task map 0x%x:\n", map);
 
-	db_indent += 2;
+#if CONFIG_FREEZE
 
-	for (entry = vm_map_first_entry(map);
-	     entry && entry != vm_map_to_entry(map);
-	     entry = entry->vme_next) {
-	    vm_follow_entry(entry);
-	}
 
-	db_indent -= 2;
-}
+int c_freezer_swapout_page_count;
+int c_freezer_compression_count = 0;
+AbsoluteTime c_freezer_last_yield_ts = 0;
 
-/*
- *	vm_map_print:	[ debug ]
- */
-void
-vm_map_print(
-	register vm_map_t	map)
+extern unsigned int memorystatus_freeze_private_shared_pages_ratio;
+extern unsigned int memorystatus_freeze_shared_mb_per_process_max;
+
+kern_return_t
+vm_map_freeze(
+	task_t       task,
+	unsigned int *purgeable_count,
+	unsigned int *wired_count,
+	unsigned int *clean_count,
+	unsigned int *dirty_count,
+	unsigned int dirty_budget,
+	unsigned int *shared_count,
+	int          *freezer_error_code,
+	boolean_t    eval_only)
 {
-	register vm_map_entry_t	entry;
-	extern int db_indent;
-	char *swstate;
+	vm_map_entry_t  entry2 = VM_MAP_ENTRY_NULL;
+	kern_return_t   kr = KERN_SUCCESS;
+	boolean_t       evaluation_phase = TRUE;
+	vm_object_t     cur_shared_object = NULL;
+	int             cur_shared_obj_ref_cnt = 0;
+	unsigned int    dirty_private_count = 0, dirty_shared_count = 0, obj_pages_snapshot = 0;
 
-	iprintf("task map 0x%x:\n", map);
+	*purgeable_count = *wired_count = *clean_count = *dirty_count = *shared_count = 0;
 
-	db_indent += 2;
+	/*
+	 * We need the exclusive lock here so that we can
+	 * block any page faults or lookups while we are
+	 * in the middle of freezing this vm map.
+	 */
+	vm_map_t map = task->map;
 
-	vm_map_header_print(&map->hdr);
+	vm_map_lock(map);
 
-	iprintf("pmap=0x%x, size=%d, ref=%d, hint=0x%x, first_free=0x%x\n",
-		map->pmap,
-		map->size,
-		map->ref_count,
-		map->hint,
-		map->first_free);
+	assert(VM_CONFIG_COMPRESSOR_IS_PRESENT);
 
-	iprintf("%swait_for_space, %swiring_required, timestamp=%d\n",
-		(map->wait_for_space ? "" : "!"),
-		(map->wiring_required ? "" : "!"),
-		map->timestamp);
+	if (vm_compressor_low_on_space() || vm_swap_low_on_space()) {
+		if (vm_compressor_low_on_space()) {
+			*freezer_error_code = FREEZER_ERROR_NO_COMPRESSOR_SPACE;
+		}
 
-#if	TASK_SWAPPER
-	switch (map->sw_state) {
-	    case MAP_SW_IN:
-		swstate = "SW_IN";
-		break;
-	    case MAP_SW_OUT:
-		swstate = "SW_OUT";
-		break;
-	    default:
-		swstate = "????";
-		break;
-	}
-	iprintf("res=%d, sw_state=%s\n", map->res_count, swstate);
-#endif	/* TASK_SWAPPER */
+		if (vm_swap_low_on_space()) {
+			*freezer_error_code = FREEZER_ERROR_NO_SWAP_SPACE;
+		}
 
-	for (entry = vm_map_first_entry(map);
-	     entry && entry != vm_map_to_entry(map);
-	     entry = entry->vme_next) {
-		vm_map_entry_print(entry);
+		kr = KERN_NO_SPACE;
+		goto done;
 	}
 
-	db_indent -= 2;
-}
+	if (VM_CONFIG_FREEZER_SWAP_IS_ACTIVE == FALSE) {
+		/*
+		 * In-memory compressor backing the freezer. No disk.
+		 * So no need to do the evaluation phase.
+		 */
+		evaluation_phase = FALSE;
 
-/*
- *	Routine:	vm_map_copy_print
- *	Purpose:
- *		Pretty-print a copy object for ddb.
- */
+		if (eval_only == TRUE) {
+			/*
+			 * We don't support 'eval_only' mode
+			 * in this non-swap config.
+			 */
+			*freezer_error_code = FREEZER_ERROR_GENERIC;
+			kr = KERN_INVALID_ARGUMENT;
+			goto done;
+		}
 
-void
-vm_map_copy_print(
-	vm_map_copy_t	copy)
-{
-	extern int db_indent;
-	int i, npages;
-	vm_map_entry_t entry;
+		c_freezer_compression_count = 0;
+		clock_get_uptime(&c_freezer_last_yield_ts);
+	}
+again:
 
-	printf("copy object 0x%x\n", copy);
+	for (entry2 = vm_map_first_entry(map);
+	    entry2 != vm_map_to_entry(map);
+	    entry2 = entry2->vme_next) {
+		vm_object_t     src_object = VME_OBJECT(entry2);
 
-	db_indent += 2;
+		if (src_object &&
+		    !entry2->is_sub_map &&
+		    !src_object->phys_contiguous) {
+			/* If eligible, scan the entry, moving eligible pages over to our parent object */
 
-	iprintf("type=%d", copy->type);
-	switch (copy->type) {
-		case VM_MAP_COPY_ENTRY_LIST:
-		printf("[entry_list]");
-		break;
-		
-		case VM_MAP_COPY_OBJECT:
-		printf("[object]");
-		break;
-		
-		case VM_MAP_COPY_KERNEL_BUFFER:
-		printf("[kernel_buffer]");
-		break;
+			if (src_object->internal == TRUE) {
+				if (VM_CONFIG_FREEZER_SWAP_IS_ACTIVE) {
+					/*
+					 * Volatile and empty purgeable objects are never paged out here.
+					 * The evaluation phase simply skips them. If we decide to freeze
+					 * this process, the task-owned ones are explicitly purged before
+					 * we go around again with 'evaluation_phase' set to FALSE.
+					 */
 
-		default:
-		printf("[bad type]");
-		break;
-	}
-	printf(", offset=0x%x", copy->offset);
-	printf(", size=0x%x\n", copy->size);
+					if ((src_object->purgable == VM_PURGABLE_EMPTY) || (src_object->purgable == VM_PURGABLE_VOLATILE)) {
+						/*
+						 * We want to purge objects that may not belong to this task but are mapped
+						 * in this task alone. Since we already purged this task's purgeable memory
+						 * at the end of a successful evaluation phase, we want to avoid doing no-op calls
+						 * on this task's purgeable objects. Hence the check for only volatile objects.
+						 */
+						if (evaluation_phase == FALSE &&
+						    (src_object->purgable == VM_PURGABLE_VOLATILE) &&
+						    (src_object->ref_count == 1)) {
+							vm_object_lock(src_object);
+							vm_object_purge(src_object, 0);
+							vm_object_unlock(src_object);
+						}
+						continue;
+					}
 
-	switch (copy->type) {
-		case VM_MAP_COPY_ENTRY_LIST:
-		vm_map_header_print(&copy->cpy_hdr);
-		for (entry = vm_map_copy_first_entry(copy);
-		     entry && entry != vm_map_copy_to_entry(copy);
-		     entry = entry->vme_next) {
-			vm_map_entry_print(entry);
-		}
-		break;
+					/*
+					 * Pages belonging to this object could be swapped to disk.
+					 * Make sure it's not a shared object because we could end
+					 * up just bringing it back in again.
+					 *
+					 * We try to optimize somewhat by checking for objects that are mapped
+					 * more than once within our own map. But we don't do full searches,
+					 * we just look at the entries following our current entry.
+					 */
 
-		case VM_MAP_COPY_OBJECT:
-		iprintf("object=0x%x\n", copy->cpy_object);
-		break;
+					if (src_object->ref_count > 1) {
+						if (src_object != cur_shared_object) {
+							obj_pages_snapshot = (src_object->resident_page_count - src_object->wired_page_count) + vm_compressor_pager_get_count(src_object->pager);
+							dirty_shared_count += obj_pages_snapshot;
+
+							cur_shared_object = src_object;
+							cur_shared_obj_ref_cnt = 1;
+							continue;
+						} else {
+							cur_shared_obj_ref_cnt++;
+							if (src_object->ref_count == cur_shared_obj_ref_cnt) {
+								/*
+								 * Fall through to below and treat this object as private.
+								 * So deduct its pages from our shared total and add it to the
+								 * private total.
+								 */
+
+								dirty_shared_count -= obj_pages_snapshot;
+								dirty_private_count += obj_pages_snapshot;
+							} else {
+								continue;
+							}
+						}
+					}
 
-		case VM_MAP_COPY_KERNEL_BUFFER:
-		iprintf("kernel buffer=0x%x", copy->cpy_kdata);
-		printf(", kalloc_size=0x%x\n", copy->cpy_kalloc_size);
-		break;
 
-	}
+					if (src_object->ref_count == 1) {
+						dirty_private_count += (src_object->resident_page_count - src_object->wired_page_count) + vm_compressor_pager_get_count(src_object->pager);
+					}
 
-	db_indent -=2;
-}
+					if (evaluation_phase == TRUE) {
+						continue;
+					}
+				}
 
-/*
- *	db_vm_map_total_size(map)	[ debug ]
- *
- *	return the total virtual size (in bytes) of the map
- */
-vm_size_t
-db_vm_map_total_size(
-	vm_map_t	map)
-{
-	vm_map_entry_t	entry;
-	vm_size_t	total;
+				uint32_t paged_out_count = vm_object_compressed_freezer_pageout(src_object, dirty_budget);
+				*wired_count += src_object->wired_page_count;
 
-	total = 0;
-	for (entry = vm_map_first_entry(map);
-	     entry != vm_map_to_entry(map);
-	     entry = entry->vme_next) {
-		total += entry->vme_end - entry->vme_start;
+				if (vm_compressor_low_on_space() || vm_swap_low_on_space()) {
+					if (vm_compressor_low_on_space()) {
+						*freezer_error_code = FREEZER_ERROR_NO_COMPRESSOR_SPACE;
+					}
+
+					if (vm_swap_low_on_space()) {
+						*freezer_error_code = FREEZER_ERROR_NO_SWAP_SPACE;
+					}
+
+					kr = KERN_NO_SPACE;
+					break;
+				}
+				if (paged_out_count >= dirty_budget) {
+					break;
+				}
+				dirty_budget -= paged_out_count;
+			}
+		}
 	}
 
-	return total;
-}
+	if (evaluation_phase) {
+		unsigned int shared_pages_threshold = (memorystatus_freeze_shared_mb_per_process_max * 1024 * 1024ULL) / PAGE_SIZE_64;
 
-#endif	/* MACH_KDB */
+		if (dirty_shared_count > shared_pages_threshold) {
+			*freezer_error_code = FREEZER_ERROR_EXCESS_SHARED_MEMORY;
+			kr = KERN_FAILURE;
+			goto done;
+		}
 
-/*
- *	Routine:	vm_map_entry_insert
- *
- *	Descritpion:	This routine inserts a new vm_entry in a locked map.
- */
-vm_map_entry_t
-vm_map_entry_insert(
-	vm_map_t		map,
-	vm_map_entry_t		insp_entry,
-	vm_offset_t		start,
-	vm_offset_t		end,
-	vm_object_t		object,
-	vm_object_offset_t	offset,
-	boolean_t		needs_copy,
-	boolean_t		is_shared,
-	boolean_t		in_transition,
-	vm_prot_t		cur_protection,
-	vm_prot_t		max_protection,
-	vm_behavior_t		behavior,
-	vm_inherit_t		inheritance,
-	unsigned		wired_count)
-{
-	vm_map_entry_t	new_entry;
+		if (dirty_shared_count &&
+		    ((dirty_private_count / dirty_shared_count) < memorystatus_freeze_private_shared_pages_ratio)) {
+			*freezer_error_code = FREEZER_ERROR_LOW_PRIVATE_SHARED_RATIO;
+			kr = KERN_FAILURE;
+			goto done;
+		}
 
-	assert(insp_entry != (vm_map_entry_t)0);
+		evaluation_phase = FALSE;
+		dirty_shared_count = dirty_private_count = 0;
 
-	new_entry = vm_map_entry_create(map);
+		c_freezer_compression_count = 0;
+		clock_get_uptime(&c_freezer_last_yield_ts);
 
-	new_entry->vme_start = start;
-	new_entry->vme_end = end;
-	assert(page_aligned(new_entry->vme_start));
-	assert(page_aligned(new_entry->vme_end));
+		if (eval_only) {
+			kr = KERN_SUCCESS;
+			goto done;
+		}
 
-	new_entry->object.vm_object = object;
-	new_entry->offset = offset;
-	new_entry->is_shared = is_shared;
-	new_entry->is_sub_map = FALSE;
-	new_entry->needs_copy = needs_copy;
-	new_entry->in_transition = in_transition;
-	new_entry->needs_wakeup = FALSE;
-	new_entry->inheritance = inheritance;
-	new_entry->protection = cur_protection;
-	new_entry->max_protection = max_protection;
-	new_entry->behavior = behavior;
-	new_entry->wired_count = wired_count;
-	new_entry->user_wired_count = 0;
-	new_entry->use_pmap = FALSE;
+		vm_purgeable_purge_task_owned(task);
 
-	/*
-	 *	Insert the new entry into the list.
-	 */
+		goto again;
+	} else {
+		kr = KERN_SUCCESS;
+		*shared_count = (unsigned int) ((dirty_shared_count * PAGE_SIZE_64) / (1024 * 1024ULL));
+	}
 
-	vm_map_entry_link(map, insp_entry, new_entry);
-	map->size += end - start;
+done:
+	vm_map_unlock(map);
 
-	/*
-	 *	Update the free space hint and the lookup hint.
-	 */
+	if ((eval_only == FALSE) && (kr == KERN_SUCCESS)) {
+		vm_object_compressed_freezer_done();
 
-	SAVE_HINT(map, new_entry);
-	return new_entry;
+		if (VM_CONFIG_FREEZER_SWAP_IS_ACTIVE) {
+			/*
+			 * reset the counter tracking the # of swapped compressed pages
+			 * because we are now done with this freeze session and task.
+			 */
+
+			*dirty_count = c_freezer_swapout_page_count; //used to track pageouts
+			c_freezer_swapout_page_count = 0;
+		}
+	}
+	return kr;
 }
 
+#endif
+
 /*
- *	Routine:	vm_remap_extract
+ * vm_map_entry_should_cow_for_true_share:
  *
- *	Descritpion:	This routine returns a vm_entry list from a map.
+ * Determines if the map entry should be clipped and setup for copy-on-write
+ * to avoid applying "true_share" to a large VM object when only a subset is
+ * targeted.
+ *
+ * For now, we target only the map entries created for the Objective C
+ * Garbage Collector or a "MALLOC_SMALL" heap, which have these properties:
+ *      - alias == VM_MEMORY_MALLOC or VM_MEMORY_MALLOC_SMALL
+ *      - wired_count == 0
+ *      - !needs_copy
+ * and a VM object with:
+ *      - internal
+ *      - copy_strategy == MEMORY_OBJECT_COPY_SYMMETRIC
+ *      - !true_share
+ *      - vo_size == ANON_CHUNK_SIZE (2048 * 4096 for MALLOC_SMALL)
+ *
+ * Only non-kernel map entries.
  */
-kern_return_t
-vm_remap_extract(
-	vm_map_t		map,
-	vm_offset_t		addr,
-	vm_size_t		size,
-	boolean_t		copy,
-	struct vm_map_header	*map_header,
-	vm_prot_t		*cur_protection,
-	vm_prot_t		*max_protection,
-	/* What, no behavior? */
-	vm_inherit_t		inheritance,
-	boolean_t		pageable)
-{
-	kern_return_t		result;
-	vm_size_t		mapped_size;
-	vm_size_t		tmp_size;
-	vm_map_entry_t		src_entry;     /* result of last map lookup */
-	vm_map_entry_t		new_entry;
-	vm_object_offset_t	offset;
-	vm_offset_t		map_address;
-	vm_offset_t		src_start;     /* start of entry to map */
-	vm_offset_t		src_end;       /* end of region to be mapped */
-	vm_object_t		object;    
-	vm_map_version_t	version;
-	boolean_t		src_needs_copy;
-	boolean_t		new_entry_needs_copy;
-
-	assert(map != VM_MAP_NULL);
-	assert(size != 0 && size == round_page(size));
-	assert(inheritance == VM_INHERIT_NONE ||
-	       inheritance == VM_INHERIT_COPY ||
-	       inheritance == VM_INHERIT_SHARE);
-
-	/*
-	 *	Compute start and end of region.
-	 */
-	src_start = trunc_page(addr);
-	src_end = round_page(src_start + size);
-
-	/*
-	 *	Initialize map_header.
-	 */
-	map_header->links.next = (struct vm_map_entry *)&map_header->links;
-	map_header->links.prev = (struct vm_map_entry *)&map_header->links;
-	map_header->nentries = 0;
-	map_header->entries_pageable = pageable;
+boolean_t
+vm_map_entry_should_cow_for_true_share(
+	vm_map_entry_t  entry)
+{
+	vm_object_t     object;
 
-	*cur_protection = VM_PROT_ALL;
-	*max_protection = VM_PROT_ALL;
+	if (entry->is_sub_map) {
+		/* entry does not point at a VM object */
+		return FALSE;
+	}
 
-	map_address = 0;
-	mapped_size = 0;
-	result = KERN_SUCCESS;
+	if (entry->needs_copy) {
+		/* already set for copy_on_write: done! */
+		return FALSE;
+	}
 
-	/*  
-	 *	The specified source virtual space might correspond to
-	 *	multiple map entries, need to loop on them.
-	 */
-	vm_map_lock(map);
-	while (mapped_size != size) {
-		vm_size_t	entry_size;
+	if (VME_ALIAS(entry) != VM_MEMORY_MALLOC &&
+	    VME_ALIAS(entry) != VM_MEMORY_MALLOC_SMALL) {
+		/* not a malloc heap or Obj-C Garbage Collector heap */
+		return FALSE;
+	}
 
-		/*
-		 *	Find the beginning of the region.
-		 */ 
-		if (! vm_map_lookup_entry(map, src_start, &src_entry)) {
-			result = KERN_INVALID_ADDRESS;
-			break;
-		}
+	if (entry->wired_count) {
+		/* wired: can't change the map entry... */
+		vm_counters.should_cow_but_wired++;
+		return FALSE;
+	}
 
-		if (src_start < src_entry->vme_start ||
-		    (mapped_size && src_start != src_entry->vme_start)) {
-			result = KERN_INVALID_ADDRESS;
-			break;
-		}
+	object = VME_OBJECT(entry);
 
-		if(src_entry->is_sub_map) {
-			result = KERN_INVALID_ADDRESS;
-			break;
-		}
+	if (object == VM_OBJECT_NULL) {
+		/* no object yet... */
+		return FALSE;
+	}
 
-		tmp_size = size - mapped_size;
-		if (src_end > src_entry->vme_end)
-			tmp_size -= (src_end - src_entry->vme_end);
+	if (!object->internal) {
+		/* not an internal object */
+		return FALSE;
+	}
 
-		entry_size = (vm_size_t)(src_entry->vme_end -
-					 src_entry->vme_start);
+	if (object->copy_strategy != MEMORY_OBJECT_COPY_SYMMETRIC) {
+		/* not the default copy strategy */
+		return FALSE;
+	}
 
-		if(src_entry->is_sub_map) {
-			vm_map_reference(src_entry->object.sub_map);
-		} else {
-			object = src_entry->object.vm_object;
+	if (object->true_share) {
+		/* already true_share: too late to avoid it */
+		return FALSE;
+	}
 
-			if (object == VM_OBJECT_NULL) {
-				object = vm_object_allocate(entry_size);
-				src_entry->offset = 0;
-				src_entry->object.vm_object = object;
-			} else if (object->copy_strategy !=
-				   MEMORY_OBJECT_COPY_SYMMETRIC) {
-				/*
-				 *	We are already using an asymmetric
-				 *	copy, and therefore we already have
-				 *	the right object.
-				 */
-				assert(!src_entry->needs_copy);
-			} else if (src_entry->needs_copy || object->shadowed ||
-				   (object->internal && !object->true_share &&
-				   !src_entry->is_shared &&
-				    object->size > entry_size)) {
+	if (VME_ALIAS(entry) == VM_MEMORY_MALLOC &&
+	    object->vo_size != ANON_CHUNK_SIZE) {
+		/* ... not an object created for the ObjC Garbage Collector */
+		return FALSE;
+	}
 
-				vm_object_shadow(&src_entry->object.vm_object,
-						 &src_entry->offset,
-						 entry_size);
+	if (VME_ALIAS(entry) == VM_MEMORY_MALLOC_SMALL &&
+	    object->vo_size != 2048 * 4096) {
+		/* ... not a "MALLOC_SMALL" heap */
+		return FALSE;
+	}
 
-				if (!src_entry->needs_copy &&
-				    (src_entry->protection & VM_PROT_WRITE)) {
-					pmap_protect(vm_map_pmap(map),
-					     src_entry->vme_start,
-					     src_entry->vme_end,
-					     src_entry->protection &
-						     ~VM_PROT_WRITE);
-				}
+	/*
+	 * All the criteria match: we have a large object being targeted for "true_share".
+	 * To limit the adverse side-effects linked with "true_share", tell the caller to
+	 * try and avoid setting up the entire object for "true_share" by clipping the
+	 * targeted range and setting it up for copy-on-write.
+	 */
+	return TRUE;
+}
 
-				object = src_entry->object.vm_object;
-				src_entry->needs_copy = FALSE;
-			}
+vm_map_offset_t
+vm_map_round_page_mask(
+	vm_map_offset_t offset,
+	vm_map_offset_t mask)
+{
+	return VM_MAP_ROUND_PAGE(offset, mask);
+}
 
+vm_map_offset_t
+vm_map_trunc_page_mask(
+	vm_map_offset_t offset,
+	vm_map_offset_t mask)
+{
+	return VM_MAP_TRUNC_PAGE(offset, mask);
+}
 
-			vm_object_lock(object);
-			object->ref_count++;	/* object ref. for new entry */
-			VM_OBJ_RES_INCR(object);
-			if (object->copy_strategy == 
-					MEMORY_OBJECT_COPY_SYMMETRIC) {
-				object->copy_strategy = 
-					MEMORY_OBJECT_COPY_DELAY;
-			}
-			vm_object_unlock(object);
-		}
+boolean_t
+vm_map_page_aligned(
+	vm_map_offset_t offset,
+	vm_map_offset_t mask)
+{
+	return ((offset) & mask) == 0;
+}
 
-		offset = src_entry->offset + (src_start - src_entry->vme_start);
+int
+vm_map_page_shift(
+	vm_map_t map)
+{
+	return VM_MAP_PAGE_SHIFT(map);
+}
 
-		new_entry = _vm_map_entry_create(map_header);
-		vm_map_entry_copy(new_entry, src_entry);
-		new_entry->use_pmap = FALSE; /* clr address space specifics */
+int
+vm_map_page_size(
+	vm_map_t map)
+{
+	return VM_MAP_PAGE_SIZE(map);
+}
 
-		new_entry->vme_start = map_address;
-		new_entry->vme_end = map_address + tmp_size;
-		new_entry->inheritance = inheritance;
-		new_entry->offset = offset;
+vm_map_offset_t
+vm_map_page_mask(
+	vm_map_t map)
+{
+	return VM_MAP_PAGE_MASK(map);
+}
 
-		/*
-		 * The new region has to be copied now if required.
-		 */
-	RestartCopy:
-		if (!copy) {
-			src_entry->is_shared = TRUE;
-			new_entry->is_shared = TRUE;
-			if (!(new_entry->is_sub_map)) 
-				new_entry->needs_copy = FALSE;
+kern_return_t
+vm_map_set_page_shift(
+	vm_map_t        map,
+	int             pageshift)
+{
+	if (map->hdr.nentries != 0) {
+		/* too late to change page size */
+		return KERN_FAILURE;
+	}
 
-		} else if (src_entry->is_sub_map) {
-			/* make this a COW sub_map if not already */
-			new_entry->needs_copy = TRUE;
-		} else if (src_entry->wired_count == 0 &&
-			 vm_object_copy_quickly(&new_entry->object.vm_object,
-						new_entry->offset,
-						(new_entry->vme_end -
-						    new_entry->vme_start),
-						&src_needs_copy,
-						&new_entry_needs_copy)) {
+	map->hdr.page_shift = pageshift;
 
-			new_entry->needs_copy = new_entry_needs_copy;
-			new_entry->is_shared = FALSE;
+	return KERN_SUCCESS;
+}
 
-			/*
-			 * Handle copy_on_write semantics.
-			 */
-			if (src_needs_copy && !src_entry->needs_copy) {
-				vm_object_pmap_protect(object,
-						       offset,
-						       entry_size,
-						       (src_entry->is_shared ?
-							PMAP_NULL : map->pmap),
-						       src_entry->vme_start,
-						       src_entry->protection &
-						       ~VM_PROT_WRITE);
+kern_return_t
+vm_map_query_volatile(
+	vm_map_t        map,
+	mach_vm_size_t  *volatile_virtual_size_p,
+	mach_vm_size_t  *volatile_resident_size_p,
+	mach_vm_size_t  *volatile_compressed_size_p,
+	mach_vm_size_t  *volatile_pmap_size_p,
+	mach_vm_size_t  *volatile_compressed_pmap_size_p)
+{
+	mach_vm_size_t  volatile_virtual_size;
+	mach_vm_size_t  volatile_resident_count;
+	mach_vm_size_t  volatile_compressed_count;
+	mach_vm_size_t  volatile_pmap_count;
+	mach_vm_size_t  volatile_compressed_pmap_count;
+	mach_vm_size_t  resident_count;
+	vm_map_entry_t  entry;
+	vm_object_t     object;
+
+	/* map should be locked by caller */
+
+	volatile_virtual_size = 0;
+	volatile_resident_count = 0;
+	volatile_compressed_count = 0;
+	volatile_pmap_count = 0;
+	volatile_compressed_pmap_count = 0;
 
-				src_entry->needs_copy = TRUE;
-			}
+	for (entry = vm_map_first_entry(map);
+	    entry != vm_map_to_entry(map);
+	    entry = entry->vme_next) {
+		mach_vm_size_t  pmap_resident_bytes, pmap_compressed_bytes;
+
+		if (entry->is_sub_map) {
+			continue;
+		}
+		if (!(entry->protection & VM_PROT_WRITE)) {
+			continue;
+		}
+		object = VME_OBJECT(entry);
+		if (object == VM_OBJECT_NULL) {
+			continue;
+		}
+		if (object->purgable != VM_PURGABLE_VOLATILE &&
+		    object->purgable != VM_PURGABLE_EMPTY) {
+			continue;
+		}
+		if (VME_OFFSET(entry)) {
 			/*
-			 * Throw away the old object reference of the new entry.
+			 * If the map entry has been split and the object now
+			 * appears several times in the VM map, we don't want
+			 * to count the object's resident_page_count more than
+			 * once.  We count it only for the first one, starting
+			 * at offset 0 and ignore the other VM map entries.
 			 */
-			vm_object_deallocate(object);
-
+			continue;
+		}
+		resident_count = object->resident_page_count;
+		if ((VME_OFFSET(entry) / PAGE_SIZE) >= resident_count) {
+			resident_count = 0;
 		} else {
-			new_entry->is_shared = FALSE;
+			resident_count -= (VME_OFFSET(entry) / PAGE_SIZE);
+		}
 
-			/*
-			 * The map can be safely unlocked since we
-			 * already hold a reference on the object.
-			 *
-			 * Record the timestamp of the map for later
-			 * verification, and unlock the map.
-			 */
-			version.main_timestamp = map->timestamp;
-			vm_map_unlock(map);
+		volatile_virtual_size += entry->vme_end - entry->vme_start;
+		volatile_resident_count += resident_count;
+		if (object->pager) {
+			volatile_compressed_count +=
+			    vm_compressor_pager_get_count(object->pager);
+		}
+		pmap_compressed_bytes = 0;
+		pmap_resident_bytes =
+		    pmap_query_resident(map->pmap,
+		    entry->vme_start,
+		    entry->vme_end,
+		    &pmap_compressed_bytes);
+		volatile_pmap_count += (pmap_resident_bytes / PAGE_SIZE);
+		volatile_compressed_pmap_count += (pmap_compressed_bytes
+		    / PAGE_SIZE);
+	}
 
-			/*
-			 * Perform the copy.
-			 */
-			if (src_entry->wired_count > 0) {
-				vm_object_lock(object);
-				result = vm_object_copy_slowly(
-						object,
-						offset,
-						entry_size,
-						THREAD_UNINT,
-						&new_entry->object.vm_object);
+	/* map is still locked on return */
 
-				new_entry->offset = 0;
-				new_entry->needs_copy = FALSE;
-			} else {
-				result = vm_object_copy_strategically(
-						object,
-						offset,
-						entry_size,
-						&new_entry->object.vm_object,
-						&new_entry->offset,
-						&new_entry_needs_copy);
+	*volatile_virtual_size_p = volatile_virtual_size;
+	*volatile_resident_size_p = volatile_resident_count * PAGE_SIZE;
+	*volatile_compressed_size_p = volatile_compressed_count * PAGE_SIZE;
+	*volatile_pmap_size_p = volatile_pmap_count * PAGE_SIZE;
+	*volatile_compressed_pmap_size_p = volatile_compressed_pmap_count * PAGE_SIZE;
 
-				new_entry->needs_copy = new_entry_needs_copy;
-			}
+	return KERN_SUCCESS;
+}
 
-			/*
-			 * Throw away the old object reference of the new entry.
-			 */
-			vm_object_deallocate(object);
+void
+vm_map_sizes(vm_map_t map,
+    vm_map_size_t * psize,
+    vm_map_size_t * pfree,
+    vm_map_size_t * plargest_free)
+{
+	vm_map_entry_t  entry;
+	vm_map_offset_t prev;
+	vm_map_size_t   free, total_free, largest_free;
+	boolean_t       end;
 
-			if (result != KERN_SUCCESS &&
-			    result != KERN_MEMORY_RESTART_COPY) {
-				_vm_map_entry_dispose(map_header, new_entry);
-				break;
-			}
+	if (!map) {
+		*psize = *pfree = *plargest_free = 0;
+		return;
+	}
+	total_free = largest_free = 0;
 
-			/*
-			 * Verify that the map has not substantially
-			 * changed while the copy was being made.
-			 */
+	vm_map_lock_read(map);
+	if (psize) {
+		*psize = map->max_offset - map->min_offset;
+	}
 
-			vm_map_lock(map);	/* Increments timestamp once! */
-			if (version.main_timestamp + 1 != map->timestamp) {
-				/*
-				 * Simple version comparison failed.
-				 *
-				 * Retry the lookup and verify that the
-				 * same object/offset are still present.
-				 */
-				vm_object_deallocate(new_entry->
-						     object.vm_object);
-				_vm_map_entry_dispose(map_header, new_entry);
-				if (result == KERN_MEMORY_RESTART_COPY)
-					result = KERN_SUCCESS;
-				continue;
-			}
+	prev = map->min_offset;
+	for (entry = vm_map_first_entry(map);; entry = entry->vme_next) {
+		end = (entry == vm_map_to_entry(map));
 
-			if (result == KERN_MEMORY_RESTART_COPY) {
-				vm_object_reference(object);
-				goto RestartCopy;
-			}
+		if (end) {
+			free = entry->vme_end   - prev;
+		} else {
+			free = entry->vme_start - prev;
 		}
 
-		_vm_map_entry_link(map_header,
-				   map_header->links.prev, new_entry);
+		total_free += free;
+		if (free > largest_free) {
+			largest_free = free;
+		}
 
-		*cur_protection &= src_entry->protection;
-		*max_protection &= src_entry->max_protection;
+		if (end) {
+			break;
+		}
+		prev = entry->vme_end;
+	}
+	vm_map_unlock_read(map);
+	if (pfree) {
+		*pfree = total_free;
+	}
+	if (plargest_free) {
+		*plargest_free = largest_free;
+	}
+}
 
-		map_address += tmp_size;
-		mapped_size += tmp_size;
-		src_start += tmp_size;
+#if VM_SCAN_FOR_SHADOW_CHAIN
+int vm_map_shadow_max(vm_map_t map);
+int
+vm_map_shadow_max(
+	vm_map_t map)
+{
+	int             shadows, shadows_max;
+	vm_map_entry_t  entry;
+	vm_object_t     object, next_object;
 
-	} /* end while */
+	if (map == NULL) {
+		return 0;
+	}
 
-	vm_map_unlock(map);
-	if (result != KERN_SUCCESS) {
-		/*
-		 * Free all allocated elements.
-		 */
-		for (src_entry = map_header->links.next;
-		     src_entry != (struct vm_map_entry *)&map_header->links;
-		     src_entry = new_entry) {
-			new_entry = src_entry->vme_next;
-			_vm_map_entry_unlink(map_header, src_entry);
-			vm_object_deallocate(src_entry->object.vm_object);
-			_vm_map_entry_dispose(map_header, src_entry);
+	shadows_max = 0;
+
+	vm_map_lock_read(map);
+
+	for (entry = vm_map_first_entry(map);
+	    entry != vm_map_to_entry(map);
+	    entry = entry->vme_next) {
+		if (entry->is_sub_map) {
+			continue;
+		}
+		object = VME_OBJECT(entry);
+		if (object == NULL) {
+			continue;
+		}
+		vm_object_lock_shared(object);
+		for (shadows = 0;
+		    object->shadow != NULL;
+		    shadows++, object = next_object) {
+			next_object = object->shadow;
+			vm_object_lock_shared(next_object);
+			vm_object_unlock(object);
+		}
+		vm_object_unlock(object);
+		if (shadows > shadows_max) {
+			shadows_max = shadows;
 		}
 	}
-	return result;
+
+	vm_map_unlock_read(map);
+
+	return shadows_max;
 }
+#endif /* VM_SCAN_FOR_SHADOW_CHAIN */
 
-/*
- *	Routine:	vm_remap
- *
- *			Map portion of a task's address space.
- *			Mapped region must not overlap more than
- *			one vm memory object. Protections and
- *			inheritance attributes remain the same
- *			as in the original task and are	out parameters.
- *			Source and Target task can be identical
- *			Other attributes are identical as for vm_map()
- */
-kern_return_t
-vm_remap(
-	vm_map_t		target_map,
-	vm_offset_t		*address,
-	vm_size_t		size,
-	vm_offset_t		mask,
-	boolean_t		anywhere,
-	vm_map_t		src_map,
-	vm_offset_t		memory_address,
-	boolean_t		copy,
-	vm_prot_t		*cur_protection,
-	vm_prot_t		*max_protection,
-	vm_inherit_t		inheritance)
-{
-	kern_return_t		result;
-	vm_map_entry_t		entry;
-	vm_map_entry_t		insp_entry;
-	vm_map_entry_t		new_entry;
-	struct vm_map_header	map_header;
-
-	if (target_map == VM_MAP_NULL)
-		return KERN_INVALID_ARGUMENT;
+void
+vm_commit_pagezero_status(vm_map_t lmap)
+{
+	pmap_advise_pagezero_range(lmap->pmap, lmap->min_offset);
+}
 
-	switch (inheritance) {
-	    case VM_INHERIT_NONE:
-	    case VM_INHERIT_COPY:
-	    case VM_INHERIT_SHARE:
-		if (size != 0 && src_map != VM_MAP_NULL)
-			break;
-		/*FALL THRU*/
-	    default:
-		return KERN_INVALID_ARGUMENT;
-	}
+#if !CONFIG_EMBEDDED
+void
+vm_map_set_high_start(
+	vm_map_t        map,
+	vm_map_offset_t high_start)
+{
+	map->vmmap_high_start = high_start;
+}
+#endif
 
-	size = round_page(size);
+#if PMAP_CS
+kern_return_t
+vm_map_entry_cs_associate(
+	vm_map_t                map,
+	vm_map_entry_t          entry,
+	vm_map_kernel_flags_t   vmk_flags)
+{
+	vm_object_t cs_object, cs_shadow;
+	vm_object_offset_t cs_offset;
+	void *cs_blobs;
+	struct vnode *cs_vnode;
+	kern_return_t cs_ret;
+
+	if (map->pmap == NULL ||
+	    entry->is_sub_map || /* XXX FBDP: recurse on sub-range? */
+	    VME_OBJECT(entry) == VM_OBJECT_NULL ||
+	    !(entry->protection & VM_PROT_EXECUTE)) {
+		return KERN_SUCCESS;
+	}
 
-	result = vm_remap_extract(src_map, memory_address,
-				  size, copy, &map_header,
-				  cur_protection,
-				  max_protection,
-				  inheritance,
-				  target_map->hdr.
-				  entries_pageable);
+	vm_map_lock_assert_exclusive(map);
 
-	if (result != KERN_SUCCESS) {
-		return result;
+	if (entry->used_for_jit) {
+		cs_ret = pmap_cs_associate(map->pmap,
+		    PMAP_CS_ASSOCIATE_JIT,
+		    entry->vme_start,
+		    entry->vme_end - entry->vme_start);
+		goto done;
 	}
 
-	/*
-	 * Allocate/check a range of free virtual address
-	 * space for the target
-	 */
-	*address = trunc_page(*address);
-	vm_map_lock(target_map);
-	result = vm_remap_range_allocate(target_map, address, size,
-					 mask, anywhere, &insp_entry);
+	if (vmk_flags.vmkf_remap_prot_copy) {
+		cs_ret = pmap_cs_associate(map->pmap,
+		    PMAP_CS_ASSOCIATE_COW,
+		    entry->vme_start,
+		    entry->vme_end - entry->vme_start);
+		goto done;
+	}
 
-	for (entry = map_header.links.next;
-	     entry != (struct vm_map_entry *)&map_header.links;
-	     entry = new_entry) {
-		new_entry = entry->vme_next;
-		_vm_map_entry_unlink(&map_header, entry);
-		if (result == KERN_SUCCESS) {
-			entry->vme_start += *address;
-			entry->vme_end += *address;
-			vm_map_entry_link(target_map, insp_entry, entry);
-			insp_entry = entry;
-		} else {
-			if (!entry->is_sub_map) {
-				vm_object_deallocate(entry->object.vm_object);
-			} else {
-				vm_map_deallocate(entry->object.sub_map);
-			   }
-			_vm_map_entry_dispose(&map_header, entry);
+	vm_object_lock_shared(VME_OBJECT(entry));
+	cs_offset = VME_OFFSET(entry);
+	for (cs_object = VME_OBJECT(entry);
+	    (cs_object != VM_OBJECT_NULL &&
+	    !cs_object->code_signed);
+	    cs_object = cs_shadow) {
+		cs_shadow = cs_object->shadow;
+		if (cs_shadow != VM_OBJECT_NULL) {
+			cs_offset += cs_object->vo_shadow_offset;
+			vm_object_lock_shared(cs_shadow);
 		}
+		vm_object_unlock(cs_object);
+	}
+	if (cs_object == VM_OBJECT_NULL) {
+		return KERN_SUCCESS;
 	}
 
-	if (result == KERN_SUCCESS) {
-		target_map->size += size;
-		SAVE_HINT(target_map, insp_entry);
+	cs_offset += cs_object->paging_offset;
+	cs_vnode = vnode_pager_lookup_vnode(cs_object->pager);
+	cs_ret = vnode_pager_get_cs_blobs(cs_vnode,
+	    &cs_blobs);
+	assert(cs_ret == KERN_SUCCESS);
+	cs_ret = cs_associate_blob_with_mapping(map->pmap,
+	    entry->vme_start,
+	    (entry->vme_end -
+	    entry->vme_start),
+	    cs_offset,
+	    cs_blobs);
+	vm_object_unlock(cs_object);
+	cs_object = VM_OBJECT_NULL;
+
+done:
+	if (cs_ret == KERN_SUCCESS) {
+		DTRACE_VM2(vm_map_entry_cs_associate_success,
+		    vm_map_offset_t, entry->vme_start,
+		    vm_map_offset_t, entry->vme_end);
+		if (vm_map_executable_immutable) {
+			/*
+			 * Prevent this executable
+			 * mapping from being unmapped
+			 * or modified.
+			 */
+			entry->permanent = TRUE;
+		}
+		/*
+		 * pmap says it will validate the
+		 * code-signing validity of pages
+		 * faulted in via this mapping, so
+		 * this map entry should be marked so
+		 * that vm_fault() bypasses code-signing
+		 * validation for faults coming through
+		 * this mapping.
+		 */
+		entry->pmap_cs_associated = TRUE;
+	} else if (cs_ret == KERN_NOT_SUPPORTED) {
+		/*
+		 * pmap won't check the code-signing
+		 * validity of pages faulted in via
+		 * this mapping, so VM should keep
+		 * doing it.
+		 */
+		DTRACE_VM3(vm_map_entry_cs_associate_off,
+		    vm_map_offset_t, entry->vme_start,
+		    vm_map_offset_t, entry->vme_end,
+		    int, cs_ret);
+	} else {
+		/*
+		 * A real error: do not allow
+		 * execution in this mapping.
+		 */
+		DTRACE_VM3(vm_map_entry_cs_associate_failure,
+		    vm_map_offset_t, entry->vme_start,
+		    vm_map_offset_t, entry->vme_end,
+		    int, cs_ret);
+		entry->protection &= ~VM_PROT_EXECUTE;
+		entry->max_protection &= ~VM_PROT_EXECUTE;
 	}
-	vm_map_unlock(target_map);
 
-	if (result == KERN_SUCCESS && target_map->wiring_required)
-		result = vm_map_wire(target_map, *address,
-				     *address + size, *cur_protection, TRUE);
-	return result;
+	return cs_ret;
 }
+#endif /* PMAP_CS */
 
 /*
- *	Routine:	vm_remap_range_allocate
+ * FORKED CORPSE FOOTPRINT
  *
- *	Description:
- *		Allocate a range in the specified virtual address map.
- *		returns the address and the map entry just before the allocated
- *		range
+ * A forked corpse gets a copy of the original VM map but its pmap is mostly
+ * empty since it never ran and never got to fault in any pages.
+ * Collecting footprint info (via "sysctl vm.self_region_footprint") for
+ * a forked corpse would therefore return very little information.
  *
- *	Map must be locked.
+ * When forking a corpse, we can pass the VM_MAP_FORK_CORPSE_FOOTPRINT option
+ * to vm_map_fork() to collect footprint information from the original VM map
+ * and its pmap, and store it in the forked corpse's VM map.  That information
+ * is stored in place of the VM map's "hole list" since we'll never need to
+ * look up holes in the corpse's map.
+ *
+ * The corpse's footprint info looks like this:
+ *
+ * vm_map->vmmap_corpse_footprint points to pageable kernel memory laid out
+ * as follows:
+ *                     +---------------------------------------+
+ *            header-> | cf_size                               |
+ *                     +-------------------+-------------------+
+ *                     | cf_last_region    | cf_last_zeroes    |
+ *                     +-------------------+-------------------+
+ *           region1-> | cfr_vaddr                             |
+ *                     +-------------------+-------------------+
+ *                     | cfr_num_pages     | d0 | d1 | d2 | d3 |
+ *                     +---------------------------------------+
+ *                     | d4 | d5 | ...                         |
+ *                     +---------------------------------------+
+ *                     | ...                                   |
+ *                     +-------------------+-------------------+
+ *                     | dy | dz | na | na | cfr_vaddr...      | <-region2
+ *                     +-------------------+-------------------+
+ *                     | cfr_vaddr (ctd)   | cfr_num_pages     |
+ *                     +---------------------------------------+
+ *                     | d0 | d1 ...                           |
+ *                     +---------------------------------------+
+ *                       ...
+ *                     +---------------------------------------+
+ *       last region-> | cfr_vaddr                             |
+ *                     +---------------------------------------+
+ *                     | cfr_num_pages     | d0 | d1 | d2 | d3 |
+ *                     +---------------------------------------+
+ *                       ...
+ *                     +---------------------------------------+
+ *                     | dx | dy | dz | na | na | na | na | na |
+ *                     +---------------------------------------+
+ *
+ * where:
+ *      cf_size:	total size of the buffer (rounded to page size)
+ *      cf_last_region:	offset in the buffer of the last "region" sub-header
+ *	cf_last_zeroes: number of trailing "zero" dispositions at the end
+ *			of last region
+ *	cfr_vaddr:	virtual address of the start of the covered "region"
+ *	cfr_num_pages:	number of pages in the covered "region"
+ *	d*:		disposition of the page at that virtual address
+ * Regions in the buffer are word-aligned.
+ *
+ * We estimate the size of the buffer based on the number of memory regions
+ * and the virtual size of the address space.  While copying each memory region
+ * during vm_map_fork(), we also collect the footprint info for that region
+ * and store it in the buffer, packing it as much as possible (coalescing
+ * contiguous memory regions to avoid having too many region headers and
+ * avoiding long streaks of "zero" page dispositions by splitting footprint
+ * "regions"), so the number of regions in the footprint buffer might not match
+ * the number of memory regions in the address space.
+ *
+ * We also have to copy the original task's "nonvolatile" ledgers since that's
+ * part of the footprint and will need to be reported to any tool asking for
+ * the footprint information of the forked corpse.
  */
 
-kern_return_t
-vm_remap_range_allocate(
-	vm_map_t	map,
-	vm_offset_t	*address,	/* IN/OUT */
-	vm_size_t	size,
-	vm_offset_t	mask,
-	boolean_t	anywhere,
-	vm_map_entry_t	*map_entry)	/* OUT */
+uint64_t vm_map_corpse_footprint_count = 0;
+uint64_t vm_map_corpse_footprint_size_avg = 0;
+uint64_t vm_map_corpse_footprint_size_max = 0;
+uint64_t vm_map_corpse_footprint_full = 0;
+uint64_t vm_map_corpse_footprint_no_buf = 0;
+
+/*
+ * vm_map_corpse_footprint_new_region:
+ *      closes the current footprint "region" and creates a new one
+ *
+ * Returns NULL if there's not enough space in the buffer for a new region.
+ */
+static struct vm_map_corpse_footprint_region *
+vm_map_corpse_footprint_new_region(
+	struct vm_map_corpse_footprint_header *footprint_header)
 {
-	register vm_map_entry_t	entry;
-	register vm_offset_t	start;
-	register vm_offset_t	end;
-	kern_return_t		result = KERN_SUCCESS;
+	uintptr_t       footprint_edge;
+	uint32_t        new_region_offset;
+	struct vm_map_corpse_footprint_region *footprint_region;
+	struct vm_map_corpse_footprint_region *new_footprint_region;
+
+	footprint_edge = ((uintptr_t)footprint_header +
+	    footprint_header->cf_size);
+	footprint_region = ((struct vm_map_corpse_footprint_region *)
+	    ((char *)footprint_header +
+	    footprint_header->cf_last_region));
+	assert((uintptr_t)footprint_region + sizeof(*footprint_region) <=
+	    footprint_edge);
+
+	/* get rid of trailing zeroes in the last region */
+	assert(footprint_region->cfr_num_pages >=
+	    footprint_header->cf_last_zeroes);
+	footprint_region->cfr_num_pages -=
+	    footprint_header->cf_last_zeroes;
+	footprint_header->cf_last_zeroes = 0;
+
+	/* reuse this region if it's now empty */
+	if (footprint_region->cfr_num_pages == 0) {
+		return footprint_region;
+	}
 
- StartAgain: ;
+	/* compute offset of new region */
+	new_region_offset = footprint_header->cf_last_region;
+	new_region_offset += sizeof(*footprint_region);
+	new_region_offset += footprint_region->cfr_num_pages;
+	new_region_offset = roundup(new_region_offset, sizeof(int));
+
+	/* check if we're going over the edge */
+	if (((uintptr_t)footprint_header +
+	    new_region_offset +
+	    sizeof(*footprint_region)) >=
+	    footprint_edge) {
+		/* over the edge: no new region */
+		return NULL;
+	}
 
-    start = *address;
+	/* adjust offset of last region in header */
+	footprint_header->cf_last_region = new_region_offset;
 
-    if (anywhere)
-    {
-	/*
-	 *	Calculate the first possible address.
-	 */
+	new_footprint_region = (struct vm_map_corpse_footprint_region *)
+	    ((char *)footprint_header +
+	    footprint_header->cf_last_region);
+	new_footprint_region->cfr_vaddr = 0;
+	new_footprint_region->cfr_num_pages = 0;
+	/* caller needs to initialize new region */
 
-	if (start < map->min_offset)
-	    start = map->min_offset;
-	if (start > map->max_offset)
-	    return(KERN_NO_SPACE);
-		
-	/*
-	 *	Look for the first possible address;
-	 *	if there's already something at this
-	 *	address, we have to start after it.
-	 */
+	return new_footprint_region;
+}
 
-	assert(first_free_is_valid(map));
-	if (start == map->min_offset) {
-	    if ((entry = map->first_free) != vm_map_to_entry(map))
-		start = entry->vme_end;
-	} else {
-	    vm_map_entry_t	tmp_entry;
-	    if (vm_map_lookup_entry(map, start, &tmp_entry))
-		start = tmp_entry->vme_end;
-	    entry = tmp_entry;
+/*
+ * vm_map_corpse_footprint_collect:
+ *	collects footprint information for "old_entry" in "old_map" and
+ *	stores it in "new_map"'s vmmap_corpse_footprint.
+ */
+kern_return_t
+vm_map_corpse_footprint_collect(
+	vm_map_t        old_map,
+	vm_map_entry_t  old_entry,
+	vm_map_t        new_map)
+{
+	vm_map_offset_t va;
+	int             disp;
+	kern_return_t   kr;
+	struct vm_map_corpse_footprint_header *footprint_header;
+	struct vm_map_corpse_footprint_region *footprint_region;
+	struct vm_map_corpse_footprint_region *new_footprint_region;
+	unsigned char   *next_disp_p;
+	uintptr_t       footprint_edge;
+	uint32_t        num_pages_tmp;
+
+	va = old_entry->vme_start;
+
+	vm_map_lock_assert_exclusive(old_map);
+	vm_map_lock_assert_exclusive(new_map);
+
+	assert(new_map->has_corpse_footprint);
+	assert(!old_map->has_corpse_footprint);
+	if (!new_map->has_corpse_footprint ||
+	    old_map->has_corpse_footprint) {
+		/*
+		 * This can only transfer footprint info from a
+		 * map with a live pmap to a map with a corpse footprint.
+		 */
+		return KERN_NOT_SUPPORTED;
 	}
-		
-	/*
-	 *	In any case, the "entry" always precedes
-	 *	the proposed new region throughout the
-	 *	loop:
-	 */
 
-	while (TRUE) {
-	    register vm_map_entry_t	next;
-
-	    /*
-	     *	Find the end of the proposed new region.
-	     *	Be sure we didn't go beyond the end, or
-	     *	wrap around the address.
-	     */
-
-	    end = ((start + mask) & ~mask);
-	    if (end < start)
-		    return(KERN_NO_SPACE);
-	    start = end;
-	    end += size;
-
-	    if ((end > map->max_offset) || (end < start)) {
-		if (map->wait_for_space) {
-		    if (size <= (map->max_offset -
-				 map->min_offset)) {
-			assert_wait((event_t) map, THREAD_INTERRUPTIBLE);
-			vm_map_unlock(map);
-			thread_block((void (*)(void))0);
-			vm_map_lock(map);
-			goto StartAgain;
-		    }
+	if (new_map->vmmap_corpse_footprint == NULL) {
+		vm_offset_t     buf;
+		vm_size_t       buf_size;
+
+		buf = 0;
+		buf_size = (sizeof(*footprint_header) +
+		    (old_map->hdr.nentries
+		    *
+		    (sizeof(*footprint_region) +
+		    +3))            /* potential alignment for each region */
+		    +
+		    ((old_map->size / PAGE_SIZE)
+		    *
+		    sizeof(char)));           /* disposition for each page */
+//		printf("FBDP corpse map %p guestimate footprint size 0x%llx\n", new_map, (uint64_t) buf_size);
+		buf_size = round_page(buf_size);
+
+		/* limit buffer to 1 page to validate overflow detection */
+//		buf_size = PAGE_SIZE;
+
+		/* limit size to a somewhat sane amount */
+#if CONFIG_EMBEDDED
+#define VM_MAP_CORPSE_FOOTPRINT_INFO_MAX_SIZE   (256*1024)      /* 256KB */
+#else /* CONFIG_EMBEDDED */
+#define VM_MAP_CORPSE_FOOTPRINT_INFO_MAX_SIZE   (8*1024*1024)   /* 8MB */
+#endif /* CONFIG_EMBEDDED */
+		if (buf_size > VM_MAP_CORPSE_FOOTPRINT_INFO_MAX_SIZE) {
+			buf_size = VM_MAP_CORPSE_FOOTPRINT_INFO_MAX_SIZE;
 		}
-		
-		return(KERN_NO_SPACE);
-	    }
-
-	    /*
-	     *	If there are no more entries, we must win.
-	     */
-
-	    next = entry->vme_next;
-	    if (next == vm_map_to_entry(map))
-		break;
 
-	    /*
-	     *	If there is another entry, it must be
-	     *	after the end of the potential new region.
-	     */
+		/*
+		 * Allocate the pageable buffer (with a trailing guard page).
+		 * It will be zero-filled on demand.
+		 */
+		kr = kernel_memory_allocate(kernel_map,
+		    &buf,
+		    (buf_size
+		    + PAGE_SIZE),                          /* trailing guard page */
+		    0,                         /* mask */
+		    KMA_PAGEABLE | KMA_GUARD_LAST,
+		    VM_KERN_MEMORY_DIAG);
+		if (kr != KERN_SUCCESS) {
+			vm_map_corpse_footprint_no_buf++;
+			return kr;
+		}
 
-	    if (next->vme_start >= end)
-		break;
+		/* initialize header and 1st region */
+		footprint_header = (struct vm_map_corpse_footprint_header *)buf;
+		new_map->vmmap_corpse_footprint = footprint_header;
 
-	    /*
-	     *	Didn't fit -- move to the next entry.
-	     */
+		footprint_header->cf_size = buf_size;
+		footprint_header->cf_last_region =
+		    sizeof(*footprint_header);
+		footprint_header->cf_last_zeroes = 0;
 
-	    entry = next;
-	    start = entry->vme_end;
+		footprint_region = (struct vm_map_corpse_footprint_region *)
+		    ((char *)footprint_header +
+		    footprint_header->cf_last_region);
+		footprint_region->cfr_vaddr = 0;
+		footprint_region->cfr_num_pages = 0;
+	} else {
+		/* retrieve header and last region */
+		footprint_header = (struct vm_map_corpse_footprint_header *)
+		    new_map->vmmap_corpse_footprint;
+		footprint_region = (struct vm_map_corpse_footprint_region *)
+		    ((char *)footprint_header +
+		    footprint_header->cf_last_region);
 	}
-	*address = start;
-    } else {
-	vm_map_entry_t		temp_entry;
-	
-	/*
-	 *	Verify that:
-	 *		the address doesn't itself violate
-	 *		the mask requirement.
-	 */
+	footprint_edge = ((uintptr_t)footprint_header +
+	    footprint_header->cf_size);
 
-	if ((start & mask) != 0)
-	    return(KERN_NO_SPACE);
+	if ((footprint_region->cfr_vaddr +
+	    (((vm_map_offset_t)footprint_region->cfr_num_pages) *
+	    PAGE_SIZE))
+	    != old_entry->vme_start) {
+		uint64_t num_pages_delta;
+		uint32_t region_offset_delta;
 
+		/*
+		 * Not the next contiguous virtual address:
+		 * start a new region or store "zero" dispositions for
+		 * the missing pages?
+		 */
+		/* size of gap in actual page dispositions */
+		num_pages_delta = (((old_entry->vme_start -
+		    footprint_region->cfr_vaddr) / PAGE_SIZE)
+		    - footprint_region->cfr_num_pages);
+		/* size of gap as a new footprint region header */
+		region_offset_delta =
+		    (sizeof(*footprint_region) +
+		    roundup((footprint_region->cfr_num_pages -
+		    footprint_header->cf_last_zeroes),
+		    sizeof(int)) -
+		    (footprint_region->cfr_num_pages -
+		    footprint_header->cf_last_zeroes));
+//		printf("FBDP %s:%d region 0x%x 0x%llx 0x%x vme_start 0x%llx pages_delta 0x%llx region_delta 0x%x\n", __FUNCTION__, __LINE__, footprint_header->cf_last_region, footprint_region->cfr_vaddr, footprint_region->cfr_num_pages, old_entry->vme_start, num_pages_delta, region_offset_delta);
+		if (region_offset_delta < num_pages_delta ||
+		    os_add3_overflow(footprint_region->cfr_num_pages,
+		    (uint32_t) num_pages_delta,
+		    1,
+		    &num_pages_tmp)) {
+			/*
+			 * Storing data for this gap would take more space
+			 * than inserting a new footprint region header:
+			 * let's start a new region and save space. If it's a
+			 * tie, let's avoid using a new region, since that
+			 * would require more region hops to find the right
+			 * range during lookups.
+			 *
+			 * If the current region's cfr_num_pages would overflow
+			 * if we added "zero" page dispositions for the gap,
+			 * no choice but to start a new region.
+			 */
+//			printf("FBDP %s:%d new region\n", __FUNCTION__, __LINE__);
+			new_footprint_region =
+			    vm_map_corpse_footprint_new_region(footprint_header);
+			/* check that we're not going over the edge */
+			if (new_footprint_region == NULL) {
+				goto over_the_edge;
+			}
+			footprint_region = new_footprint_region;
+			/* initialize new region as empty */
+			footprint_region->cfr_vaddr = old_entry->vme_start;
+			footprint_region->cfr_num_pages = 0;
+		} else {
+			/*
+			 * Store "zero" page dispositions for the missing
+			 * pages.
+			 */
+//			printf("FBDP %s:%d zero gap\n", __FUNCTION__, __LINE__);
+			for (; num_pages_delta > 0; num_pages_delta--) {
+				next_disp_p =
+				    ((unsigned char *) footprint_region +
+				    sizeof(*footprint_region) +
+				    footprint_region->cfr_num_pages);
+				/* check that we're not going over the edge */
+				if ((uintptr_t)next_disp_p >= footprint_edge) {
+					goto over_the_edge;
+				}
+				/* store "zero" disposition for this gap page */
+				footprint_region->cfr_num_pages++;
+				*next_disp_p = (unsigned char) 0;
+				footprint_header->cf_last_zeroes++;
+			}
+		}
+	}
 
-	/*
-	 *	...	the address is within bounds
-	 */
+	for (va = old_entry->vme_start;
+	    va < old_entry->vme_end;
+	    va += PAGE_SIZE) {
+		vm_object_t     object;
+
+		object = VME_OBJECT(old_entry);
+		if (!old_entry->is_sub_map &&
+		    old_entry->iokit_acct &&
+		    object != VM_OBJECT_NULL &&
+		    object->internal &&
+		    object->purgable == VM_PURGABLE_DENY) {
+			/*
+			 * Non-purgeable IOKit memory: phys_footprint
+			 * includes the entire virtual mapping.
+			 * Since the forked corpse's VM map entry will not
+			 * have "iokit_acct", pretend that this page's
+			 * disposition is "present & internal", so that it
+			 * shows up in the forked corpse's footprint.
+			 */
+			disp = (PMAP_QUERY_PAGE_PRESENT |
+			    PMAP_QUERY_PAGE_INTERNAL);
+		} else {
+			disp = 0;
+			pmap_query_page_info(old_map->pmap,
+			    va,
+			    &disp);
+		}
 
-	end = start + size;
+//		if (va < SHARED_REGION_BASE_ARM64) printf("FBDP collect map %p va 0x%llx disp 0x%x\n", new_map, va, disp);
 
-	if ((start < map->min_offset) ||
-	    (end > map->max_offset) ||
-	    (start >= end)) {
-	    return(KERN_INVALID_ADDRESS);
-	}
+		if (disp == 0 && footprint_region->cfr_num_pages == 0) {
+			/*
+			 * Ignore "zero" dispositions at start of
+			 * region: just move start of region.
+			 */
+			footprint_region->cfr_vaddr += PAGE_SIZE;
+			continue;
+		}
 
-	/*
-	 *	...	the starting address isn't allocated
-	 */
+		/* would region's cfr_num_pages overflow? */
+		if (os_add_overflow(footprint_region->cfr_num_pages, 1,
+		    &num_pages_tmp)) {
+			/* overflow: create a new region */
+			new_footprint_region =
+			    vm_map_corpse_footprint_new_region(
+				footprint_header);
+			if (new_footprint_region == NULL) {
+				goto over_the_edge;
+			}
+			footprint_region = new_footprint_region;
+			footprint_region->cfr_vaddr = va;
+			footprint_region->cfr_num_pages = 0;
+		}
 
-	if (vm_map_lookup_entry(map, start, &temp_entry))
-	    return(KERN_NO_SPACE);
+		next_disp_p = ((unsigned char *)footprint_region +
+		    sizeof(*footprint_region) +
+		    footprint_region->cfr_num_pages);
+		/* check that we're not going over the edge */
+		if ((uintptr_t)next_disp_p >= footprint_edge) {
+			goto over_the_edge;
+		}
+		/* store this disposition */
+		*next_disp_p = (unsigned char) disp;
+		footprint_region->cfr_num_pages++;
+
+		if (disp != 0) {
+			/* non-zero disp: break the current zero streak */
+			footprint_header->cf_last_zeroes = 0;
+			/* done */
+			continue;
+		}
 
-	entry = temp_entry;
+		/* zero disp: add to the current streak of zeroes */
+		footprint_header->cf_last_zeroes++;
+		if ((footprint_header->cf_last_zeroes +
+		    roundup((footprint_region->cfr_num_pages -
+		    footprint_header->cf_last_zeroes) &
+		    (sizeof(int) - 1),
+		    sizeof(int))) <
+		    (sizeof(*footprint_header))) {
+			/*
+			 * There are not enough trailing "zero" dispositions
+			 * (+ the extra padding we would need for the previous
+			 * region); creating a new region would not save space
+			 * at this point, so let's keep this "zero" disposition
+			 * in this region and reconsider later.
+			 */
+			continue;
+		}
+		/*
+		 * Create a new region to avoid having too many consecutive
+		 * "zero" dispositions.
+		 */
+		new_footprint_region =
+		    vm_map_corpse_footprint_new_region(footprint_header);
+		if (new_footprint_region == NULL) {
+			goto over_the_edge;
+		}
+		footprint_region = new_footprint_region;
+		/* initialize the new region as empty ... */
+		footprint_region->cfr_num_pages = 0;
+		/* ... and skip this "zero" disp */
+		footprint_region->cfr_vaddr = va + PAGE_SIZE;
+	}
 
-	/*
-	 *	...	the next region doesn't overlap the
-	 *		end point.
-	 */
+	return KERN_SUCCESS;
 
-	if ((entry->vme_next != vm_map_to_entry(map)) &&
-	    (entry->vme_next->vme_start < end))
-	    return(KERN_NO_SPACE);
-    }
-    *map_entry = entry;
-    return(KERN_SUCCESS);
+over_the_edge:
+//	printf("FBDP map %p footprint was full for va 0x%llx\n", new_map, va);
+	vm_map_corpse_footprint_full++;
+	return KERN_RESOURCE_SHORTAGE;
 }
 
 /*
- *	vm_map_switch:
- *
- *	Set the address map for the current thr_act to the specified map
+ * vm_map_corpse_footprint_collect_done:
+ *	completes the footprint collection by getting rid of any remaining
+ *	trailing "zero" dispositions and trimming the unused part of the
+ *	kernel buffer
  */
-
-vm_map_t
-vm_map_switch(
-	vm_map_t	map)
+void
+vm_map_corpse_footprint_collect_done(
+	vm_map_t        new_map)
 {
-	int		mycpu;
-	thread_act_t	thr_act = current_act();
-	vm_map_t	oldmap = thr_act->map;
+	struct vm_map_corpse_footprint_header *footprint_header;
+	struct vm_map_corpse_footprint_region *footprint_region;
+	vm_size_t       buf_size, actual_size;
+	kern_return_t   kr;
+
+	assert(new_map->has_corpse_footprint);
+	if (!new_map->has_corpse_footprint ||
+	    new_map->vmmap_corpse_footprint == NULL) {
+		return;
+	}
 
-	mp_disable_preemption();
-	mycpu = cpu_number();
+	footprint_header = (struct vm_map_corpse_footprint_header *)
+	    new_map->vmmap_corpse_footprint;
+	buf_size = footprint_header->cf_size;
+
+	footprint_region = (struct vm_map_corpse_footprint_region *)
+	    ((char *)footprint_header +
+	    footprint_header->cf_last_region);
+
+	/* get rid of trailing zeroes in last region */
+	assert(footprint_region->cfr_num_pages >= footprint_header->cf_last_zeroes);
+	footprint_region->cfr_num_pages -= footprint_header->cf_last_zeroes;
+	footprint_header->cf_last_zeroes = 0;
+
+	actual_size = (vm_size_t)(footprint_header->cf_last_region +
+	    sizeof(*footprint_region) +
+	    footprint_region->cfr_num_pages);
+
+//	printf("FBDP map %p buf_size 0x%llx actual_size 0x%llx\n", new_map, (uint64_t) buf_size, (uint64_t) actual_size);
+	vm_map_corpse_footprint_size_avg =
+	    (((vm_map_corpse_footprint_size_avg *
+	    vm_map_corpse_footprint_count) +
+	    actual_size) /
+	    (vm_map_corpse_footprint_count + 1));
+	vm_map_corpse_footprint_count++;
+	if (actual_size > vm_map_corpse_footprint_size_max) {
+		vm_map_corpse_footprint_size_max = actual_size;
+	}
 
-	/*
-	 *	Deactivate the current map and activate the requested map
-	 */
-	PMAP_SWITCH_USER(thr_act, map, mycpu);
+	actual_size = round_page(actual_size);
+	if (buf_size > actual_size) {
+		kr = vm_deallocate(kernel_map,
+		    ((vm_address_t)footprint_header +
+		    actual_size +
+		    PAGE_SIZE),                 /* trailing guard page */
+		    (buf_size - actual_size));
+		assertf(kr == KERN_SUCCESS,
+		    "trim: footprint_header %p buf_size 0x%llx actual_size 0x%llx kr=0x%x\n",
+		    footprint_header,
+		    (uint64_t) buf_size,
+		    (uint64_t) actual_size,
+		    kr);
+		kr = vm_protect(kernel_map,
+		    ((vm_address_t)footprint_header +
+		    actual_size),
+		    PAGE_SIZE,
+		    FALSE,             /* set_maximum */
+		    VM_PROT_NONE);
+		assertf(kr == KERN_SUCCESS,
+		    "guard: footprint_header %p buf_size 0x%llx actual_size 0x%llx kr=0x%x\n",
+		    footprint_header,
+		    (uint64_t) buf_size,
+		    (uint64_t) actual_size,
+		    kr);
+	}
 
-	mp_enable_preemption();
-	return(oldmap);
+	footprint_header->cf_size = actual_size;
 }
 
-
 /*
- *	Routine:	vm_map_write_user
- *
- *	Description:
- *		Copy out data from a kernel space into space in the
- *		destination map. The space must already exist in the
- *		destination map.
- *		NOTE:  This routine should only be called by threads
- *		which can block on a page fault. i.e. kernel mode user
- *		threads.
+ * vm_map_corpse_footprint_query_page_info:
+ *	retrieves the disposition of the page at virtual address "vaddr"
+ *	in the forked corpse's VM map
  *
+ * This is the equivalent of pmap_query_page_info() for a forked corpse.
  */
 kern_return_t
-vm_map_write_user(
-	vm_map_t	map,
-	vm_offset_t	src_addr,
-	vm_offset_t	dst_addr,
-	vm_size_t	size)
+vm_map_corpse_footprint_query_page_info(
+	vm_map_t        map,
+	vm_map_offset_t va,
+	int             *disp)
 {
-	thread_act_t	thr_act = current_act();
-	kern_return_t	kr = KERN_SUCCESS;
+	struct vm_map_corpse_footprint_header *footprint_header;
+	struct vm_map_corpse_footprint_region *footprint_region;
+	uint32_t        footprint_region_offset;
+	vm_map_offset_t region_start, region_end;
+	int             disp_idx;
+	kern_return_t   kr;
+
+	if (!map->has_corpse_footprint) {
+		*disp = 0;
+		kr = KERN_INVALID_ARGUMENT;
+		goto done;
+	}
 
-	if(thr_act->map == map) {
-		if (copyout((char *)src_addr, (char *)dst_addr, size)) {
-			kr = KERN_INVALID_ADDRESS;
-		}
-	} else {
-		vm_map_t	oldmap;
+	footprint_header = map->vmmap_corpse_footprint;
+	if (footprint_header == NULL) {
+		*disp = 0;
+//		if (va < SHARED_REGION_BASE_ARM64) printf("FBDP %d query map %p va 0x%llx disp 0x%x\n", __LINE__, map, va, *disp);
+		kr = KERN_INVALID_ARGUMENT;
+		goto done;
+	}
 
-		/* take on the identity of the target map while doing */
-		/* the transfer */
+	/* start looking at the hint ("cf_hint_region") */
+	footprint_region_offset = footprint_header->cf_hint_region;
 
-		vm_map_reference(map);
-		oldmap = vm_map_switch(map);
-		if (copyout((char *)src_addr, (char *)dst_addr, size)) {
-			kr = KERN_INVALID_ADDRESS;
+lookup_again:
+	if (footprint_region_offset < sizeof(*footprint_header)) {
+		/* hint too low: start from 1st region */
+		footprint_region_offset = sizeof(*footprint_header);
+	}
+	if (footprint_region_offset >= footprint_header->cf_last_region) {
+		/* hint too high: re-start from 1st region */
+		footprint_region_offset = sizeof(*footprint_header);
+	}
+	footprint_region = (struct vm_map_corpse_footprint_region *)
+	    ((char *)footprint_header + footprint_region_offset);
+	region_start = footprint_region->cfr_vaddr;
+	region_end = (region_start +
+	    ((vm_map_offset_t)(footprint_region->cfr_num_pages) *
+	    PAGE_SIZE));
+	if (va < region_start &&
+	    footprint_region_offset != sizeof(*footprint_header)) {
+		/* our range starts before the hint region */
+
+		/* reset the hint (in a racy way...) */
+		footprint_header->cf_hint_region = sizeof(*footprint_header);
+		/* lookup "va" again from 1st region */
+		footprint_region_offset = sizeof(*footprint_header);
+		goto lookup_again;
+	}
+
+	while (va >= region_end) {
+		if (footprint_region_offset >= footprint_header->cf_last_region) {
+			break;
 		}
-		vm_map_switch(oldmap);
-		vm_map_deallocate(map);
+		/* skip the region's header */
+		footprint_region_offset += sizeof(*footprint_region);
+		/* skip the region's page dispositions */
+		footprint_region_offset += footprint_region->cfr_num_pages;
+		/* align to next word boundary */
+		footprint_region_offset =
+		    roundup(footprint_region_offset,
+		    sizeof(int));
+		footprint_region = (struct vm_map_corpse_footprint_region *)
+		    ((char *)footprint_header + footprint_region_offset);
+		region_start = footprint_region->cfr_vaddr;
+		region_end = (region_start +
+		    ((vm_map_offset_t)(footprint_region->cfr_num_pages) *
+		    PAGE_SIZE));
+	}
+	if (va < region_start || va >= region_end) {
+		/* page not found */
+		*disp = 0;
+//		if (va < SHARED_REGION_BASE_ARM64) printf("FBDP %d query map %p va 0x%llx disp 0x%x\n", __LINE__, map, va, *disp);
+		kr = KERN_SUCCESS;
+		goto done;
 	}
-	return kr;
-}
 
-/*
- *	Routine:	vm_map_read_user
- *
- *	Description:
- *		Copy in data from a user space source map into the
- *		kernel map. The space must already exist in the
- *		kernel map.
- *		NOTE:  This routine should only be called by threads
- *		which can block on a page fault. i.e. kernel mode user
- *		threads.
- *
- */
-kern_return_t
-vm_map_read_user(
-	vm_map_t	map,
-	vm_offset_t	src_addr,
-	vm_offset_t	dst_addr,
-	vm_size_t	size)
-{
-	thread_act_t	thr_act = current_act();
-	kern_return_t	kr = KERN_SUCCESS;
+	/* "va" found: set the lookup hint for next lookup (in a racy way...) */
+	footprint_header->cf_hint_region = footprint_region_offset;
 
-	if(thr_act->map == map) {
-		if (copyin((char *)src_addr, (char *)dst_addr, size)) {
-			kr = KERN_INVALID_ADDRESS;
-		}
-	} else {
-		vm_map_t	oldmap;
+	/* get page disposition for "va" in this region */
+	disp_idx = (int) ((va - footprint_region->cfr_vaddr) / PAGE_SIZE);
+	*disp = (int) (footprint_region->cfr_disposition[disp_idx]);
 
-		/* take on the identity of the target map while doing */
-		/* the transfer */
+	kr = KERN_SUCCESS;
+done:
+//	if (va < SHARED_REGION_BASE_ARM64) printf("FBDP %d query map %p va 0x%llx disp 0x%x\n", __LINE__, map, va, *disp);
+	/* dtrace -n 'vminfo:::footprint_query_page_info { printf("map 0x%p va 0x%llx disp 0x%x kr 0x%x", arg0, arg1, arg2, arg3); }' */
+	DTRACE_VM4(footprint_query_page_info,
+	    vm_map_t, map,
+	    vm_map_offset_t, va,
+	    int, *disp,
+	    kern_return_t, kr);
 
-		vm_map_reference(map);
-		oldmap = vm_map_switch(map);
-		if (copyin((char *)src_addr, (char *)dst_addr, size)) {
-			kr = KERN_INVALID_ADDRESS;
-		}
-		vm_map_switch(oldmap);
-		vm_map_deallocate(map);
-	}
 	return kr;
 }
 
-/* Takes existing source and destination sub-maps and clones the contents of */
-/* the source map */
 
-kern_return_t
-vm_region_clone(
-	ipc_port_t	src_region, 
-	ipc_port_t	dst_region)
-{
-	vm_named_entry_t	src_object;
-	vm_named_entry_t	dst_object;
-	vm_map_t		src_map;
-	vm_map_t		dst_map;
-	vm_offset_t		addr;
-	vm_offset_t		max_off;
-	vm_map_entry_t		entry;
-	vm_map_entry_t		new_entry;
-	vm_map_entry_t		insert_point;
-
-	src_object = (vm_named_entry_t)src_region->ip_kobject;
-	dst_object = (vm_named_entry_t)dst_region->ip_kobject;
-	if((!src_object->is_sub_map) || (!dst_object->is_sub_map)) {
-		return KERN_INVALID_ARGUMENT;
-	}
-	src_map = (vm_map_t)src_object->backing.map;
-	dst_map = (vm_map_t)dst_object->backing.map;
-	/* destination map is assumed to be unavailable to any other */
-	/* activity.  i.e. it is new */
-	vm_map_lock(src_map);
-	if((src_map->min_offset != dst_map->min_offset) 
-			|| (src_map->max_offset != dst_map->max_offset)) {
-		vm_map_unlock(src_map);
-		return KERN_INVALID_ARGUMENT;
-	}
-	addr = src_map->min_offset;
-	vm_map_lookup_entry(dst_map, addr, &entry);
-	if(entry == vm_map_to_entry(dst_map)) {
-		entry = entry->vme_next;
-	}
-	if(entry == vm_map_to_entry(dst_map)) {
-		max_off = src_map->max_offset;
-	} else {
-		max_off =  entry->vme_start;
-	}
-	vm_map_lookup_entry(src_map, addr, &entry);
-	if(entry == vm_map_to_entry(src_map)) {
-		entry = entry->vme_next;
-	}
-	vm_map_lookup_entry(dst_map, addr, &insert_point);
-	while((entry != vm_map_to_entry(src_map)) && 
-					(entry->vme_end <= max_off)) {
-		addr = entry->vme_start;
-		new_entry = vm_map_entry_create(dst_map);
-		vm_map_entry_copy(new_entry, entry);
-		vm_map_entry_link(dst_map, insert_point, new_entry);
-		insert_point = new_entry;
-		if (entry->object.vm_object != VM_OBJECT_NULL) {
-			if (new_entry->is_sub_map) {
-				vm_map_reference(new_entry->object.sub_map);
-			} else {
-				vm_object_reference(
-					new_entry->object.vm_object);
-			}
-		}
-		dst_map->size += new_entry->vme_end - new_entry->vme_start;
-		entry = entry->vme_next;
+static void
+vm_map_corpse_footprint_destroy(
+	vm_map_t        map)
+{
+	if (map->has_corpse_footprint &&
+	    map->vmmap_corpse_footprint != 0) {
+		struct vm_map_corpse_footprint_header *footprint_header;
+		vm_size_t buf_size;
+		kern_return_t kr;
+
+		footprint_header = map->vmmap_corpse_footprint;
+		buf_size = footprint_header->cf_size;
+		kr = vm_deallocate(kernel_map,
+		    (vm_offset_t) map->vmmap_corpse_footprint,
+		    ((vm_size_t) buf_size
+		    + PAGE_SIZE));                 /* trailing guard page */
+		assertf(kr == KERN_SUCCESS, "kr=0x%x\n", kr);
+		map->vmmap_corpse_footprint = 0;
+		map->has_corpse_footprint = FALSE;
 	}
-	vm_map_unlock(src_map);
-	return KERN_SUCCESS;
 }
 
 /*
- * Export routines to other components for the things we access locally through
- * macros.
+ * vm_map_copy_footprint_ledgers:
+ *	copies any ledger that's relevant to the memory footprint of "old_task"
+ *	into the forked corpse's task ("new_task")
  */
-#undef current_map
-vm_map_t
-current_map(void)
+void
+vm_map_copy_footprint_ledgers(
+	task_t  old_task,
+	task_t  new_task)
 {
-	return (current_map_fast());
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.phys_footprint);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.purgeable_nonvolatile);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.purgeable_nonvolatile_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.internal);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.internal_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.iokit_mapped);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.alternate_accounting);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.alternate_accounting_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.page_table);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.tagged_footprint);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.tagged_footprint_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.network_nonvolatile);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.network_nonvolatile_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.media_footprint);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.media_footprint_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.graphics_footprint);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.graphics_footprint_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.neural_footprint);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.neural_footprint_compressed);
+	vm_map_copy_ledger(old_task, new_task, task_ledgers.wired_mem);
 }
 
 /*
- *	vm_map_check_protection:
- *
- *	Assert that the target map allows the specified
- *	privilege on the entire address region given.
- *	The entire region must be allocated.
+ * vm_map_copy_ledger:
+ *	make the "ledger_entry" balance of "new_task" equal to that of "old_task" by debiting or crediting the difference in new_task->ledger; old_task->ledger is only queried
  */
-boolean_t vm_map_check_protection(map, start, end, protection)
-	register vm_map_t	map;
-	register vm_offset_t	start;
-	register vm_offset_t	end;
-	register vm_prot_t	protection;
+void
+vm_map_copy_ledger(
+	task_t  old_task,
+	task_t  new_task,
+	int     ledger_entry)
 {
-	register vm_map_entry_t	entry;
-	vm_map_entry_t		tmp_entry;
-
-	vm_map_lock(map);
+	ledger_amount_t old_balance, new_balance, delta;
 
-    if (start < vm_map_min(map) || end > vm_map_max(map) || start > end)
-	{
-			vm_map_unlock(map);
-			return (FALSE);
+	assert(new_task->map->has_corpse_footprint);
+	if (!new_task->map->has_corpse_footprint) {
+		return; /* same condition as the assert above (presumably for builds where assert() compiles out): leave new_task->ledger untouched */
 	}
 
-	if (!vm_map_lookup_entry(map, start, &tmp_entry)) {
-		vm_map_unlock(map);
-		return(FALSE);
+	/* turn off the panic-on-negative sanity check for this entry of new_task->ledger before adjusting it; it is not turned back on in this function */
+	ledger_disable_panic_on_negative(new_task->ledger,
+	    ledger_entry);
+
+	/* read both balances, then adjust "new_task" to match "old_task" */
+	ledger_get_balance(old_task->ledger,
+	    ledger_entry,
+	    &old_balance);
+	ledger_get_balance(new_task->ledger,
+	    ledger_entry,
+	    &new_balance);
+	if (new_balance == old_balance) {
+		/* new == old: nothing to adjust */
+	} else if (new_balance > old_balance) {
+		/* new > old ==> debit the excess: new -= new - old */
+		delta = new_balance - old_balance;
+		ledger_debit(new_task->ledger,
+		    ledger_entry,
+		    delta);
+	} else {
+		/* new < old ==> credit the shortfall: new += old - new */
+		delta = old_balance - new_balance;
+		ledger_credit(new_task->ledger,
+		    ledger_entry,
+		    delta);
 	}
+}
 
-	entry = tmp_entry;
-
-	while (start < end) {
-		if (entry == vm_map_to_entry(map)) {
-			vm_map_unlock(map);
-			return(FALSE);
-		}
-
-		/*
-		 *	No holes allowed!
-		 */
-
-		if (start < entry->vme_start) {
-			vm_map_unlock(map);
-			return(FALSE);
-		}
+#if MACH_ASSERT
+
+extern int pmap_ledgers_panic; /* non-zero: vm_map_pmap_check_ledgers() panics on imbalanced ledgers instead of only logging them */
+extern int pmap_ledgers_panic_leeway; /* tolerated leftover balance, in pages (it is multiplied by PAGE_SIZE); the leeway test only applies when this is > 0 */
+/* LEDGER_DRIFT(x): declares, for ledger "x", a count, a running total and an extreme value for positive ("over") and for negative ("under") leftover balances */
+#define LEDGER_DRIFT(__LEDGER)                    \
+	int             __LEDGER##_over;          \
+	ledger_amount_t __LEDGER##_over_total;    \
+	ledger_amount_t __LEDGER##_over_max;      \
+	int             __LEDGER##_under;         \
+	ledger_amount_t __LEDGER##_under_total;   \
+	ledger_amount_t __LEDGER##_under_max
+/* Leftover-balance statistics accumulated by vm_map_pmap_check_ledgers(): one LEDGER_DRIFT group per ledger it checks; "under" totals and maxima hold negative values */
+struct {
+	uint64_t        num_pmaps_checked; /* incremented on every vm_map_pmap_check_ledgers() call */
+
+	LEDGER_DRIFT(phys_footprint);
+	LEDGER_DRIFT(internal);
+	LEDGER_DRIFT(internal_compressed);
+	LEDGER_DRIFT(iokit_mapped);
+	LEDGER_DRIFT(alternate_accounting);
+	LEDGER_DRIFT(alternate_accounting_compressed);
+	LEDGER_DRIFT(page_table);
+	LEDGER_DRIFT(purgeable_volatile);
+	LEDGER_DRIFT(purgeable_nonvolatile);
+	LEDGER_DRIFT(purgeable_volatile_compressed);
+	LEDGER_DRIFT(purgeable_nonvolatile_compressed);
+	LEDGER_DRIFT(tagged_nofootprint);
+	LEDGER_DRIFT(tagged_footprint);
+	LEDGER_DRIFT(tagged_nofootprint_compressed);
+	LEDGER_DRIFT(tagged_footprint_compressed);
+	LEDGER_DRIFT(network_volatile);
+	LEDGER_DRIFT(network_nonvolatile);
+	LEDGER_DRIFT(network_volatile_compressed);
+	LEDGER_DRIFT(network_nonvolatile_compressed);
+	LEDGER_DRIFT(media_nofootprint);
+	LEDGER_DRIFT(media_footprint);
+	LEDGER_DRIFT(media_nofootprint_compressed);
+	LEDGER_DRIFT(media_footprint_compressed);
+	LEDGER_DRIFT(graphics_nofootprint);
+	LEDGER_DRIFT(graphics_footprint);
+	LEDGER_DRIFT(graphics_nofootprint_compressed);
+	LEDGER_DRIFT(graphics_footprint_compressed);
+	LEDGER_DRIFT(neural_nofootprint);
+	LEDGER_DRIFT(neural_footprint);
+	LEDGER_DRIFT(neural_nofootprint_compressed);
+	LEDGER_DRIFT(neural_footprint_compressed);
+} pmap_ledgers_drift;
 
-		/*
-		 * Check protection associated with entry.
-		 */
+void
+vm_map_pmap_check_ledgers(
+	pmap_t          pmap, /* only printed (%p) in the final "imbalanced ledgers" message */
+	ledger_t        ledger, /* ledger whose task_ledgers entries are checked */
+	int             pid, /* only used to label the log/panic messages */
+	char            *procname) /* only used to label the log/panic messages */
+{
+	ledger_amount_t bal; /* scratch balance, written by each LEDGER_CHECK_BALANCE expansion */
+	boolean_t       do_panic; /* set by LEDGER_CHECK_BALANCE when a leftover balance warrants the final panic/log */
+	/* Check that each ledger entry listed below has a zero balance in "ledger"; log and tally every non-zero one in pmap_ledgers_drift, then panic or log a summary */
+	do_panic = FALSE;
+
+	pmap_ledgers_drift.num_pmaps_checked++;
+	/* LEDGER_CHECK_BALANCE(x): read the task_ledgers.x balance; if non-zero, log it, tally it as "over" (> 0) or "under" (< 0), and set do_panic when panic_on_negative (TRUE unless changed by ledger_get_panic_on_negative()) is set, or when pmap_ledgers_panic is set, pmap_ledgers_panic_leeway > 0 and the balance is beyond +/- leeway * PAGE_SIZE */
+#define LEDGER_CHECK_BALANCE(__LEDGER)                                  \
+MACRO_BEGIN                                                             \
+	int panic_on_negative = TRUE;                                   \
+	ledger_get_balance(ledger,                                      \
+	                   task_ledgers.__LEDGER,                       \
+	                   &bal);                                       \
+	ledger_get_panic_on_negative(ledger,                            \
+	                             task_ledgers.__LEDGER,             \
+	                             &panic_on_negative);               \
+	if (bal != 0) {                                                 \
+	        if (panic_on_negative ||                                \
+	            (pmap_ledgers_panic &&                              \
+	             pmap_ledgers_panic_leeway > 0 &&                   \
+	             (bal > (pmap_ledgers_panic_leeway * PAGE_SIZE) ||  \
+	              bal < (-pmap_ledgers_panic_leeway * PAGE_SIZE)))) { \
+	                do_panic = TRUE;                                \
+	        }                                                       \
+	        printf("LEDGER BALANCE proc %d (%s) "                   \
+	               "\"%s\" = %lld\n",                               \
+	               pid, procname, #__LEDGER, bal);                  \
+	        if (bal > 0) {                                          \
+	                pmap_ledgers_drift.__LEDGER##_over++;           \
+	                pmap_ledgers_drift.__LEDGER##_over_total += bal; \
+	                if (bal > pmap_ledgers_drift.__LEDGER##_over_max) { \
+	                        pmap_ledgers_drift.__LEDGER##_over_max = bal; \
+	                }                                               \
+	        } else if (bal < 0) {                                   \
+	                pmap_ledgers_drift.__LEDGER##_under++;          \
+	                pmap_ledgers_drift.__LEDGER##_under_total += bal; \
+	                if (bal < pmap_ledgers_drift.__LEDGER##_under_max) { \
+	                        pmap_ledgers_drift.__LEDGER##_under_max = bal; \
+	                }                                               \
+	        }                                                       \
+	}                                                               \
+MACRO_END
 
-		if ((entry->protection & protection) != protection) {
-			vm_map_unlock(map);
-			return(FALSE);
+	LEDGER_CHECK_BALANCE(phys_footprint);
+	LEDGER_CHECK_BALANCE(internal);
+	LEDGER_CHECK_BALANCE(internal_compressed);
+	LEDGER_CHECK_BALANCE(iokit_mapped);
+	LEDGER_CHECK_BALANCE(alternate_accounting);
+	LEDGER_CHECK_BALANCE(alternate_accounting_compressed);
+	LEDGER_CHECK_BALANCE(page_table);
+	LEDGER_CHECK_BALANCE(purgeable_volatile);
+	LEDGER_CHECK_BALANCE(purgeable_nonvolatile);
+	LEDGER_CHECK_BALANCE(purgeable_volatile_compressed);
+	LEDGER_CHECK_BALANCE(purgeable_nonvolatile_compressed);
+	LEDGER_CHECK_BALANCE(tagged_nofootprint);
+	LEDGER_CHECK_BALANCE(tagged_footprint);
+	LEDGER_CHECK_BALANCE(tagged_nofootprint_compressed);
+	LEDGER_CHECK_BALANCE(tagged_footprint_compressed);
+	LEDGER_CHECK_BALANCE(network_volatile);
+	LEDGER_CHECK_BALANCE(network_nonvolatile);
+	LEDGER_CHECK_BALANCE(network_volatile_compressed);
+	LEDGER_CHECK_BALANCE(network_nonvolatile_compressed);
+	LEDGER_CHECK_BALANCE(media_nofootprint);
+	LEDGER_CHECK_BALANCE(media_footprint);
+	LEDGER_CHECK_BALANCE(media_nofootprint_compressed);
+	LEDGER_CHECK_BALANCE(media_footprint_compressed);
+	LEDGER_CHECK_BALANCE(graphics_nofootprint);
+	LEDGER_CHECK_BALANCE(graphics_footprint);
+	LEDGER_CHECK_BALANCE(graphics_nofootprint_compressed);
+	LEDGER_CHECK_BALANCE(graphics_footprint_compressed);
+	LEDGER_CHECK_BALANCE(neural_nofootprint);
+	LEDGER_CHECK_BALANCE(neural_footprint);
+	LEDGER_CHECK_BALANCE(neural_nofootprint_compressed);
+	LEDGER_CHECK_BALANCE(neural_footprint_compressed);
+	/* report once for all ledgers: panic only when pmap_ledgers_panic is set, otherwise just log; NOTE(review): the message names pmap_destroy(), presumably the caller - confirm */
+	if (do_panic) {
+		if (pmap_ledgers_panic) {
+			panic("pmap_destroy(%p) %d[%s] has imbalanced ledgers\n",
+			    pmap, pid, procname);
+		} else {
+			printf("pmap_destroy(%p) %d[%s] has imbalanced ledgers\n",
+			    pmap, pid, procname);
 		}
-
-		/* go to next entry */
-
-		start = entry->vme_end;
-		entry = entry->vme_next;
 	}
-	vm_map_unlock(map);
-	return(TRUE);
 }
+#endif /* MACH_ASSERT */