2 * Copyright (c) 2000-2006 Apple Computer, Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 #include <sys/errno.h>
31 #include <mach/mach_types.h>
32 #include <mach/mach_traps.h>
33 #include <mach/host_priv.h>
34 #include <mach/kern_return.h>
35 #include <mach/memory_object_control.h>
36 #include <mach/memory_object_types.h>
37 #include <mach/port.h>
38 #include <mach/policy.h>
40 #include <mach/thread_act.h>
42 #include <kern/assert.h>
43 #include <kern/host.h>
44 #include <kern/thread.h>
46 #include <ipc/ipc_port.h>
47 #include <ipc/ipc_space.h>
49 #include <default_pager/default_pager_types.h>
50 #include <default_pager/default_pager_object_server.h>
52 #include <vm/vm_map.h>
53 #include <vm/vm_pageout.h>
54 #include <vm/memory_object.h>
55 #include <vm/vm_pageout.h>
56 #include <vm/vm_protos.h>
57 #include <vm/vm_purgeable_internal.h>
60 /* BSD VM COMPONENT INTERFACES */
80 return(map
->hdr
.nentries
);
84 mach_get_vm_start(vm_map_t map
)
86 return( vm_map_first_entry(map
)->vme_start
);
90 mach_get_vm_end(vm_map_t map
)
92 return( vm_map_last_entry(map
)->vme_end
);
99 const struct memory_object_pager_ops vnode_pager_ops
= {
100 vnode_pager_reference
,
101 vnode_pager_deallocate
,
103 vnode_pager_terminate
,
104 vnode_pager_data_request
,
105 vnode_pager_data_return
,
106 vnode_pager_data_initialize
,
107 vnode_pager_data_unlock
,
108 vnode_pager_synchronize
,
110 vnode_pager_last_unmap
,
111 NULL
, /* data_reclaim */
115 typedef struct vnode_pager
{
116 struct ipc_object_header pager_header
; /* fake ip_kotype() */
117 memory_object_pager_ops_t pager_ops
; /* == &vnode_pager_ops */
118 unsigned int ref_count
; /* reference count */
119 memory_object_control_t control_handle
; /* mem object control handle */
120 struct vnode
*vnode_handle
; /* vnode handle */
123 #define pager_ikot pager_header.io_bits
126 trigger_name_to_port( /* forward */
130 vnode_pager_cluster_read( /* forward */
138 vnode_pager_cluster_write( /* forward */
142 vm_object_offset_t
*,
148 vnode_object_create( /* forward */
152 vnode_pager_lookup( /* forward */
155 zone_t vnode_pager_zone
;
158 #define VNODE_PAGER_NULL ((vnode_pager_t) 0)
160 /* TODO: Should be set dynamically by vnode_pager_init() */
161 #define CLUSTER_SHIFT 1
163 /* TODO: Should be set dynamically by vnode_pager_bootstrap() */
164 #define MAX_VNODE 10000
170 #define PAGER_ALL 0xffffffff
171 #define PAGER_INIT 0x00000001
172 #define PAGER_PAGEIN 0x00000002
174 #define PAGER_DEBUG(LEVEL, A) {if ((pagerdebug & LEVEL)==LEVEL){printf A;}}
176 #define PAGER_DEBUG(LEVEL, A)
179 extern int proc_resetpcontrol(int);
181 #if DEVELOPMENT || DEBUG
182 extern unsigned long vm_cs_validated_resets
;
186 * Routine: mach_macx_triggers
188 * Syscall interface to set the call backs for low and
193 struct macx_triggers_args
*args
)
195 int hi_water
= args
->hi_water
;
196 int low_water
= args
->low_water
;
197 int flags
= args
->flags
;
198 mach_port_t trigger_name
= args
->alert_port
;
200 memory_object_default_t default_pager
;
201 ipc_port_t trigger_port
;
203 default_pager
= MEMORY_OBJECT_DEFAULT_NULL
;
204 kr
= host_default_memory_manager(host_priv_self(),
206 if(kr
!= KERN_SUCCESS
) {
210 if (((flags
& SWAP_ENCRYPT_ON
) && (flags
& SWAP_ENCRYPT_OFF
)) ||
211 ((flags
& SWAP_COMPACT_ENABLE
) && (flags
& SWAP_COMPACT_DISABLE
))) {
212 /* can't have it both ways */
216 if (default_pager_init_flag
== 0) {
217 start_def_pager(NULL
);
218 default_pager_init_flag
= 1;
221 if (flags
& SWAP_ENCRYPT_ON
) {
222 /* ENCRYPTED SWAP: tell default_pager to encrypt */
223 default_pager_triggers(default_pager
,
227 } else if (flags
& SWAP_ENCRYPT_OFF
) {
228 /* ENCRYPTED SWAP: tell default_pager not to encrypt */
229 default_pager_triggers(default_pager
,
235 if (flags
& USE_EMERGENCY_SWAP_FILE_FIRST
) {
237 * Time to switch to the emergency segment.
239 return default_pager_triggers(default_pager
,
241 USE_EMERGENCY_SWAP_FILE_FIRST
,
245 if (flags
& SWAP_FILE_CREATION_ERROR
) {
247 * For some reason, the dynamic pager failed to create a swap file.
249 trigger_port
= trigger_name_to_port(trigger_name
);
250 if(trigger_port
== NULL
) {
253 /* trigger_port is locked and active */
254 ipc_port_make_send_locked(trigger_port
);
256 default_pager_triggers(default_pager
,
258 SWAP_FILE_CREATION_ERROR
,
262 if (flags
& HI_WAT_ALERT
) {
263 trigger_port
= trigger_name_to_port(trigger_name
);
264 if(trigger_port
== NULL
) {
267 /* trigger_port is locked and active */
268 ipc_port_make_send_locked(trigger_port
);
270 default_pager_triggers(default_pager
,
272 HI_WAT_ALERT
, trigger_port
);
275 if (flags
& LO_WAT_ALERT
) {
276 trigger_port
= trigger_name_to_port(trigger_name
);
277 if(trigger_port
== NULL
) {
280 /* trigger_port is locked and active */
281 ipc_port_make_send_locked(trigger_port
);
282 /* and now its unlocked */
283 default_pager_triggers(default_pager
,
285 LO_WAT_ALERT
, trigger_port
);
289 if (flags
& PROC_RESUME
) {
292 * For this call, hi_water is used to pass in the pid of the process we want to resume
293 * or unthrottle. This is of course restricted to the superuser (checked inside of
294 * proc_resetpcontrol).
297 return proc_resetpcontrol(hi_water
);
301 * Set thread scheduling priority and policy for the current thread
302 * it is assumed for the time being that the thread setting the alert
303 * is the same one which will be servicing it.
305 * XXX This does not belong in the kernel XXX
307 if (flags
& HI_WAT_ALERT
) {
308 thread_precedence_policy_data_t pre
;
309 thread_extended_policy_data_t ext
;
311 ext
.timeshare
= FALSE
;
312 pre
.importance
= INT32_MAX
;
314 thread_policy_set(current_thread(),
315 THREAD_EXTENDED_POLICY
,
316 (thread_policy_t
)&ext
,
317 THREAD_EXTENDED_POLICY_COUNT
);
319 thread_policy_set(current_thread(),
320 THREAD_PRECEDENCE_POLICY
,
321 (thread_policy_t
)&pre
,
322 THREAD_PRECEDENCE_POLICY_COUNT
);
324 current_thread()->options
|= TH_OPT_VMPRIV
;
327 if (flags
& (SWAP_COMPACT_DISABLE
| SWAP_COMPACT_ENABLE
)) {
328 return macx_backing_store_compaction(flags
& (SWAP_COMPACT_DISABLE
| SWAP_COMPACT_ENABLE
));
338 trigger_name_to_port(
339 mach_port_t trigger_name
)
341 ipc_port_t trigger_port
;
344 if (trigger_name
== 0)
347 space
= current_space();
348 if(ipc_port_translate_receive(space
, CAST_MACH_PORT_TO_NAME(trigger_name
),
349 &trigger_port
) != KERN_SUCCESS
)
355 extern int uiomove64(addr64_t
, int, void *);
359 memory_object_control_uiomove(
360 memory_object_control_t control
,
361 memory_object_offset_t offset
,
376 vm_page_t page_run
[MAX_RUN
];
378 object
= memory_object_control_to_vm_object(control
);
379 if (object
== VM_OBJECT_NULL
) {
382 assert(!object
->internal
);
384 vm_object_lock(object
);
386 if (mark_dirty
&& object
->copy
!= VM_OBJECT_NULL
) {
388 * We can't modify the pages without honoring
389 * copy-on-write obligations first, so fall off
390 * this optimized path and fall back to the regular
393 vm_object_unlock(object
);
396 orig_offset
= start_offset
;
398 while (io_requested
&& retval
== 0) {
400 cur_needed
= (start_offset
+ io_requested
+ (PAGE_SIZE
- 1)) / PAGE_SIZE
;
402 if (cur_needed
> MAX_RUN
)
403 cur_needed
= MAX_RUN
;
405 for (cur_run
= 0; cur_run
< cur_needed
; ) {
407 if ((dst_page
= vm_page_lookup(object
, offset
)) == VM_PAGE_NULL
)
411 * if we're in this routine, we are inside a filesystem's
412 * locking model, so we don't ever want to wait for pages that have
413 * list_req_pending == TRUE since it means that the
414 * page is a candidate for some type of I/O operation,
415 * but that it has not yet been gathered into a UPL...
416 * this implies that it is still outside the domain
417 * of the filesystem and that whoever is responsible for
418 * grabbing it into a UPL may be stuck behind the filesystem
419 * lock this thread owns, or trying to take a lock exclusively
420 * and waiting for the readers to drain from a rw lock...
421 * if we block in those cases, we will deadlock
423 if (dst_page
->list_req_pending
) {
425 if (dst_page
->absent
) {
427 * this is the list_req_pending | absent | busy case
428 * which originates from vm_fault_page... we want
429 * to fall out of the fast path and go back
430 * to the caller which will gather this page
431 * into a UPL and issue the I/O if no one
432 * else beats us to it
436 if (dst_page
->pageout
|| dst_page
->cleaning
) {
438 * this is the list_req_pending | pageout | busy case
439 * or the list_req_pending | cleaning case...
440 * which originate from the pageout_scan and
441 * msync worlds for the pageout case and the hibernate
442 * pre-cleaning world for the cleaning case...
443 * we need to reset the state of this page to indicate
444 * it should stay in the cache marked dirty... nothing else we
445 * can do at this point... we can't block on it, we can't busy
446 * it and we can't clean it from this routine.
448 vm_page_lockspin_queues();
450 vm_pageout_queue_steal(dst_page
, TRUE
);
451 vm_page_deactivate(dst_page
);
453 vm_page_unlock_queues();
456 * this is the list_req_pending | cleaning case...
457 * we can go ahead and deal with this page since
458 * its ok for us to mark this page busy... if a UPL
459 * tries to gather this page, it will block until the
460 * busy is cleared, thus allowing us safe use of the page
461 * when we're done with it, we will clear busy and wake
462 * up anyone waiting on it, thus allowing the UPL creation
466 } else if (dst_page
->busy
|| dst_page
->cleaning
) {
468 * someone else is playing with the page... if we've
469 * already collected pages into this run, go ahead
470 * and process now, we can't block on this
471 * page while holding other pages in the BUSY state
472 * otherwise we will wait
476 PAGE_SLEEP(object
, dst_page
, THREAD_UNINT
);
481 * this routine is only called when copying
482 * to/from real files... no need to consider
483 * encrypted swap pages
485 assert(!dst_page
->encrypted
);
488 dst_page
->dirty
= TRUE
;
489 if (dst_page
->cs_validated
&&
490 !dst_page
->cs_tainted
) {
493 * We're modifying a code-signed
494 * page: force revalidate
496 dst_page
->cs_validated
= FALSE
;
497 #if DEVELOPMENT || DEBUG
498 vm_cs_validated_resets
++;
500 pmap_disconnect(dst_page
->phys_page
);
503 dst_page
->busy
= TRUE
;
505 page_run
[cur_run
++] = dst_page
;
507 offset
+= PAGE_SIZE_64
;
511 * we hit a 'hole' in the cache or
512 * a page we don't want to try to handle,
513 * so bail at this point
514 * we'll unlock the object below
517 vm_object_unlock(object
);
519 for (i
= 0; i
< cur_run
; i
++) {
521 dst_page
= page_run
[i
];
523 if ((xsize
= PAGE_SIZE
- start_offset
) > io_requested
)
524 xsize
= io_requested
;
526 if ( (retval
= uiomove64((addr64_t
)(((addr64_t
)(dst_page
->phys_page
) << 12) + start_offset
), xsize
, uio
)) )
529 io_requested
-= xsize
;
532 vm_object_lock(object
);
535 * if we have more than 1 page to work on
536 * in the current run, or the original request
537 * started at offset 0 of the page, or we're
538 * processing multiple batches, we will move
539 * the pages to the tail of the inactive queue
540 * to implement an LRU for read/write accesses
542 * the check for orig_offset == 0 is there to
543 * mitigate the cost of small (< page_size) requests
544 * to the same page (this way we only move it once)
546 if (take_reference
&& (cur_run
> 1 || orig_offset
== 0)) {
548 vm_page_lockspin_queues();
550 for (i
= 0; i
< cur_run
; i
++)
551 vm_page_lru(page_run
[i
]);
553 vm_page_unlock_queues();
555 for (i
= 0; i
< cur_run
; i
++) {
556 dst_page
= page_run
[i
];
559 * someone is explicitly referencing this page...
560 * update clustered and speculative state
563 VM_PAGE_CONSUME_CLUSTERED(dst_page
);
565 PAGE_WAKEUP_DONE(dst_page
);
569 vm_object_unlock(object
);
579 vnode_pager_bootstrap(void)
581 register vm_size_t size
;
583 size
= (vm_size_t
) sizeof(struct vnode_pager
);
584 vnode_pager_zone
= zinit(size
, (vm_size_t
) MAX_VNODE
*size
,
585 PAGE_SIZE
, "vnode pager structures");
586 zone_change(vnode_pager_zone
, Z_CALLERACCT
, FALSE
);
587 zone_change(vnode_pager_zone
, Z_NOENCRYPT
, TRUE
);
590 #if CONFIG_CODE_DECRYPTION
591 apple_protect_pager_bootstrap();
592 #endif /* CONFIG_CODE_DECRYPTION */
593 swapfile_pager_bootstrap();
603 __unused memory_object_t pager
)
605 vnode_pager_t vnode_object
;
607 vnode_object
= vnode_object_create(vp
);
608 if (vnode_object
== VNODE_PAGER_NULL
)
609 panic("vnode_pager_setup: vnode_object_create() failed");
610 return((memory_object_t
)vnode_object
);
617 vnode_pager_init(memory_object_t mem_obj
,
618 memory_object_control_t control
,
622 memory_object_cluster_size_t pg_size
)
624 vnode_pager_t vnode_object
;
626 memory_object_attr_info_data_t attributes
;
629 PAGER_DEBUG(PAGER_ALL
, ("vnode_pager_init: %p, %p, %lx\n", mem_obj
, control
, (unsigned long)pg_size
));
631 if (control
== MEMORY_OBJECT_CONTROL_NULL
)
632 return KERN_INVALID_ARGUMENT
;
634 vnode_object
= vnode_pager_lookup(mem_obj
);
636 memory_object_control_reference(control
);
638 vnode_object
->control_handle
= control
;
640 attributes
.copy_strategy
= MEMORY_OBJECT_COPY_DELAY
;
641 /* attributes.cluster_size = (1 << (CLUSTER_SHIFT + PAGE_SHIFT));*/
642 attributes
.cluster_size
= (1 << (PAGE_SHIFT
));
643 attributes
.may_cache_object
= TRUE
;
644 attributes
.temporary
= TRUE
;
646 kr
= memory_object_change_attributes(
648 MEMORY_OBJECT_ATTRIBUTE_INFO
,
649 (memory_object_info_t
) &attributes
,
650 MEMORY_OBJECT_ATTR_INFO_COUNT
);
651 if (kr
!= KERN_SUCCESS
)
652 panic("vnode_pager_init: memory_object_change_attributes() failed");
654 return(KERN_SUCCESS
);
661 vnode_pager_data_return(
662 memory_object_t mem_obj
,
663 memory_object_offset_t offset
,
664 memory_object_cluster_size_t data_cnt
,
665 memory_object_offset_t
*resid_offset
,
667 __unused boolean_t dirty
,
668 __unused boolean_t kernel_copy
,
671 register vnode_pager_t vnode_object
;
673 vnode_object
= vnode_pager_lookup(mem_obj
);
675 vnode_pager_cluster_write(vnode_object
, offset
, data_cnt
, resid_offset
, io_error
, upl_flags
);
681 vnode_pager_data_initialize(
682 __unused memory_object_t mem_obj
,
683 __unused memory_object_offset_t offset
,
684 __unused memory_object_cluster_size_t data_cnt
)
686 panic("vnode_pager_data_initialize");
691 vnode_pager_data_unlock(
692 __unused memory_object_t mem_obj
,
693 __unused memory_object_offset_t offset
,
694 __unused memory_object_size_t size
,
695 __unused vm_prot_t desired_access
)
701 vnode_pager_get_isinuse(
702 memory_object_t mem_obj
,
705 vnode_pager_t vnode_object
;
707 if (mem_obj
->mo_pager_ops
!= &vnode_pager_ops
) {
709 return KERN_INVALID_ARGUMENT
;
712 vnode_object
= vnode_pager_lookup(mem_obj
);
714 *isinuse
= vnode_pager_isinuse(vnode_object
->vnode_handle
);
719 vnode_pager_check_hard_throttle(
720 memory_object_t mem_obj
,
722 uint32_t hard_throttle
)
724 vnode_pager_t vnode_object
;
726 if (mem_obj
->mo_pager_ops
!= &vnode_pager_ops
)
727 return KERN_INVALID_ARGUMENT
;
729 vnode_object
= vnode_pager_lookup(mem_obj
);
731 (void)vnode_pager_return_hard_throttle_limit(vnode_object
->vnode_handle
, limit
, hard_throttle
);
736 vnode_pager_get_isSSD(
737 memory_object_t mem_obj
,
740 vnode_pager_t vnode_object
;
742 if (mem_obj
->mo_pager_ops
!= &vnode_pager_ops
)
743 return KERN_INVALID_ARGUMENT
;
745 vnode_object
= vnode_pager_lookup(mem_obj
);
747 *isSSD
= vnode_pager_isSSD(vnode_object
->vnode_handle
);
752 vnode_pager_get_object_size(
753 memory_object_t mem_obj
,
754 memory_object_offset_t
*length
)
756 vnode_pager_t vnode_object
;
758 if (mem_obj
->mo_pager_ops
!= &vnode_pager_ops
) {
760 return KERN_INVALID_ARGUMENT
;
763 vnode_object
= vnode_pager_lookup(mem_obj
);
765 *length
= vnode_pager_get_filesize(vnode_object
->vnode_handle
);
770 vnode_pager_get_object_pathname(
771 memory_object_t mem_obj
,
775 vnode_pager_t vnode_object
;
777 if (mem_obj
->mo_pager_ops
!= &vnode_pager_ops
) {
778 return KERN_INVALID_ARGUMENT
;
781 vnode_object
= vnode_pager_lookup(mem_obj
);
783 return vnode_pager_get_pathname(vnode_object
->vnode_handle
,
789 vnode_pager_get_object_filename(
790 memory_object_t mem_obj
,
791 const char **filename
)
793 vnode_pager_t vnode_object
;
795 if (mem_obj
->mo_pager_ops
!= &vnode_pager_ops
) {
796 return KERN_INVALID_ARGUMENT
;
799 vnode_object
= vnode_pager_lookup(mem_obj
);
801 return vnode_pager_get_filename(vnode_object
->vnode_handle
,
806 vnode_pager_get_object_cs_blobs(
807 memory_object_t mem_obj
,
810 vnode_pager_t vnode_object
;
812 if (mem_obj
== MEMORY_OBJECT_NULL
||
813 mem_obj
->mo_pager_ops
!= &vnode_pager_ops
) {
814 return KERN_INVALID_ARGUMENT
;
817 vnode_object
= vnode_pager_lookup(mem_obj
);
819 return vnode_pager_get_cs_blobs(vnode_object
->vnode_handle
,
823 #if CHECK_CS_VALIDATION_BITMAP
825 vnode_pager_cs_check_validation_bitmap(
826 memory_object_t mem_obj
,
827 memory_object_offset_t offset
,
830 vnode_pager_t vnode_object
;
832 if (mem_obj
== MEMORY_OBJECT_NULL
||
833 mem_obj
->mo_pager_ops
!= &vnode_pager_ops
) {
834 return KERN_INVALID_ARGUMENT
;
837 vnode_object
= vnode_pager_lookup(mem_obj
);
838 return ubc_cs_check_validation_bitmap( vnode_object
->vnode_handle
, offset
, optype
);
840 #endif /* CHECK_CS_VALIDATION_BITMAP */
846 vnode_pager_data_request(
847 memory_object_t mem_obj
,
848 memory_object_offset_t offset
,
849 __unused memory_object_cluster_size_t length
,
850 __unused vm_prot_t desired_access
,
851 memory_object_fault_info_t fault_info
)
853 vnode_pager_t vnode_object
;
854 memory_object_offset_t base_offset
;
856 uint32_t io_streaming
= 0;
858 vnode_object
= vnode_pager_lookup(mem_obj
);
860 size
= MAX_UPL_TRANSFER
* PAGE_SIZE
;
861 base_offset
= offset
;
863 if (memory_object_cluster_size(vnode_object
->control_handle
, &base_offset
, &size
, &io_streaming
, fault_info
) != KERN_SUCCESS
)
866 assert(offset
>= base_offset
&&
867 offset
< base_offset
+ size
);
869 return vnode_pager_cluster_read(vnode_object
, base_offset
, offset
, io_streaming
, size
);
876 vnode_pager_reference(
877 memory_object_t mem_obj
)
879 register vnode_pager_t vnode_object
;
880 unsigned int new_ref_count
;
882 vnode_object
= vnode_pager_lookup(mem_obj
);
883 new_ref_count
= hw_atomic_add(&vnode_object
->ref_count
, 1);
884 assert(new_ref_count
> 1);
891 vnode_pager_deallocate(
892 memory_object_t mem_obj
)
894 register vnode_pager_t vnode_object
;
896 PAGER_DEBUG(PAGER_ALL
, ("vnode_pager_deallocate: %p\n", mem_obj
));
898 vnode_object
= vnode_pager_lookup(mem_obj
);
900 if (hw_atomic_sub(&vnode_object
->ref_count
, 1) == 0) {
901 if (vnode_object
->vnode_handle
!= NULL
) {
902 vnode_pager_vrele(vnode_object
->vnode_handle
);
904 zfree(vnode_pager_zone
, vnode_object
);
913 vnode_pager_terminate(
917 memory_object_t mem_obj
)
919 PAGER_DEBUG(PAGER_ALL
, ("vnode_pager_terminate: %p\n", mem_obj
));
921 return(KERN_SUCCESS
);
928 vnode_pager_synchronize(
929 memory_object_t mem_obj
,
930 memory_object_offset_t offset
,
931 memory_object_size_t length
,
932 __unused vm_sync_t sync_flags
)
934 register vnode_pager_t vnode_object
;
936 PAGER_DEBUG(PAGER_ALL
, ("vnode_pager_synchronize: %p\n", mem_obj
));
938 vnode_object
= vnode_pager_lookup(mem_obj
);
940 memory_object_synchronize_completed(vnode_object
->control_handle
, offset
, length
);
942 return (KERN_SUCCESS
);
950 memory_object_t mem_obj
,
953 vnode_pager_t vnode_object
;
957 PAGER_DEBUG(PAGER_ALL
, ("vnode_pager_map: %p %x\n", mem_obj
, prot
));
959 vnode_object
= vnode_pager_lookup(mem_obj
);
961 ret
= ubc_map(vnode_object
->vnode_handle
, prot
);
973 vnode_pager_last_unmap(
974 memory_object_t mem_obj
)
976 register vnode_pager_t vnode_object
;
978 PAGER_DEBUG(PAGER_ALL
, ("vnode_pager_last_unmap: %p\n", mem_obj
));
980 vnode_object
= vnode_pager_lookup(mem_obj
);
982 ubc_unmap(vnode_object
->vnode_handle
);
992 vnode_pager_cluster_write(
993 vnode_pager_t vnode_object
,
994 vm_object_offset_t offset
,
996 vm_object_offset_t
* resid_offset
,
1003 if (upl_flags
& UPL_MSYNC
) {
1005 upl_flags
|= UPL_VNODE_PAGER
;
1007 if ( (upl_flags
& UPL_IOSYNC
) && io_error
)
1008 upl_flags
|= UPL_KEEPCACHED
;
1011 size
= (cnt
< (PAGE_SIZE
* MAX_UPL_TRANSFER
)) ? cnt
: (PAGE_SIZE
* MAX_UPL_TRANSFER
); /* effective max */
1013 assert((upl_size_t
) size
== size
);
1014 vnode_pageout(vnode_object
->vnode_handle
,
1015 NULL
, (upl_offset_t
)0, offset
, (upl_size_t
)size
, upl_flags
, &errno
);
1017 if ( (upl_flags
& UPL_KEEPCACHED
) ) {
1018 if ( (*io_error
= errno
) )
1025 *resid_offset
= offset
;
1028 vm_object_offset_t vnode_size
;
1029 vm_object_offset_t base_offset
;
1032 * this is the pageout path
1034 vnode_size
= vnode_pager_get_filesize(vnode_object
->vnode_handle
);
1036 if (vnode_size
> (offset
+ PAGE_SIZE
)) {
1038 * preset the maximum size of the cluster
1039 * and put us on a nice cluster boundary...
1040 * and then clip the size to insure we
1041 * don't request past the end of the underlying file
1043 size
= PAGE_SIZE
* MAX_UPL_TRANSFER
;
1044 base_offset
= offset
& ~((signed)(size
- 1));
1046 if ((base_offset
+ size
) > vnode_size
)
1047 size
= round_page(((vm_size_t
)(vnode_size
- base_offset
)));
1050 * we've been requested to page out a page beyond the current
1051 * end of the 'file'... don't try to cluster in this case...
1052 * we still need to send this page through because it might
1053 * be marked precious and the underlying filesystem may need
1054 * to do something with it (besides page it out)...
1056 base_offset
= offset
;
1059 assert((upl_size_t
) size
== size
);
1060 vnode_pageout(vnode_object
->vnode_handle
,
1061 NULL
, (upl_offset_t
)(offset
- base_offset
), base_offset
, (upl_size_t
) size
, UPL_VNODE_PAGER
, NULL
);
1070 vnode_pager_cluster_read(
1071 vnode_pager_t vnode_object
,
1072 vm_object_offset_t base_offset
,
1073 vm_object_offset_t offset
,
1074 uint32_t io_streaming
,
1077 int local_error
= 0;
1081 assert(! (cnt
& PAGE_MASK
));
1084 flags
|= UPL_IOSTREAMING
;
1086 assert((upl_size_t
) cnt
== cnt
);
1087 kret
= vnode_pagein(vnode_object
->vnode_handle
,
1089 (upl_offset_t
) (offset
- base_offset
),
1095 if(kret == PAGER_ABSENT) {
1096 Need to work out the defs here, 1 corresponds to PAGER_ABSENT
1097 defined in bsd/vm/vm_pager.h However, we should not be including
1098 that file here it is a layering violation.
1103 unsigned int count
= 0;
1106 uplflags
= (UPL_NO_SYNC
|
1107 UPL_CLEAN_IN_PLACE
|
1110 assert((upl_size_t
) cnt
== cnt
);
1111 kr
= memory_object_upl_request(vnode_object
->control_handle
,
1112 base_offset
, (upl_size_t
) cnt
,
1113 &upl
, NULL
, &count
, uplflags
);
1114 if (kr
== KERN_SUCCESS
) {
1116 upl_deallocate(upl
);
1119 * We couldn't gather the page list, probably
1120 * because the memory object doesn't have a link
1121 * to a VM object anymore (forced unmount, for
1122 * example). Just return an error to the vm_fault()
1123 * path and let it handle it.
1127 return KERN_FAILURE
;
1130 return KERN_SUCCESS
;
1139 vnode_pager_release_from_cache(
1142 memory_object_free_from_cache(
1143 &realhost
, &vnode_pager_ops
, cnt
);
1150 vnode_object_create(
1153 register vnode_pager_t vnode_object
;
1155 vnode_object
= (struct vnode_pager
*) zalloc(vnode_pager_zone
);
1156 if (vnode_object
== VNODE_PAGER_NULL
)
1157 return(VNODE_PAGER_NULL
);
1160 * The vm_map call takes both named entry ports and raw memory
1161 * objects in the same parameter. We need to make sure that
1162 * vm_map does not see this object as a named entry port. So,
1163 * we reserve the first word in the object for a fake ip_kotype
1164 * setting - that will tell vm_map to use it as a memory object.
1166 vnode_object
->pager_ops
= &vnode_pager_ops
;
1167 vnode_object
->pager_ikot
= IKOT_MEMORY_OBJECT
;
1168 vnode_object
->ref_count
= 1;
1169 vnode_object
->control_handle
= MEMORY_OBJECT_CONTROL_NULL
;
1170 vnode_object
->vnode_handle
= vp
;
1172 return(vnode_object
);
1180 memory_object_t name
)
1182 vnode_pager_t vnode_object
;
1184 vnode_object
= (vnode_pager_t
)name
;
1185 assert(vnode_object
->pager_ops
== &vnode_pager_ops
);
1186 return (vnode_object
);
1190 /*********************** proc_info implementation *************/
1192 #include <sys/bsdtask_info.h>
1194 static int fill_vnodeinfoforaddr( vm_map_entry_t entry
, uintptr_t * vnodeaddr
, uint32_t * vid
);
1198 fill_procregioninfo(task_t task
, uint64_t arg
, struct proc_regioninfo_internal
*pinfo
, uintptr_t *vnodeaddr
, uint32_t *vid
)
1202 vm_map_offset_t address
= (vm_map_offset_t
)arg
;
1203 vm_map_entry_t tmp_entry
;
1204 vm_map_entry_t entry
;
1205 vm_map_offset_t start
;
1206 vm_region_extended_info_data_t extended
;
1207 vm_region_top_info_data_t top
;
1211 if (map
== VM_MAP_NULL
)
1216 vm_map_reference(map
);
1219 vm_map_lock_read(map
);
1222 if (!vm_map_lookup_entry(map
, start
, &tmp_entry
)) {
1223 if ((entry
= tmp_entry
->vme_next
) == vm_map_to_entry(map
)) {
1224 vm_map_unlock_read(map
);
1225 vm_map_deallocate(map
);
1232 start
= entry
->vme_start
;
1234 pinfo
->pri_offset
= entry
->offset
;
1235 pinfo
->pri_protection
= entry
->protection
;
1236 pinfo
->pri_max_protection
= entry
->max_protection
;
1237 pinfo
->pri_inheritance
= entry
->inheritance
;
1238 pinfo
->pri_behavior
= entry
->behavior
;
1239 pinfo
->pri_user_wired_count
= entry
->user_wired_count
;
1240 pinfo
->pri_user_tag
= entry
->alias
;
1242 if (entry
->is_sub_map
) {
1243 pinfo
->pri_flags
|= PROC_REGION_SUBMAP
;
1245 if (entry
->is_shared
)
1246 pinfo
->pri_flags
|= PROC_REGION_SHARED
;
1250 extended
.protection
= entry
->protection
;
1251 extended
.user_tag
= entry
->alias
;
1252 extended
.pages_resident
= 0;
1253 extended
.pages_swapped_out
= 0;
1254 extended
.pages_shared_now_private
= 0;
1255 extended
.pages_dirtied
= 0;
1256 extended
.external_pager
= 0;
1257 extended
.shadow_depth
= 0;
1259 vm_map_region_walk(map
, start
, entry
, entry
->offset
, entry
->vme_end
- start
, &extended
);
1261 if (extended
.external_pager
&& extended
.ref_count
== 2 && extended
.share_mode
== SM_SHARED
)
1262 extended
.share_mode
= SM_PRIVATE
;
1264 top
.private_pages_resident
= 0;
1265 top
.shared_pages_resident
= 0;
1266 vm_map_region_top_walk(entry
, &top
);
1269 pinfo
->pri_pages_resident
= extended
.pages_resident
;
1270 pinfo
->pri_pages_shared_now_private
= extended
.pages_shared_now_private
;
1271 pinfo
->pri_pages_swapped_out
= extended
.pages_swapped_out
;
1272 pinfo
->pri_pages_dirtied
= extended
.pages_dirtied
;
1273 pinfo
->pri_ref_count
= extended
.ref_count
;
1274 pinfo
->pri_shadow_depth
= extended
.shadow_depth
;
1275 pinfo
->pri_share_mode
= extended
.share_mode
;
1277 pinfo
->pri_private_pages_resident
= top
.private_pages_resident
;
1278 pinfo
->pri_shared_pages_resident
= top
.shared_pages_resident
;
1279 pinfo
->pri_obj_id
= top
.obj_id
;
1281 pinfo
->pri_address
= (uint64_t)start
;
1282 pinfo
->pri_size
= (uint64_t)(entry
->vme_end
- start
);
1283 pinfo
->pri_depth
= 0;
1285 if ((vnodeaddr
!= 0) && (entry
->is_sub_map
== 0)) {
1286 *vnodeaddr
= (uintptr_t)0;
1288 if (fill_vnodeinfoforaddr(entry
, vnodeaddr
, vid
) ==0) {
1289 vm_map_unlock_read(map
);
1290 vm_map_deallocate(map
);
1295 vm_map_unlock_read(map
);
1296 vm_map_deallocate(map
);
1301 fill_vnodeinfoforaddr(
1302 vm_map_entry_t entry
,
1303 uintptr_t * vnodeaddr
,
1306 vm_object_t top_object
, object
;
1307 memory_object_t memory_object
;
1308 memory_object_pager_ops_t pager_ops
;
1313 if (entry
->is_sub_map
) {
1317 * The last object in the shadow chain has the
1318 * relevant pager information.
1320 top_object
= entry
->object
.vm_object
;
1321 if (top_object
== VM_OBJECT_NULL
) {
1322 object
= VM_OBJECT_NULL
;
1325 vm_object_lock(top_object
);
1326 for (object
= top_object
, shadow_depth
= 0;
1327 object
->shadow
!= VM_OBJECT_NULL
;
1328 object
= object
->shadow
, shadow_depth
++) {
1329 vm_object_lock(object
->shadow
);
1330 vm_object_unlock(object
);
1335 if (object
== VM_OBJECT_NULL
) {
1337 } else if (object
->internal
) {
1338 vm_object_unlock(object
);
1340 } else if (! object
->pager_ready
||
1341 object
->terminating
||
1343 vm_object_unlock(object
);
1346 memory_object
= object
->pager
;
1347 pager_ops
= memory_object
->mo_pager_ops
;
1348 if (pager_ops
== &vnode_pager_ops
) {
1349 kr
= vnode_pager_get_object_vnode(
1352 if (kr
!= KERN_SUCCESS
) {
1353 vm_object_unlock(object
);
1357 vm_object_unlock(object
);
1361 vm_object_unlock(object
);
1366 vnode_pager_get_object_vnode (
1367 memory_object_t mem_obj
,
1368 uintptr_t * vnodeaddr
,
1371 vnode_pager_t vnode_object
;
1373 vnode_object
= vnode_pager_lookup(mem_obj
);
1374 if (vnode_object
->vnode_handle
) {
1375 *vnodeaddr
= (uintptr_t)vnode_object
->vnode_handle
;
1376 *vid
= (uint32_t)vnode_vid((void *)vnode_object
->vnode_handle
);
1378 return(KERN_SUCCESS
);
1381 return(KERN_FAILURE
);
1386 * Find the underlying vnode object for the given vm_map_entry. If found, return with the
1387 * object locked, otherwise return NULL with nothing locked.
1392 vm_map_entry_t entry
1395 vm_object_t top_object
, object
;
1396 memory_object_t memory_object
;
1397 memory_object_pager_ops_t pager_ops
;
1399 if (!entry
->is_sub_map
) {
1402 * The last object in the shadow chain has the
1403 * relevant pager information.
1406 top_object
= entry
->object
.vm_object
;
1409 vm_object_lock(top_object
);
1411 for (object
= top_object
; object
->shadow
!= VM_OBJECT_NULL
; object
= object
->shadow
) {
1412 vm_object_lock(object
->shadow
);
1413 vm_object_unlock(object
);
1416 if (object
&& !object
->internal
&& object
->pager_ready
&& !object
->terminating
&&
1418 memory_object
= object
->pager
;
1419 pager_ops
= memory_object
->mo_pager_ops
;
1422 * If this object points to the vnode_pager_ops, then we found what we're
1423 * looking for. Otherwise, this vm_map_entry doesn't have an underlying
1424 * vnode and so we fall through to the bottom and return NULL.
1427 if (pager_ops
== &vnode_pager_ops
)
1428 return object
; /* we return with the object locked */
1431 vm_object_unlock(object
);
1436 return(VM_OBJECT_NULL
);