/*
 * Copyright (c) 2000-2013 Apple Inc. All rights reserved.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
 *
 * This file contains Original Code and/or Modifications of Original Code
 * as defined in and that are subject to the Apple Public Source License
 * Version 2.0 (the 'License'). You may not use this file except in
 * compliance with the License. The rights granted to you under the License
 * may not be used to create, or enable the creation or redistribution of,
 * unlawful or unlicensed copies of an Apple operating system, or to
 * circumvent, violate, or enable the circumvention or violation of, any
 * terms of an Apple operating system software license agreement.
 *
 * Please obtain a copy of the License at
 * http://www.opensource.apple.com/apsl/ and read it before using this file.
 *
 * The Original Code and all software distributed under the License are
 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
 * Please see the License for the specific language governing rights and
 * limitations under the License.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
 */
#include "vm_compressor_backing_store.h"
#include <vm/vm_pageout.h>
#include <vm/vm_protos.h>

#include <IOKit/IOHibernatePrivate.h>

#include <kern/policy_internal.h>
boolean_t compressor_store_stop_compaction = FALSE;
boolean_t vm_swapfile_create_needed = FALSE;
boolean_t vm_swapfile_gc_needed = FALSE;

int vm_swapper_throttle = -1;
uint64_t vm_swapout_thread_id;

uint64_t vm_swap_put_failures = 0;              /* Likely failed I/O. Data is still in memory. */
uint64_t vm_swap_get_failures = 0;              /* Fatal */
uint64_t vm_swap_put_failures_no_swap_file = 0; /* Possibly not fatal because we might just need a new swapfile. */
int vm_num_swap_files_config = 0;
int vm_num_swap_files = 0;
int vm_num_pinned_swap_files = 0;
int vm_swapout_thread_processed_segments = 0;
int vm_swapout_thread_awakened = 0;
int vm_swapfile_create_thread_awakened = 0;
int vm_swapfile_create_thread_running = 0;
int vm_swapfile_gc_thread_awakened = 0;
int vm_swapfile_gc_thread_running = 0;

int64_t vm_swappin_avail = 0;
boolean_t vm_swappin_enabled = FALSE;
unsigned int vm_swapfile_total_segs_alloced = 0;
unsigned int vm_swapfile_total_segs_used = 0;

char swapfilename[MAX_SWAPFILENAME_LEN + 1] = SWAP_FILE_NAME;

extern vm_map_t compressor_map;
#define SWAP_READY      0x1     /* Swap file is ready to be used */
#define SWAP_RECLAIM    0x2     /* Swap file is marked to be reclaimed */
#define SWAP_WANTED     0x4     /* Swap file has waiters */
#define SWAP_REUSE      0x8     /* Swap file is on the Q and has a name. Reuse after init-ing.*/
#define SWAP_PINNED     0x10    /* Swap file is pinned (FusionDrive) */
struct swapfile {
    queue_head_t      swp_queue;        /* list of swap files */
    char              *swp_path;        /* saved pathname of swap file */
    struct vnode      *swp_vp;          /* backing vnode */
    uint64_t          swp_size;         /* size of this swap file */
    uint8_t           *swp_bitmap;      /* bitmap showing the alloced/freed slots in the swap file */
    unsigned int      swp_pathlen;      /* length of pathname */
    unsigned int      swp_nsegs;        /* #segments we can use */
    unsigned int      swp_nseginuse;    /* #segments in use */
    unsigned int      swp_index;        /* index of this swap file */
    unsigned int      swp_flags;        /* state of swap file */
    unsigned int      swp_free_hint;    /* offset of 1st free chunk */
    unsigned int      swp_io_count;     /* count of outstanding I/Os */
    c_segment_t       *swp_csegs;       /* back pointers to the c_segments. Used during swap reclaim. */

    struct trim_list  *swp_delayed_trim_list_head;
    unsigned int      swp_delayed_trim_count;
};

queue_head_t swf_global_queue;
boolean_t    swp_trim_supported = FALSE;
extern clock_sec_t dont_trim_until_ts;
clock_sec_t vm_swapfile_last_failed_to_create_ts = 0;
clock_sec_t vm_swapfile_last_successful_create_ts = 0;
int vm_swapfile_can_be_created = FALSE;
boolean_t delayed_trim_handling_in_progress = FALSE;

boolean_t hibernate_in_progress_with_pinned_swap = FALSE;
static void vm_swapout_thread_throttle_adjust(void);
static void vm_swap_free_now(struct swapfile *swf, uint64_t f_offset);
static void vm_swapout_thread(void);
static void vm_swapfile_create_thread(void);
static void vm_swapfile_gc_thread(void);
static void vm_swap_defragment(void);
static void vm_swap_handle_delayed_trims(boolean_t);
static void vm_swap_do_delayed_trim(struct swapfile *);
static void vm_swap_wait_on_trim_handling_in_progress(void);

boolean_t vm_swap_force_defrag = FALSE, vm_swap_force_reclaim = FALSE;
#if CONFIG_EMBEDDED

#if DEVELOPMENT || DEBUG
#define VM_MAX_SWAP_FILE_NUM            100
#else /* DEVELOPMENT || DEBUG */
#define VM_MAX_SWAP_FILE_NUM            5
#endif /* DEVELOPMENT || DEBUG */

#define VM_SWAPFILE_DELAYED_TRIM_MAX    4

#define VM_SWAP_SHOULD_DEFRAGMENT()     (((vm_swap_force_defrag == TRUE) || (c_swappedout_sparse_count > (vm_swapfile_total_segs_used / 16))) ? 1 : 0)
#define VM_SWAP_SHOULD_PIN(_size)       FALSE
#define VM_SWAP_SHOULD_CREATE(cur_ts)   ((vm_num_swap_files < vm_num_swap_files_config) && ((vm_swapfile_total_segs_alloced - vm_swapfile_total_segs_used) < (unsigned int)VM_SWAPFILE_HIWATER_SEGS) && \
                                         ((cur_ts - vm_swapfile_last_failed_to_create_ts) > VM_SWAPFILE_DELAYED_CREATE) ? 1 : 0)
#define VM_SWAP_SHOULD_TRIM(swf)        ((swf->swp_delayed_trim_count >= VM_SWAPFILE_DELAYED_TRIM_MAX) ? 1 : 0)

#else /* CONFIG_EMBEDDED */

#define VM_MAX_SWAP_FILE_NUM            100
#define VM_SWAPFILE_DELAYED_TRIM_MAX    128

#define VM_SWAP_SHOULD_DEFRAGMENT()     (((vm_swap_force_defrag == TRUE) || (c_swappedout_sparse_count > (vm_swapfile_total_segs_used / 4))) ? 1 : 0)
#define VM_SWAP_SHOULD_PIN(_size)       (vm_swappin_avail > 0 && vm_swappin_avail >= (int64_t)(_size))
#define VM_SWAP_SHOULD_CREATE(cur_ts)   ((vm_num_swap_files < vm_num_swap_files_config) && ((vm_swapfile_total_segs_alloced - vm_swapfile_total_segs_used) < (unsigned int)VM_SWAPFILE_HIWATER_SEGS) && \
                                         ((cur_ts - vm_swapfile_last_failed_to_create_ts) > VM_SWAPFILE_DELAYED_CREATE) ? 1 : 0)
#define VM_SWAP_SHOULD_TRIM(swf)        ((swf->swp_delayed_trim_count >= VM_SWAPFILE_DELAYED_TRIM_MAX) ? 1 : 0)

#endif /* CONFIG_EMBEDDED */

#define VM_SWAP_SHOULD_RECLAIM()        (((vm_swap_force_reclaim == TRUE) || ((vm_swapfile_total_segs_alloced - vm_swapfile_total_segs_used) >= SWAPFILE_RECLAIM_THRESHOLD_SEGS)) ? 1 : 0)
#define VM_SWAP_SHOULD_ABORT_RECLAIM()  (((vm_swap_force_reclaim == FALSE) && ((vm_swapfile_total_segs_alloced - vm_swapfile_total_segs_used) <= SWAPFILE_RECLAIM_MINIMUM_SEGS)) ? 1 : 0)
#define VM_SWAPFILE_DELAYED_CREATE      15

#define VM_SWAP_BUSY()  ((c_swapout_count && (vm_swapper_throttle == THROTTLE_LEVEL_COMPRESSOR_TIER0)) ? 1 : 0)
#if CHECKSUM_THE_SWAP
extern unsigned int hash_string(char *cp, int len);
#endif
#if RECORD_THE_COMPRESSED_DATA
boolean_t c_compressed_record_init_done = FALSE;
int       c_compressed_record_write_error = 0;
struct vnode *c_compressed_record_vp = NULL;
uint64_t  c_compressed_record_file_offset = 0;
void c_compressed_record_init(void);
void c_compressed_record_write(char *, int);
#endif
extern void vm_pageout_io_throttle(void);

static struct swapfile *vm_swapfile_for_handle(uint64_t);
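
/*
 * A swap "handle" packs both the owning swapfile and the location within it
 * into a single 64-bit value: the swapfile index lives in the bits above
 * SWAP_DEVICE_SHIFT and the byte offset of the segment's chunk lives in the
 * low bits covered by SWAP_SLOT_MASK.  vm_swap_put() builds handles as
 * (swapfile_index << SWAP_DEVICE_SHIFT) | file_offset, and
 * vm_swapfile_for_handle() below unpacks them to find the backing swapfile.
 */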
/*
 * Called with the vm_swap_data_lock held.
 */
static struct swapfile *
vm_swapfile_for_handle(uint64_t f_offset)
{
    uint64_t file_offset = 0;
    unsigned int swapfile_index = 0;
    struct swapfile *swf = NULL;

    file_offset = (f_offset & SWAP_SLOT_MASK);
    swapfile_index = (f_offset >> SWAP_DEVICE_SHIFT);

    swf = (struct swapfile *) queue_first(&swf_global_queue);

    while (queue_end(&swf_global_queue, (queue_entry_t)swf) == FALSE) {
        if (swapfile_index == swf->swp_index) {
            break;
        }
        swf = (struct swapfile *) queue_next(&swf->swp_queue);
    }

    if (queue_end(&swf_global_queue, (queue_entry_t) swf)) {
        swf = NULL;
    }
    return swf;
}
#if ENCRYPTED_SWAP

#include <libkern/crypto/aesxts.h>

extern int cc_rand_generate(void *, size_t);     /* from libkern/crypto/rand.h */

boolean_t swap_crypt_initialized;
void swap_crypt_initialize(void);

symmetric_xts xts_modectx;
uint32_t      swap_crypt_key1[8];   /* big enough for a 256 bit random key */
uint32_t      swap_crypt_key2[8];   /* big enough for a 256 bit random key */

#if DEVELOPMENT || DEBUG
boolean_t     swap_crypt_xts_tested = FALSE;
unsigned char swap_crypt_test_page_ref[4096] __attribute__((aligned(4096)));
unsigned char swap_crypt_test_page_encrypt[4096] __attribute__((aligned(4096)));
unsigned char swap_crypt_test_page_decrypt[4096] __attribute__((aligned(4096)));
#endif /* DEVELOPMENT || DEBUG */

unsigned long vm_page_encrypt_counter;
unsigned long vm_page_decrypt_counter;
void
swap_crypt_initialize(void)
{
    uint8_t *enckey1, *enckey2;
    int keylen1, keylen2;
    int error;

    assert(swap_crypt_initialized == FALSE);

    keylen1 = sizeof(swap_crypt_key1);
    enckey1 = (uint8_t *)&swap_crypt_key1;
    keylen2 = sizeof(swap_crypt_key2);
    enckey2 = (uint8_t *)&swap_crypt_key2;

    error = cc_rand_generate((void *)enckey1, keylen1);
    assert(!error);

    error = cc_rand_generate((void *)enckey2, keylen2);
    assert(!error);

    error = xts_start(0, NULL, enckey1, keylen1, enckey2, keylen2, 0, 0, &xts_modectx);
    assert(!error);

    swap_crypt_initialized = TRUE;

#if DEVELOPMENT || DEBUG
    uint8_t *encptr;
    uint8_t *decptr;
    uint8_t *refptr;
    uint8_t *iv;
    uint64_t ivnum[2];
    int size = 0;
    int i = 0;
    int rc = 0;

    assert(swap_crypt_xts_tested == FALSE);

    /*
     * Validate the encryption algorithms.
     *
     * First initialize the test data.
     */
    for (i = 0; i < 4096; i++) {
        swap_crypt_test_page_ref[i] = (char) i;
    }
    ivnum[0] = (uint64_t)0xaa;
    ivnum[1] = 0;
    iv = (uint8_t *)ivnum;

    refptr = (uint8_t *)swap_crypt_test_page_ref;
    encptr = (uint8_t *)swap_crypt_test_page_encrypt;
    decptr = (uint8_t *)swap_crypt_test_page_decrypt;
    size = 4096;

    /* encrypt */
    rc = xts_encrypt(refptr, size, encptr, iv, &xts_modectx);
    assert(!rc);

    /* compare result with original - should NOT match */
    for (i = 0; i < 4096; i++) {
        if (swap_crypt_test_page_encrypt[i] !=
            swap_crypt_test_page_ref[i]) {
            break;
        }
    }
    assert(i != 4096);

    /* decrypt */
    rc = xts_decrypt(encptr, size, decptr, iv, &xts_modectx);
    assert(!rc);

    /* compare result with original */
    for (i = 0; i < 4096; i++) {
        if (swap_crypt_test_page_decrypt[i] !=
            swap_crypt_test_page_ref[i]) {
            panic("encryption test failed");
        }
    }
    /* encrypt in place */
    rc = xts_encrypt(decptr, size, decptr, iv, &xts_modectx);
    assert(!rc);

    /* decrypt in place */
    rc = xts_decrypt(decptr, size, decptr, iv, &xts_modectx);
    assert(!rc);

    for (i = 0; i < 4096; i++) {
        if (swap_crypt_test_page_decrypt[i] !=
            swap_crypt_test_page_ref[i]) {
            panic("in place encryption test failed");
        }
    }
    swap_crypt_xts_tested = TRUE;
#endif /* DEVELOPMENT || DEBUG */
}
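
/*
 * vm_swap_encrypt / vm_swap_decrypt transform a compressor segment's buffer
 * in place with AES-XTS before it is written to (and after it is read back
 * from) a swapfile.  The tweak ("iv") is derived from the c_segment_t
 * pointer itself, so each segment gets a distinct tweak, and the counters
 * above track how many page-sized units have been transformed.
 */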
void
vm_swap_encrypt(c_segment_t c_seg)
{
    uint8_t *ptr;
    int size = 0;
    int rc = 0;
    uint64_t ivnum[2];
    uint8_t *iv;

    if (swap_crypt_initialized == FALSE) {
        swap_crypt_initialize();
    }

#if DEVELOPMENT || DEBUG
    C_SEG_MAKE_WRITEABLE(c_seg);
#endif
    ptr = (uint8_t *)c_seg->c_store.c_buffer;
    size = round_page_32(C_SEG_OFFSET_TO_BYTES(c_seg->c_populated_offset));

    ivnum[0] = (uint64_t)c_seg;
    ivnum[1] = 0;
    iv = (uint8_t *)ivnum;

    rc = xts_encrypt(ptr, size, ptr, iv, &xts_modectx);
    assert(!rc);

    vm_page_encrypt_counter += (size / PAGE_SIZE_64);

#if DEVELOPMENT || DEBUG
    C_SEG_WRITE_PROTECT(c_seg);
#endif
}
void
vm_swap_decrypt(c_segment_t c_seg)
{
    uint8_t *ptr;
    int size = 0;
    int rc = 0;
    uint64_t ivnum[2];
    uint8_t *iv;

    assert(swap_crypt_initialized);

#if DEVELOPMENT || DEBUG
    C_SEG_MAKE_WRITEABLE(c_seg);
#endif
    ptr = (uint8_t *)c_seg->c_store.c_buffer;
    size = round_page_32(C_SEG_OFFSET_TO_BYTES(c_seg->c_populated_offset));

    ivnum[0] = (uint64_t)c_seg;
    ivnum[1] = 0;
    iv = (uint8_t *)ivnum;

    rc = xts_decrypt(ptr, size, ptr, iv, &xts_modectx);
    assert(!rc);

    vm_page_decrypt_counter += (size / PAGE_SIZE_64);

#if DEVELOPMENT || DEBUG
    C_SEG_WRITE_PROTECT(c_seg);
#endif
}
#endif /* ENCRYPTED_SWAP */
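
/*
 * vm_compressor_swap_init() brings the swap subsystem up: it initializes the
 * vm_swap_data lock and the global swapfile queue, then starts the three
 * worker threads (VM_swapout, VM_swapfile_create and VM_swapfile_gc) at
 * BASEPRI_VM.  The swapout thread's id is recorded so its I/O throttle tier
 * can be adjusted later, and it starts out at the passive TIER2 level.
 */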
void
vm_compressor_swap_init()
{
    thread_t thread = NULL;

    lck_grp_attr_setdefault(&vm_swap_data_lock_grp_attr);
    lck_grp_init(&vm_swap_data_lock_grp,
        "vm_swap_data",
        &vm_swap_data_lock_grp_attr);
    lck_attr_setdefault(&vm_swap_data_lock_attr);
    lck_mtx_init_ext(&vm_swap_data_lock,
        &vm_swap_data_lock_ext,
        &vm_swap_data_lock_grp,
        &vm_swap_data_lock_attr);

    queue_init(&swf_global_queue);

    if (kernel_thread_start_priority((thread_continue_t)vm_swapout_thread, NULL,
        BASEPRI_VM, &thread) != KERN_SUCCESS) {
        panic("vm_swapout_thread: create failed");
    }
    thread_set_thread_name(thread, "VM_swapout");
    vm_swapout_thread_id = thread->thread_id;

    thread_deallocate(thread);

    if (kernel_thread_start_priority((thread_continue_t)vm_swapfile_create_thread, NULL,
        BASEPRI_VM, &thread) != KERN_SUCCESS) {
        panic("vm_swapfile_create_thread: create failed");
    }
    thread_set_thread_name(thread, "VM_swapfile_create");
    thread_deallocate(thread);

    if (kernel_thread_start_priority((thread_continue_t)vm_swapfile_gc_thread, NULL,
        BASEPRI_VM, &thread) != KERN_SUCCESS) {
        panic("vm_swapfile_gc_thread: create failed");
    }
    thread_set_thread_name(thread, "VM_swapfile_gc");

    /*
     * Swapfile garbage collection will need to allocate memory
     * to complete its swap reclaim and in-memory compaction.
     * So allow it to dip into the reserved VM page pool.
     */
    thread_lock(thread);
    thread->options |= TH_OPT_VMPRIV;
    thread_unlock(thread);

    thread_deallocate(thread);

    proc_set_thread_policy_with_tid(kernel_task, thread->thread_id,
        TASK_POLICY_INTERNAL, TASK_POLICY_IO, THROTTLE_LEVEL_COMPRESSOR_TIER2);
    proc_set_thread_policy_with_tid(kernel_task, thread->thread_id,
        TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);

    /*
     * dummy value until the swap file gets created
     * when we drive the first c_segment_t to the
     * swapout queue... at that time we will
     * know the true size we have to work with
     */
    c_overage_swapped_limit = 16;

    vm_num_swap_files_config = VM_MAX_SWAP_FILE_NUM;

    printf("VM Swap Subsystem is ON\n");
}
#if RECORD_THE_COMPRESSED_DATA

void
c_compressed_record_init()
{
    if (c_compressed_record_init_done == FALSE) {
        vm_swapfile_open("/tmp/compressed_data", &c_compressed_record_vp);
        c_compressed_record_init_done = TRUE;
    }
}

void
c_compressed_record_write(char *buf, int size)
{
    if (c_compressed_record_write_error == 0) {
        c_compressed_record_write_error = vm_record_file_write(c_compressed_record_vp, c_compressed_record_file_offset, buf, size);
        c_compressed_record_file_offset += size;
    }
}
#endif
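
/*
 * vm_compaction_swapper_do_init() runs once, the first time swapping is
 * actually needed.  It opens swapfile 0 to probe the backing store: on a
 * rotational disk it lowers the minor/major compaction, unthrottle and
 * catchup divisors so swapping starts earlier, and it records how much
 * pinnable space the volume offers (vm_swappin_avail / vm_swappin_enabled)
 * for use by hibernation.
 */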
int compaction_swapper_inited = 0;

void
vm_compaction_swapper_do_init(void)
{
    struct vnode *vp;
    char *pathname;
    int namelen;

    if (compaction_swapper_inited) {
        return;
    }
    if (vm_compressor_mode != VM_PAGER_COMPRESSOR_WITH_SWAP) {
        compaction_swapper_inited = 1;
        return;
    }
    lck_mtx_lock(&vm_swap_data_lock);

    if (!compaction_swapper_inited) {
        namelen = (int)strlen(swapfilename) + SWAPFILENAME_INDEX_LEN + 1;
        pathname = (char *)kalloc(namelen);
        memset(pathname, 0, namelen);
        snprintf(pathname, namelen, "%s%d", swapfilename, 0);

        vm_swapfile_open(pathname, &vp);

        if (vp) {
            if (vnode_pager_isSSD(vp) == FALSE) {
                /*
                 * swap files live on an HDD, so let's make sure to start swapping
                 * much earlier since we're not worried about SSD write-wear and
                 * we have so little write bandwidth to work with...
                 * these values were derived experimentally by running the performance
                 * team's stock test for evaluating HDD performance against various
                 * combinations and looking at and comparing overall results.
                 * Note that the > relationship between these 4 values must be maintained.
                 */
                if (vm_compressor_minorcompact_threshold_divisor_overridden == 0) {
                    vm_compressor_minorcompact_threshold_divisor = 15;
                }
                if (vm_compressor_majorcompact_threshold_divisor_overridden == 0) {
                    vm_compressor_majorcompact_threshold_divisor = 18;
                }
                if (vm_compressor_unthrottle_threshold_divisor_overridden == 0) {
                    vm_compressor_unthrottle_threshold_divisor = 24;
                }
                if (vm_compressor_catchup_threshold_divisor_overridden == 0) {
                    vm_compressor_catchup_threshold_divisor = 30;
                }
            }
            vnode_setswapmount(vp);
            vm_swappin_avail = vnode_getswappin_avail(vp);

            if (vm_swappin_avail) {
                vm_swappin_enabled = TRUE;
            }
            vm_swapfile_close((uint64_t)pathname, vp);
        }
        kfree(pathname, namelen);

        compaction_swapper_inited = 1;
    }
    lck_mtx_unlock(&vm_swap_data_lock);
}
void
vm_swap_consider_defragmenting(int flags)
{
    boolean_t force_defrag = (flags & VM_SWAP_FLAGS_FORCE_DEFRAG);
    boolean_t force_reclaim = (flags & VM_SWAP_FLAGS_FORCE_RECLAIM);

    if (compressor_store_stop_compaction == FALSE && !VM_SWAP_BUSY() &&
        (force_defrag || force_reclaim || VM_SWAP_SHOULD_DEFRAGMENT() || VM_SWAP_SHOULD_RECLAIM())) {
        if (!vm_swapfile_gc_thread_running || force_defrag || force_reclaim) {
            lck_mtx_lock(&vm_swap_data_lock);

            if (force_defrag) {
                vm_swap_force_defrag = TRUE;
            }
            if (force_reclaim) {
                vm_swap_force_reclaim = TRUE;
            }
            if (!vm_swapfile_gc_thread_running) {
                thread_wakeup((event_t) &vm_swapfile_gc_needed);
            }
            lck_mtx_unlock(&vm_swap_data_lock);
        }
    }
}
int vm_swap_defragment_yielded = 0;
int vm_swap_defragment_swapin = 0;
int vm_swap_defragment_free = 0;
int vm_swap_defragment_busy = 0;
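
/*
 * vm_swap_defragment() walks the c_swappedout_sparse queue: segments whose
 * compressed data is entirely gone are freed outright, while sparsely-used
 * segments are swapped back in so compaction can repack them and the space
 * they occupied on disk can eventually be reclaimed.  The counters above
 * record how often each outcome (yield, swapin, free, busy wait) occurs.
 */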
static void
vm_swap_defragment(void)
{
    c_segment_t c_seg;

    /*
     * have to grab the master lock w/o holding
     * any locks in spin mode
     */
    PAGE_REPLACEMENT_DISALLOWED(TRUE);

    lck_mtx_lock_spin_always(c_list_lock);

    while (!queue_empty(&c_swappedout_sparse_list_head)) {
        if (compressor_store_stop_compaction == TRUE || VM_SWAP_BUSY()) {
            vm_swap_defragment_yielded++;
            break;
        }
        c_seg = (c_segment_t)queue_first(&c_swappedout_sparse_list_head);

        lck_mtx_lock_spin_always(&c_seg->c_lock);

        assert(c_seg->c_state == C_ON_SWAPPEDOUTSPARSE_Q);

        if (c_seg->c_busy) {
            lck_mtx_unlock_always(c_list_lock);

            PAGE_REPLACEMENT_DISALLOWED(FALSE);
            /*
             * c_seg_wait_on_busy consumes c_seg->c_lock
             */
            c_seg_wait_on_busy(c_seg);

            PAGE_REPLACEMENT_DISALLOWED(TRUE);

            lck_mtx_lock_spin_always(c_list_lock);

            vm_swap_defragment_busy++;
            continue;
        }
        if (c_seg->c_bytes_used == 0) {
            /*
             * c_seg_free_locked consumes the c_list_lock
             * and c_seg->c_lock
             */
            C_SEG_BUSY(c_seg);
            c_seg_free_locked(c_seg);

            vm_swap_defragment_free++;
        } else {
            lck_mtx_unlock_always(c_list_lock);

            if (c_seg_swapin(c_seg, TRUE, FALSE) == 0) {
                lck_mtx_unlock_always(&c_seg->c_lock);
            }
            vm_swap_defragment_swapin++;
        }
        PAGE_REPLACEMENT_DISALLOWED(FALSE);

        vm_pageout_io_throttle();

        /*
         * because write waiters have privilege over readers,
         * dropping and immediately retaking the master lock will
         * still allow any thread waiting to acquire the
         * master lock exclusively an opportunity to take it
         */
        PAGE_REPLACEMENT_DISALLOWED(TRUE);

        lck_mtx_lock_spin_always(c_list_lock);
    }
    lck_mtx_unlock_always(c_list_lock);

    PAGE_REPLACEMENT_DISALLOWED(FALSE);
}
static void
vm_swapfile_create_thread(void)
{
    clock_sec_t sec;
    clock_nsec_t nsec;

    current_thread()->options |= TH_OPT_VMPRIV;

    vm_swapfile_create_thread_awakened++;
    vm_swapfile_create_thread_running = 1;

    while (TRUE) {
        /*
         * walk through the list of swap files
         * and do the delayed frees/trims for
         * any swap file whose count of delayed
         * frees is above the batch limit
         */
        vm_swap_handle_delayed_trims(FALSE);

        lck_mtx_lock(&vm_swap_data_lock);

        if (hibernate_in_progress_with_pinned_swap == TRUE) {
            break;
        }
        if (compressor_store_stop_compaction == TRUE) {
            break;
        }
        clock_get_system_nanotime(&sec, &nsec);

        if (VM_SWAP_SHOULD_CREATE(sec) == 0) {
            break;
        }
        lck_mtx_unlock(&vm_swap_data_lock);

        if (vm_swap_create_file() == FALSE) {
            vm_swapfile_last_failed_to_create_ts = sec;
            HIBLOG("vm_swap_create_file failed @ %lu secs\n", (unsigned long)sec);
        } else {
            vm_swapfile_last_successful_create_ts = sec;
        }
    }
    vm_swapfile_create_thread_running = 0;

    if (hibernate_in_progress_with_pinned_swap == TRUE) {
        thread_wakeup((event_t)&hibernate_in_progress_with_pinned_swap);
    }
    if (compressor_store_stop_compaction == TRUE) {
        thread_wakeup((event_t)&compressor_store_stop_compaction);
    }
    assert_wait((event_t)&vm_swapfile_create_needed, THREAD_UNINT);

    lck_mtx_unlock(&vm_swap_data_lock);

    thread_block((thread_continue_t)vm_swapfile_create_thread);
}
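
/*
 * hibernate_pin_swap() is called around hibernation: with start == TRUE it
 * waits for the create/gc threads to go idle, verifies that every existing
 * swapfile is pinned, and then creates pinned swapfiles while pin space
 * remains; with start == FALSE it simply clears
 * hibernate_in_progress_with_pinned_swap again.
 */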
kern_return_t
hibernate_pin_swap(boolean_t start)
{
    vm_compaction_swapper_do_init();

    if (start == FALSE) {
        lck_mtx_lock(&vm_swap_data_lock);
        hibernate_in_progress_with_pinned_swap = FALSE;
        lck_mtx_unlock(&vm_swap_data_lock);

        return KERN_SUCCESS;
    }
    if (vm_swappin_enabled == FALSE) {
        return KERN_SUCCESS;
    }

    lck_mtx_lock(&vm_swap_data_lock);

    hibernate_in_progress_with_pinned_swap = TRUE;

    while (vm_swapfile_create_thread_running || vm_swapfile_gc_thread_running) {
        assert_wait((event_t)&hibernate_in_progress_with_pinned_swap, THREAD_UNINT);

        lck_mtx_unlock(&vm_swap_data_lock);

        thread_block(THREAD_CONTINUE_NULL);

        lck_mtx_lock(&vm_swap_data_lock);
    }
    if (vm_num_swap_files > vm_num_pinned_swap_files) {
        hibernate_in_progress_with_pinned_swap = FALSE;
        lck_mtx_unlock(&vm_swap_data_lock);

        HIBLOG("hibernate_pin_swap failed - vm_num_swap_files = %d, vm_num_pinned_swap_files = %d\n",
            vm_num_swap_files, vm_num_pinned_swap_files);
        return KERN_FAILURE;
    }
    lck_mtx_unlock(&vm_swap_data_lock);

    while (VM_SWAP_SHOULD_PIN(MAX_SWAP_FILE_SIZE)) {
        if (vm_swap_create_file() == FALSE) {
            break;
        }
    }
    return KERN_SUCCESS;
}
static void
vm_swapfile_gc_thread(void)
{
    boolean_t need_defragment;
    boolean_t need_reclaim;

    vm_swapfile_gc_thread_awakened++;
    vm_swapfile_gc_thread_running = 1;

    while (TRUE) {
        lck_mtx_lock(&vm_swap_data_lock);

        if (hibernate_in_progress_with_pinned_swap == TRUE) {
            break;
        }
        if (VM_SWAP_BUSY() || compressor_store_stop_compaction == TRUE) {
            break;
        }
        need_defragment = FALSE;
        need_reclaim = FALSE;

        if (VM_SWAP_SHOULD_DEFRAGMENT()) {
            need_defragment = TRUE;
        }
        if (VM_SWAP_SHOULD_RECLAIM()) {
            need_defragment = TRUE;
            need_reclaim = TRUE;
        }
        if (need_defragment == FALSE && need_reclaim == FALSE) {
            break;
        }
        vm_swap_force_defrag = FALSE;
        vm_swap_force_reclaim = FALSE;

        lck_mtx_unlock(&vm_swap_data_lock);

        if (need_defragment == TRUE) {
            vm_swap_defragment();
        }
        if (need_reclaim == TRUE) {
            vm_swap_reclaim();
        }
    }
    vm_swapfile_gc_thread_running = 0;

    if (hibernate_in_progress_with_pinned_swap == TRUE) {
        thread_wakeup((event_t)&hibernate_in_progress_with_pinned_swap);
    }
    if (compressor_store_stop_compaction == TRUE) {
        thread_wakeup((event_t)&compressor_store_stop_compaction);
    }
    assert_wait((event_t)&vm_swapfile_gc_needed, THREAD_UNINT);

    lck_mtx_unlock(&vm_swap_data_lock);

    thread_block((thread_continue_t)vm_swapfile_gc_thread);
}
#define VM_SWAPOUT_LIMIT_T2P    4
#define VM_SWAPOUT_LIMIT_T1P    4
#define VM_SWAPOUT_LIMIT_T0P    6
#define VM_SWAPOUT_LIMIT_T0     8
#define VM_SWAPOUT_LIMIT_MAX    8

#define VM_SWAPOUT_START        0
#define VM_SWAPOUT_T2_PASSIVE   1
#define VM_SWAPOUT_T1_PASSIVE   2
#define VM_SWAPOUT_T0_PASSIVE   3
#define VM_SWAPOUT_T0           4

int vm_swapout_state = VM_SWAPOUT_START;
int vm_swapout_limit = 1;

int vm_swapper_entered_T0 = 0;
int vm_swapper_entered_T0P = 0;
int vm_swapper_entered_T1P = 0;
int vm_swapper_entered_T2P = 0;
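
/*
 * vm_swapout_thread_throttle_adjust() is a small state machine that moves
 * the swapout thread between I/O throttle tiers: it starts at TIER2
 * (passive), unthrottles to TIER0 when the compressor is backed up, drops
 * to TIER1 while aging/hibernate flushing is in progress, and only turns
 * passive I/O off (plain TIER0) when the swapper needs to catch up.  Each
 * state also selects how many swapout I/Os may be in flight
 * (vm_swapout_limit).
 */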
static void
vm_swapout_thread_throttle_adjust(void)
{
    switch (vm_swapout_state) {
    case VM_SWAPOUT_START:

        vm_swapper_throttle = THROTTLE_LEVEL_COMPRESSOR_TIER2;
        vm_swapper_entered_T2P++;

        proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
            TASK_POLICY_INTERNAL, TASK_POLICY_IO, vm_swapper_throttle);
        proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
            TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
        vm_swapout_limit = VM_SWAPOUT_LIMIT_T2P;
        vm_swapout_state = VM_SWAPOUT_T2_PASSIVE;

        break;

    case VM_SWAPOUT_T2_PASSIVE:

        if (SWAPPER_NEEDS_TO_UNTHROTTLE()) {
            vm_swapper_throttle = THROTTLE_LEVEL_COMPRESSOR_TIER0;
            vm_swapper_entered_T0P++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_IO, vm_swapper_throttle);
            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T0P;
            vm_swapout_state = VM_SWAPOUT_T0_PASSIVE;

            break;
        }
        if (swapout_target_age || hibernate_flushing == TRUE) {
            vm_swapper_throttle = THROTTLE_LEVEL_COMPRESSOR_TIER1;
            vm_swapper_entered_T1P++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_IO, vm_swapper_throttle);
            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T1P;
            vm_swapout_state = VM_SWAPOUT_T1_PASSIVE;
        }
        break;

    case VM_SWAPOUT_T1_PASSIVE:

        if (SWAPPER_NEEDS_TO_UNTHROTTLE()) {
            vm_swapper_throttle = THROTTLE_LEVEL_COMPRESSOR_TIER0;
            vm_swapper_entered_T0P++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_IO, vm_swapper_throttle);
            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T0P;
            vm_swapout_state = VM_SWAPOUT_T0_PASSIVE;

            break;
        }
        if (swapout_target_age == 0 && hibernate_flushing == FALSE) {
            vm_swapper_throttle = THROTTLE_LEVEL_COMPRESSOR_TIER2;
            vm_swapper_entered_T2P++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_IO, vm_swapper_throttle);
            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T2P;
            vm_swapout_state = VM_SWAPOUT_T2_PASSIVE;
        }
        break;

    case VM_SWAPOUT_T0_PASSIVE:

        if (SWAPPER_NEEDS_TO_RETHROTTLE()) {
            vm_swapper_throttle = THROTTLE_LEVEL_COMPRESSOR_TIER2;
            vm_swapper_entered_T2P++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_IO, vm_swapper_throttle);
            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T2P;
            vm_swapout_state = VM_SWAPOUT_T2_PASSIVE;

            break;
        }
        if (SWAPPER_NEEDS_TO_CATCHUP()) {
            vm_swapper_entered_T0++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_DISABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T0;
            vm_swapout_state = VM_SWAPOUT_T0;
        }
        break;

    case VM_SWAPOUT_T0:

        if (SWAPPER_HAS_CAUGHTUP()) {
            vm_swapper_entered_T0P++;

            proc_set_thread_policy_with_tid(kernel_task, vm_swapout_thread_id,
                TASK_POLICY_INTERNAL, TASK_POLICY_PASSIVE_IO, TASK_POLICY_ENABLE);
            vm_swapout_limit = VM_SWAPOUT_LIMIT_T0P;
            vm_swapout_state = VM_SWAPOUT_T0_PASSIVE;
        }
        break;
    }
}
int vm_swapout_found_empty = 0;

struct swapout_io_completion vm_swapout_ctx[VM_SWAPOUT_LIMIT_MAX];

int vm_swapout_soc_busy = 0;
int vm_swapout_soc_done = 0;
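
/*
 * Swapouts are issued asynchronously: each in-flight write borrows one
 * swapout_io_completion slot from vm_swapout_ctx[].  vm_swapout_iodone()
 * marks the slot done from the I/O completion path, and the swapout thread
 * later calls vm_swapout_complete_soc() to finish the put and recycle the
 * slot.  At most VM_SWAPOUT_LIMIT_MAX I/Os can be outstanding at once.
 */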
static struct swapout_io_completion *
vm_swapout_find_free_soc(void)
{
    int i;

    for (i = 0; i < VM_SWAPOUT_LIMIT_MAX; i++) {
        if (vm_swapout_ctx[i].swp_io_busy == 0) {
            return &vm_swapout_ctx[i];
        }
    }
    assert(vm_swapout_soc_busy == VM_SWAPOUT_LIMIT_MAX);

    return NULL;
}
static struct swapout_io_completion *
vm_swapout_find_done_soc(void)
{
    int i;

    if (vm_swapout_soc_done) {
        for (i = 0; i < VM_SWAPOUT_LIMIT_MAX; i++) {
            if (vm_swapout_ctx[i].swp_io_done) {
                return &vm_swapout_ctx[i];
            }
        }
    }
    return NULL;
}
static void
vm_swapout_complete_soc(struct swapout_io_completion *soc)
{
    kern_return_t kr;

    if (soc->swp_io_error) {
        kr = KERN_FAILURE;
    } else {
        kr = KERN_SUCCESS;
    }
    lck_mtx_unlock_always(c_list_lock);

    vm_swap_put_finish(soc->swp_swf, &soc->swp_f_offset, soc->swp_io_error);
    vm_swapout_finish(soc->swp_c_seg, soc->swp_f_offset, soc->swp_c_size, kr);

    lck_mtx_lock_spin_always(c_list_lock);

    soc->swp_io_done = 0;
    soc->swp_io_busy = 0;

    vm_swapout_soc_busy--;
    vm_swapout_soc_done--;
}
static void
vm_swapout_thread(void)
{
    uint32_t size = 0;
    c_segment_t c_seg = NULL;
    kern_return_t kr = KERN_SUCCESS;
    struct swapout_io_completion *soc;

    current_thread()->options |= TH_OPT_VMPRIV;

    vm_swapout_thread_awakened++;

    lck_mtx_lock_spin_always(c_list_lock);

    while (!queue_empty(&c_swapout_list_head) && vm_swapout_soc_busy < vm_swapout_limit) {
        c_seg = (c_segment_t)queue_first(&c_swapout_list_head);

        lck_mtx_lock_spin_always(&c_seg->c_lock);

        assert(c_seg->c_state == C_ON_SWAPOUT_Q);

        if (c_seg->c_busy) {
            lck_mtx_unlock_always(c_list_lock);

            c_seg_wait_on_busy(c_seg);

            lck_mtx_lock_spin_always(c_list_lock);

            continue;
        }
        vm_swapout_thread_processed_segments++;

        size = round_page_32(C_SEG_OFFSET_TO_BYTES(c_seg->c_populated_offset));

        if (size == 0) {
            assert(c_seg->c_bytes_used == 0);

            if (!c_seg->c_on_minorcompact_q) {
                c_seg_need_delayed_compaction(c_seg, TRUE);
            }

            c_seg_switch_state(c_seg, C_IS_EMPTY, FALSE);
            lck_mtx_unlock_always(&c_seg->c_lock);
            lck_mtx_unlock_always(c_list_lock);

            vm_swapout_found_empty++;
            goto c_seg_is_empty;
        }
        C_SEG_BUSY(c_seg);
        c_seg->c_busy_swapping = 1;

        c_seg_switch_state(c_seg, C_ON_SWAPIO_Q, FALSE);

        lck_mtx_unlock_always(c_list_lock);
        lck_mtx_unlock_always(&c_seg->c_lock);

#if CHECKSUM_THE_SWAP
        c_seg->cseg_hash = hash_string((char *)c_seg->c_store.c_buffer, (int)size);
        c_seg->cseg_swap_size = size;
#endif /* CHECKSUM_THE_SWAP */

#if ENCRYPTED_SWAP
        vm_swap_encrypt(c_seg);
#endif /* ENCRYPTED_SWAP */

        soc = vm_swapout_find_free_soc();
        assert(soc);

        soc->swp_upl_ctx.io_context = (void *)soc;
        soc->swp_upl_ctx.io_done = (void *)vm_swapout_iodone;
        soc->swp_upl_ctx.io_error = 0;

        kr = vm_swap_put((vm_offset_t)c_seg->c_store.c_buffer, &soc->swp_f_offset, size, c_seg, soc);

        if (kr != KERN_SUCCESS) {
            if (soc->swp_io_done) {
                lck_mtx_lock_spin_always(c_list_lock);

                soc->swp_io_done = 0;
                vm_swapout_soc_done--;

                lck_mtx_unlock_always(c_list_lock);
            }
            vm_swapout_finish(c_seg, soc->swp_f_offset, size, kr);
        } else {
            soc->swp_io_busy = 1;
            vm_swapout_soc_busy++;
        }
c_seg_is_empty:
        if (c_swapout_count == 0) {
            vm_swap_consider_defragmenting(VM_SWAP_FLAGS_NONE);
        }

        lck_mtx_lock_spin_always(c_list_lock);

        if ((soc = vm_swapout_find_done_soc())) {
            vm_swapout_complete_soc(soc);
        }
        lck_mtx_unlock_always(c_list_lock);

        vm_swapout_thread_throttle_adjust();
        vm_pageout_io_throttle();

        lck_mtx_lock_spin_always(c_list_lock);
    }
    if ((soc = vm_swapout_find_done_soc())) {
        vm_swapout_complete_soc(soc);
    }
    assert_wait((event_t)&c_swapout_list_head, THREAD_UNINT);

    lck_mtx_unlock_always(c_list_lock);

    thread_block((thread_continue_t)vm_swapout_thread);
}
void
vm_swapout_iodone(void *io_context, int error)
{
    struct swapout_io_completion *soc;

    soc = (struct swapout_io_completion *)io_context;

    lck_mtx_lock_spin_always(c_list_lock);

    soc->swp_io_done = 1;
    soc->swp_io_error = error;
    vm_swapout_soc_done++;

    thread_wakeup((event_t)&c_swapout_list_head);

    lck_mtx_unlock_always(c_list_lock);
}
static void
vm_swapout_finish(c_segment_t c_seg, uint64_t f_offset, uint32_t size, kern_return_t kr)
{
    PAGE_REPLACEMENT_DISALLOWED(TRUE);

    if (kr == KERN_SUCCESS) {
        kernel_memory_depopulate(compressor_map, (vm_offset_t)c_seg->c_store.c_buffer, size, KMA_COMPRESSOR);
    }
#if ENCRYPTED_SWAP
    else {
        vm_swap_decrypt(c_seg);
    }
#endif /* ENCRYPTED_SWAP */
    lck_mtx_lock_spin_always(c_list_lock);
    lck_mtx_lock_spin_always(&c_seg->c_lock);

    if (kr == KERN_SUCCESS) {
        int new_state = C_ON_SWAPPEDOUT_Q;
        boolean_t insert_head = FALSE;

        if (hibernate_flushing == TRUE) {
            if (c_seg->c_generation_id >= first_c_segment_to_warm_generation_id &&
                c_seg->c_generation_id <= last_c_segment_to_warm_generation_id) {
                insert_head = TRUE;
            }
        } else if (C_SEG_ONDISK_IS_SPARSE(c_seg)) {
            new_state = C_ON_SWAPPEDOUTSPARSE_Q;
        }
        c_seg_switch_state(c_seg, new_state, insert_head);

        c_seg->c_store.c_swap_handle = f_offset;

        VM_STAT_INCR_BY(swapouts, size >> PAGE_SHIFT);

        if (c_seg->c_bytes_used) {
            OSAddAtomic64(-c_seg->c_bytes_used, &compressor_bytes_used);
        }
    } else {
        if (c_seg->c_overage_swap == TRUE) {
            c_seg->c_overage_swap = FALSE;
            c_overage_swapped_count--;
        }
        c_seg_switch_state(c_seg, C_ON_AGE_Q, FALSE);

        if (!c_seg->c_on_minorcompact_q && C_SEG_UNUSED_BYTES(c_seg) >= PAGE_SIZE) {
            c_seg_need_delayed_compaction(c_seg, TRUE);
        }
    }
    assert(c_seg->c_busy_swapping);
    assert(c_seg->c_busy);

    c_seg->c_busy_swapping = 0;
    lck_mtx_unlock_always(c_list_lock);

    C_SEG_WAKEUP_DONE(c_seg);
    lck_mtx_unlock_always(&c_seg->c_lock);

    PAGE_REPLACEMENT_DISALLOWED(FALSE);
}
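
/*
 * vm_swap_create_file() either recycles a swapfile structure left in the
 * SWAP_REUSE state or allocates a new one, then tries to preallocate the
 * backing file starting at MAX_SWAP_FILE_SIZE and halving the request until
 * it fits (or drops below MIN_SWAP_FILE_SIZE).  On success it sizes the
 * per-segment allocation bitmap and c_segment back-pointer array and
 * publishes the file as SWAP_READY.
 */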
boolean_t
vm_swap_create_file()
{
    uint64_t size = 0;
    int namelen = 0;
    boolean_t swap_file_created = FALSE;
    boolean_t swap_file_reuse = FALSE;
    boolean_t swap_file_pin = FALSE;
    struct swapfile *swf = NULL;

    /*
     * make sure we've got all the info we need
     * to potentially pin a swap file... we could
     * be swapping out due to hibernation w/o ever
     * having run vm_pageout_scan, which is normally
     * the trigger to do the init
     */
    vm_compaction_swapper_do_init();

    /*
     * Any swapfile structure ready for re-use?
     */
    lck_mtx_lock(&vm_swap_data_lock);

    swf = (struct swapfile *) queue_first(&swf_global_queue);

    while (queue_end(&swf_global_queue, (queue_entry_t)swf) == FALSE) {
        if (swf->swp_flags == SWAP_REUSE) {
            swap_file_reuse = TRUE;
            break;
        }
        swf = (struct swapfile *) queue_next(&swf->swp_queue);
    }
    lck_mtx_unlock(&vm_swap_data_lock);

    if (swap_file_reuse == FALSE) {
        namelen = (int)strlen(swapfilename) + SWAPFILENAME_INDEX_LEN + 1;

        swf = (struct swapfile *) kalloc(sizeof *swf);
        memset(swf, 0, sizeof(*swf));

        swf->swp_index = vm_num_swap_files + 1;
        swf->swp_pathlen = namelen;
        swf->swp_path = (char *)kalloc(swf->swp_pathlen);

        memset(swf->swp_path, 0, namelen);

        snprintf(swf->swp_path, namelen, "%s%d", swapfilename, vm_num_swap_files);
    }
    vm_swapfile_open(swf->swp_path, &swf->swp_vp);

    if (swf->swp_vp == NULL) {
        if (swap_file_reuse == FALSE) {
            kfree(swf->swp_path, swf->swp_pathlen);
            kfree(swf, sizeof *swf);
        }
        return FALSE;
    }
    vm_swapfile_can_be_created = TRUE;

    size = MAX_SWAP_FILE_SIZE;

    while (size >= MIN_SWAP_FILE_SIZE) {
        swap_file_pin = VM_SWAP_SHOULD_PIN(size);

        if (vm_swapfile_preallocate(swf->swp_vp, &size, &swap_file_pin) == 0) {
            int num_bytes_for_bitmap = 0;

            swap_file_created = TRUE;

            swf->swp_size = size;
            swf->swp_nsegs = (unsigned int) (size / COMPRESSED_SWAP_CHUNK_SIZE);
            swf->swp_nseginuse = 0;
            swf->swp_free_hint = 0;

            num_bytes_for_bitmap = MAX((swf->swp_nsegs >> 3), 1);
            /*
             * Allocate a bitmap that describes the
             * number of segments held by this swapfile.
             */
            swf->swp_bitmap = (uint8_t *)kalloc(num_bytes_for_bitmap);
            memset(swf->swp_bitmap, 0, num_bytes_for_bitmap);

            swf->swp_csegs = (c_segment_t *) kalloc(swf->swp_nsegs * sizeof(c_segment_t));
            memset(swf->swp_csegs, 0, (swf->swp_nsegs * sizeof(c_segment_t)));

            /*
             * passing a NULL trim_list into vnode_trim_list
             * will return ENOTSUP if trim isn't supported
             */
            if (vnode_trim_list(swf->swp_vp, NULL, FALSE) == 0) {
                swp_trim_supported = TRUE;
            }

            lck_mtx_lock(&vm_swap_data_lock);

            swf->swp_flags = SWAP_READY;

            if (swap_file_reuse == FALSE) {
                queue_enter(&swf_global_queue, swf, struct swapfile *, swp_queue);
            }
            vm_num_swap_files++;

            vm_swapfile_total_segs_alloced += swf->swp_nsegs;

            if (swap_file_pin == TRUE) {
                vm_num_pinned_swap_files++;
                swf->swp_flags |= SWAP_PINNED;
                vm_swappin_avail -= swf->swp_size;
            }
            lck_mtx_unlock(&vm_swap_data_lock);

            thread_wakeup((event_t) &vm_num_swap_files);

            if (vm_num_swap_files == 1) {
                c_overage_swapped_limit = (uint32_t)size / C_SEG_BUFSIZE;

                if (VM_CONFIG_FREEZER_SWAP_IS_ACTIVE) {
                    c_overage_swapped_limit /= 2;
                }
            }
            break;
        } else {
            size = size / 2;
        }
    }
    if (swap_file_created == FALSE) {
        vm_swapfile_close((uint64_t)(swf->swp_path), swf->swp_vp);

        swf->swp_vp = NULL;

        if (swap_file_reuse == FALSE) {
            kfree(swf->swp_path, swf->swp_pathlen);
            kfree(swf, sizeof *swf);
        }
    }
    return swap_file_created;
}
kern_return_t
vm_swap_get(c_segment_t c_seg, uint64_t f_offset, uint64_t size)
{
    struct swapfile *swf = NULL;
    uint64_t file_offset = 0;
    int retval = 0;

    assert(c_seg->c_store.c_buffer);

    lck_mtx_lock(&vm_swap_data_lock);

    swf = vm_swapfile_for_handle(f_offset);

    if (swf == NULL || (!(swf->swp_flags & SWAP_READY) && !(swf->swp_flags & SWAP_RECLAIM))) {
        vm_swap_get_failures++;
        retval = 1;
        goto done;
    }
    swf->swp_io_count++;

    lck_mtx_unlock(&vm_swap_data_lock);

#if DEVELOPMENT || DEBUG
    C_SEG_MAKE_WRITEABLE(c_seg);
#endif
    file_offset = (f_offset & SWAP_SLOT_MASK);
    retval = vm_swapfile_io(swf->swp_vp, file_offset, (uint64_t)c_seg->c_store.c_buffer, (int)(size / PAGE_SIZE_64), SWAP_READ, NULL);

#if DEVELOPMENT || DEBUG
    C_SEG_WRITE_PROTECT(c_seg);
#endif
    if (retval == 0) {
        VM_STAT_INCR_BY(swapins, size >> PAGE_SHIFT);
    } else {
        vm_swap_get_failures++;
    }

    /*
     * Free this slot in the swap structure.
     */
    vm_swap_free(f_offset);

    lck_mtx_lock(&vm_swap_data_lock);
    swf->swp_io_count--;

    if ((swf->swp_flags & SWAP_WANTED) && swf->swp_io_count == 0) {
        swf->swp_flags &= ~SWAP_WANTED;
        thread_wakeup((event_t) &swf->swp_flags);
    }
done:
    lck_mtx_unlock(&vm_swap_data_lock);

    if (retval == 0) {
        return KERN_SUCCESS;
    } else {
        return KERN_FAILURE;
    }
}
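
/*
 * vm_swap_put() finds a free segment-sized chunk by scanning the allocation
 * bitmap of each SWAP_READY swapfile starting at its swp_free_hint, marks
 * the chunk in use, and returns the packed handle through *f_offset.  When
 * a swapout_io_completion is supplied the write is issued asynchronously;
 * otherwise (as in vm_swap_reclaim) the call is synchronous and any error
 * is resolved through vm_swap_put_finish().
 */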
kern_return_t
vm_swap_put(vm_offset_t addr, uint64_t *f_offset, uint32_t size, c_segment_t c_seg, struct swapout_io_completion *soc)
{
    unsigned int segidx = 0;
    struct swapfile *swf = NULL;
    uint64_t file_offset = 0;
    uint64_t swapfile_index = 0;
    unsigned int byte_for_segidx = 0;
    unsigned int offset_within_byte = 0;
    boolean_t swf_eligible = FALSE;
    boolean_t waiting = FALSE;
    boolean_t retried = FALSE;
    int error = 0;
    clock_sec_t sec;
    clock_nsec_t nsec;
    void *upl_ctx = NULL;

    if (addr == 0 || f_offset == NULL) {
        return KERN_FAILURE;
    }
retry:
    lck_mtx_lock(&vm_swap_data_lock);

    swf = (struct swapfile *) queue_first(&swf_global_queue);

    while (queue_end(&swf_global_queue, (queue_entry_t)swf) == FALSE) {
        segidx = swf->swp_free_hint;

        swf_eligible = (swf->swp_flags & SWAP_READY) && (swf->swp_nseginuse < swf->swp_nsegs);

        if (swf_eligible) {
            while (segidx < swf->swp_nsegs) {
                byte_for_segidx = segidx >> 3;
                offset_within_byte = segidx % 8;

                if ((swf->swp_bitmap)[byte_for_segidx] & (1 << offset_within_byte)) {
                    segidx++;
                    continue;
                }
                (swf->swp_bitmap)[byte_for_segidx] |= (1 << offset_within_byte);

                file_offset = segidx * COMPRESSED_SWAP_CHUNK_SIZE;
                swf->swp_nseginuse++;
                swf->swp_io_count++;
                swf->swp_csegs[segidx] = c_seg;

                swapfile_index = swf->swp_index;
                vm_swapfile_total_segs_used++;

                clock_get_system_nanotime(&sec, &nsec);

                if (VM_SWAP_SHOULD_CREATE(sec) && !vm_swapfile_create_thread_running) {
                    thread_wakeup((event_t) &vm_swapfile_create_needed);
                }
                lck_mtx_unlock(&vm_swap_data_lock);

                goto issue_io;
            }
        }
        swf = (struct swapfile *) queue_next(&swf->swp_queue);
    }
    assert(queue_end(&swf_global_queue, (queue_entry_t) swf));

    /*
     * we've run out of swap segments, but may not
     * be in a position to immediately create a new swap
     * file if we've recently failed to create due to a lack
     * of free space in the root filesystem... we'll try
     * to kick that create off, but in any event we're going
     * to take a breather (up to 1 second) so that we're not caught in a tight
     * loop back in "vm_compressor_compact_and_swap" trying to stuff
     * segments into swap files only to have them immediately put back
     * on the c_age queue due to vm_swap_put failing.
     *
     * if we're doing these puts due to a hibernation flush,
     * no need to block... setting hibernate_no_swapspace to TRUE,
     * will cause "vm_compressor_compact_and_swap" to immediately abort
     */
    clock_get_system_nanotime(&sec, &nsec);

    if (VM_SWAP_SHOULD_CREATE(sec) && !vm_swapfile_create_thread_running) {
        thread_wakeup((event_t) &vm_swapfile_create_needed);
    }
    if (hibernate_flushing == FALSE || VM_SWAP_SHOULD_CREATE(sec)) {
        waiting = TRUE;
        assert_wait_timeout((event_t) &vm_num_swap_files, THREAD_INTERRUPTIBLE, 1000, 1000 * NSEC_PER_USEC);
    } else {
        hibernate_no_swapspace = TRUE;
    }
    lck_mtx_unlock(&vm_swap_data_lock);

    if (waiting == TRUE) {
        thread_block(THREAD_CONTINUE_NULL);

        if (retried == FALSE && hibernate_flushing == TRUE) {
            retried = TRUE;
            goto retry;
        }
    }
    vm_swap_put_failures_no_swap_file++;

    return KERN_FAILURE;

issue_io:
    assert(c_seg->c_busy_swapping);
    assert(c_seg->c_busy);
    assert(!c_seg->c_on_minorcompact_q);

    *f_offset = (swapfile_index << SWAP_DEVICE_SHIFT) | file_offset;

    if (soc) {
        soc->swp_c_seg = c_seg;
        soc->swp_c_size = size;

        soc->swp_swf = swf;

        soc->swp_io_error = 0;
        soc->swp_io_done = 0;

        upl_ctx = (void *)&soc->swp_upl_ctx;
    }
    error = vm_swapfile_io(swf->swp_vp, file_offset, addr, (int) (size / PAGE_SIZE_64), SWAP_WRITE, upl_ctx);

    if (error || upl_ctx == NULL) {
        return vm_swap_put_finish(swf, f_offset, error);
    }
    return KERN_SUCCESS;
}
kern_return_t
vm_swap_put_finish(struct swapfile *swf, uint64_t *f_offset, int error)
{
    lck_mtx_lock(&vm_swap_data_lock);

    swf->swp_io_count--;

    if ((swf->swp_flags & SWAP_WANTED) && swf->swp_io_count == 0) {
        swf->swp_flags &= ~SWAP_WANTED;
        thread_wakeup((event_t) &swf->swp_flags);
    }
    lck_mtx_unlock(&vm_swap_data_lock);

    if (error) {
        vm_swap_free(*f_offset);
        vm_swap_put_failures++;

        return KERN_FAILURE;
    }
    return KERN_SUCCESS;
}
static void
vm_swap_free_now(struct swapfile *swf, uint64_t f_offset)
{
    uint64_t file_offset = 0;
    unsigned int segidx = 0;

    if ((swf->swp_flags & SWAP_READY) || (swf->swp_flags & SWAP_RECLAIM)) {
        unsigned int byte_for_segidx = 0;
        unsigned int offset_within_byte = 0;

        file_offset = (f_offset & SWAP_SLOT_MASK);
        segidx = (unsigned int) (file_offset / COMPRESSED_SWAP_CHUNK_SIZE);

        byte_for_segidx = segidx >> 3;
        offset_within_byte = segidx % 8;

        if ((swf->swp_bitmap)[byte_for_segidx] & (1 << offset_within_byte)) {
            (swf->swp_bitmap)[byte_for_segidx] &= ~(1 << offset_within_byte);

            swf->swp_csegs[segidx] = NULL;

            swf->swp_nseginuse--;
            vm_swapfile_total_segs_used--;

            if (segidx < swf->swp_free_hint) {
                swf->swp_free_hint = segidx;
            }
        }
        if (VM_SWAP_SHOULD_RECLAIM() && !vm_swapfile_gc_thread_running) {
            thread_wakeup((event_t) &vm_swapfile_gc_needed);
        }
    }
}
uint32_t vm_swap_free_now_count = 0;
uint32_t vm_swap_free_delayed_count = 0;
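
/*
 * vm_swap_free() releases the chunk backing a swap handle.  If the device
 * supports TRIM the free is batched onto the swapfile's delayed trim list
 * so the space can be trimmed in bulk later (see
 * vm_swap_handle_delayed_trims); otherwise, or while the file is being
 * reclaimed, the bitmap is cleared immediately via vm_swap_free_now().
 */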
void
vm_swap_free(uint64_t f_offset)
{
    struct swapfile *swf = NULL;
    struct trim_list *tl = NULL;
    clock_sec_t sec;
    clock_nsec_t nsec;

    if (swp_trim_supported == TRUE) {
        tl = kalloc(sizeof(struct trim_list));
    }

    lck_mtx_lock(&vm_swap_data_lock);

    swf = vm_swapfile_for_handle(f_offset);

    if (swf && (swf->swp_flags & (SWAP_READY | SWAP_RECLAIM))) {
        if (swp_trim_supported == FALSE || (swf->swp_flags & SWAP_RECLAIM)) {
            /*
             * don't delay the free if the underlying disk doesn't support
             * trim, or we're in the midst of reclaiming this swap file since
             * we don't want to move segments that are technically free
             * but not yet handled by the delayed free mechanism
             */
            vm_swap_free_now(swf, f_offset);

            vm_swap_free_now_count++;
        } else {
            tl->tl_offset = f_offset & SWAP_SLOT_MASK;
            tl->tl_length = COMPRESSED_SWAP_CHUNK_SIZE;

            tl->tl_next = swf->swp_delayed_trim_list_head;
            swf->swp_delayed_trim_list_head = tl;
            swf->swp_delayed_trim_count++;
            tl = NULL;

            if (VM_SWAP_SHOULD_TRIM(swf) && !vm_swapfile_create_thread_running) {
                clock_get_system_nanotime(&sec, &nsec);

                if (sec > dont_trim_until_ts) {
                    thread_wakeup((event_t) &vm_swapfile_create_needed);
                }
            }
            vm_swap_free_delayed_count++;
        }
    }
    lck_mtx_unlock(&vm_swap_data_lock);

    if (tl != NULL) {
        kfree(tl, sizeof(struct trim_list));
    }
}
static void
vm_swap_wait_on_trim_handling_in_progress()
{
    while (delayed_trim_handling_in_progress == TRUE) {
        assert_wait((event_t) &delayed_trim_handling_in_progress, THREAD_UNINT);
        lck_mtx_unlock(&vm_swap_data_lock);

        thread_block(THREAD_CONTINUE_NULL);

        lck_mtx_lock(&vm_swap_data_lock);
    }
}
static void
vm_swap_handle_delayed_trims(boolean_t force_now)
{
    struct swapfile *swf = NULL;

    /*
     * serialize the race between us and vm_swap_reclaim...
     * if vm_swap_reclaim wins it will turn off SWAP_READY
     * on the victim it has chosen... we can just skip over
     * that file since vm_swap_reclaim will first process
     * all of the delayed trims associated with it
     */
    lck_mtx_lock(&vm_swap_data_lock);

    delayed_trim_handling_in_progress = TRUE;

    lck_mtx_unlock(&vm_swap_data_lock);

    /*
     * no need to hold the lock to walk the swf list since
     * vm_swap_create (the only place where we add to this list)
     * is run on the same thread as this function
     * and vm_swap_reclaim doesn't remove items from this list
     * instead marking them with SWAP_REUSE for future re-use
     */
    swf = (struct swapfile *) queue_first(&swf_global_queue);

    while (queue_end(&swf_global_queue, (queue_entry_t)swf) == FALSE) {
        if ((swf->swp_flags & SWAP_READY) && (force_now == TRUE || VM_SWAP_SHOULD_TRIM(swf))) {
            assert(!(swf->swp_flags & SWAP_RECLAIM));
            vm_swap_do_delayed_trim(swf);
        }
        swf = (struct swapfile *) queue_next(&swf->swp_queue);
    }
    lck_mtx_lock(&vm_swap_data_lock);

    delayed_trim_handling_in_progress = FALSE;
    thread_wakeup((event_t) &delayed_trim_handling_in_progress);

    if (VM_SWAP_SHOULD_RECLAIM() && !vm_swapfile_gc_thread_running) {
        thread_wakeup((event_t) &vm_swapfile_gc_needed);
    }
    lck_mtx_unlock(&vm_swap_data_lock);
}
static void
vm_swap_do_delayed_trim(struct swapfile *swf)
{
    struct trim_list *tl, *tl_head;

    lck_mtx_lock(&vm_swap_data_lock);

    tl_head = swf->swp_delayed_trim_list_head;
    swf->swp_delayed_trim_list_head = NULL;
    swf->swp_delayed_trim_count = 0;

    lck_mtx_unlock(&vm_swap_data_lock);

    vnode_trim_list(swf->swp_vp, tl_head, TRUE);

    while ((tl = tl_head) != NULL) {
        unsigned int segidx = 0;
        unsigned int byte_for_segidx = 0;
        unsigned int offset_within_byte = 0;

        lck_mtx_lock(&vm_swap_data_lock);

        segidx = (unsigned int) (tl->tl_offset / COMPRESSED_SWAP_CHUNK_SIZE);

        byte_for_segidx = segidx >> 3;
        offset_within_byte = segidx % 8;

        if ((swf->swp_bitmap)[byte_for_segidx] & (1 << offset_within_byte)) {
            (swf->swp_bitmap)[byte_for_segidx] &= ~(1 << offset_within_byte);

            swf->swp_csegs[segidx] = NULL;

            swf->swp_nseginuse--;
            vm_swapfile_total_segs_used--;

            if (segidx < swf->swp_free_hint) {
                swf->swp_free_hint = segidx;
            }
        }
        lck_mtx_unlock(&vm_swap_data_lock);

        tl_head = tl->tl_next;

        kfree(tl, sizeof(struct trim_list));
    }
}
int vm_swap_reclaim_yielded = 0;

void
vm_swap_reclaim(void)
{
    vm_offset_t addr = 0;
    unsigned int segidx = 0;
    uint64_t f_offset = 0;
    struct swapfile *swf = NULL;
    struct swapfile *smallest_swf = NULL;
    unsigned int min_nsegs = 0;
    unsigned int byte_for_segidx = 0;
    unsigned int offset_within_byte = 0;
    uint32_t c_size = 0;

    c_segment_t c_seg = NULL;

    if (kernel_memory_allocate(compressor_map, (vm_offset_t *)(&addr), C_SEG_BUFSIZE, 0, KMA_KOBJECT, VM_KERN_MEMORY_COMPRESSOR) != KERN_SUCCESS) {
        panic("vm_swap_reclaim: kernel_memory_allocate failed\n");
    }

    lck_mtx_lock(&vm_swap_data_lock);

    /*
     * if we're running the swapfile list looking for
     * candidates with delayed trims, we need to
     * wait before making our decision concerning
     * the swapfile we want to reclaim
     */
    vm_swap_wait_on_trim_handling_in_progress();

    /*
     * from here until we knock down the SWAP_READY bit,
     * we need to remain behind the vm_swap_data_lock...
     * once that bit has been turned off, "vm_swap_handle_delayed_trims"
     * will not consider this swapfile for processing
     */
    swf = (struct swapfile *) queue_first(&swf_global_queue);
    min_nsegs = MAX_SWAP_FILE_SIZE / COMPRESSED_SWAP_CHUNK_SIZE;
    smallest_swf = NULL;

    while (queue_end(&swf_global_queue, (queue_entry_t)swf) == FALSE) {
        if ((swf->swp_flags & SWAP_READY) && (swf->swp_nseginuse <= min_nsegs)) {
            smallest_swf = swf;
            min_nsegs = swf->swp_nseginuse;
        }
        swf = (struct swapfile *) queue_next(&swf->swp_queue);
    }
    if (smallest_swf == NULL) {
        goto done;
    }
    swf = smallest_swf;

    swf->swp_flags &= ~SWAP_READY;
    swf->swp_flags |= SWAP_RECLAIM;

    if (swf->swp_delayed_trim_count) {
        lck_mtx_unlock(&vm_swap_data_lock);

        vm_swap_do_delayed_trim(swf);

        lck_mtx_lock(&vm_swap_data_lock);
    }
    segidx = 0;

    while (segidx < swf->swp_nsegs) {
ReTry_for_cseg:
        /*
         * Wait for outgoing I/Os.
         */
        while (swf->swp_io_count) {
            swf->swp_flags |= SWAP_WANTED;

            assert_wait((event_t) &swf->swp_flags, THREAD_UNINT);
            lck_mtx_unlock(&vm_swap_data_lock);

            thread_block(THREAD_CONTINUE_NULL);

            lck_mtx_lock(&vm_swap_data_lock);
        }
        if (compressor_store_stop_compaction == TRUE || VM_SWAP_SHOULD_ABORT_RECLAIM() || VM_SWAP_BUSY()) {
            vm_swap_reclaim_yielded++;
            break;
        }
        byte_for_segidx = segidx >> 3;
        offset_within_byte = segidx % 8;

        if (((swf->swp_bitmap)[byte_for_segidx] & (1 << offset_within_byte)) == 0) {
            segidx++;
            continue;
        }
        c_seg = swf->swp_csegs[segidx];
        assert(c_seg);

        lck_mtx_lock_spin_always(&c_seg->c_lock);

        if (c_seg->c_busy) {
            /*
             * a swapped out c_segment in the process of being freed will remain in the
             * busy state until after the vm_swap_free is called on it... vm_swap_free
             * takes the vm_swap_data_lock, so can't change the swap state until after
             * we drop the vm_swap_data_lock... once we do, vm_swap_free will complete
             * which will allow c_seg_free_locked to clear busy and wake up this thread...
             * at that point, we re-look up the swap state which will now indicate that
             * this c_segment no longer exists.
             */
            c_seg->c_wanted = 1;

            assert_wait((event_t) (c_seg), THREAD_UNINT);
            lck_mtx_unlock_always(&c_seg->c_lock);

            lck_mtx_unlock(&vm_swap_data_lock);

            thread_block(THREAD_CONTINUE_NULL);

            lck_mtx_lock(&vm_swap_data_lock);

            goto ReTry_for_cseg;
        }
        (swf->swp_bitmap)[byte_for_segidx] &= ~(1 << offset_within_byte);

        f_offset = segidx * COMPRESSED_SWAP_CHUNK_SIZE;

        assert(c_seg == swf->swp_csegs[segidx]);
        swf->swp_csegs[segidx] = NULL;
        swf->swp_nseginuse--;

        vm_swapfile_total_segs_used--;

        lck_mtx_unlock(&vm_swap_data_lock);

        assert(C_SEG_IS_ONDISK(c_seg));

        C_SEG_BUSY(c_seg);
        c_seg->c_busy_swapping = 1;
#if !CHECKSUM_THE_SWAP
        c_seg_trim_tail(c_seg);
#endif
        c_size = round_page_32(C_SEG_OFFSET_TO_BYTES(c_seg->c_populated_offset));

        assert(c_size <= C_SEG_BUFSIZE && c_size);

        lck_mtx_unlock_always(&c_seg->c_lock);

        if (vm_swapfile_io(swf->swp_vp, f_offset, addr, (int)(c_size / PAGE_SIZE_64), SWAP_READ, NULL)) {
            /*
             * reading the data back in failed, so convert c_seg
             * to a swapped in c_segment that contains no data
             */
            c_seg_swapin_requeue(c_seg, FALSE, TRUE, FALSE);
            /*
             * returns with c_busy_swapping cleared
             */
            vm_swap_get_failures++;
            goto swap_io_failed;
        }
        VM_STAT_INCR_BY(swapins, c_size >> PAGE_SHIFT);

        if (vm_swap_put(addr, &f_offset, c_size, c_seg, NULL)) {
            vm_offset_t c_buffer;

            /*
             * the put failed, so convert c_seg to a fully swapped in c_segment
             */
            c_buffer = (vm_offset_t)C_SEG_BUFFER_ADDRESS(c_seg->c_mysegno);

            kernel_memory_populate(compressor_map, c_buffer, c_size, KMA_COMPRESSOR, VM_KERN_MEMORY_COMPRESSOR);

            memcpy((char *)c_buffer, (char *)addr, c_size);

            c_seg->c_store.c_buffer = (int32_t *)c_buffer;
#if ENCRYPTED_SWAP
            vm_swap_decrypt(c_seg);
#endif /* ENCRYPTED_SWAP */
            c_seg_swapin_requeue(c_seg, TRUE, TRUE, FALSE);
            /*
             * returns with c_busy_swapping cleared
             */
            OSAddAtomic64(c_seg->c_bytes_used, &compressor_bytes_used);

            goto swap_io_failed;
        }
        VM_STAT_INCR_BY(swapouts, c_size >> PAGE_SHIFT);

        lck_mtx_lock_spin_always(&c_seg->c_lock);

        assert(C_SEG_IS_ONDISK(c_seg));
        /*
         * The c_seg will now know about the new location on disk.
         */
        c_seg->c_store.c_swap_handle = f_offset;

        assert(c_seg->c_busy_swapping);
        c_seg->c_busy_swapping = 0;
swap_io_failed:
        assert(c_seg->c_busy);
        C_SEG_WAKEUP_DONE(c_seg);

        lck_mtx_unlock_always(&c_seg->c_lock);
        lck_mtx_lock(&vm_swap_data_lock);
    }

    if (swf->swp_nseginuse) {
        swf->swp_flags &= ~SWAP_RECLAIM;
        swf->swp_flags |= SWAP_READY;

        goto done;
    }
    /*
     * We don't remove this inactive swf from the queue.
     * That way, we can re-use it when needed again and
     * preserve the namespace. The delayed_trim processing
     * is also dependent on us not removing swfs from the queue.
     */
    //queue_remove(&swf_global_queue, swf, struct swapfile*, swp_queue);

    vm_swapfile_total_segs_alloced -= swf->swp_nsegs;

    lck_mtx_unlock(&vm_swap_data_lock);

    vm_swapfile_close((uint64_t)(swf->swp_path), swf->swp_vp);

    kfree(swf->swp_csegs, swf->swp_nsegs * sizeof(c_segment_t));
    kfree(swf->swp_bitmap, MAX((swf->swp_nsegs >> 3), 1));

    lck_mtx_lock(&vm_swap_data_lock);

    if (swf->swp_flags & SWAP_PINNED) {
        vm_num_pinned_swap_files--;
        vm_swappin_avail += swf->swp_size;
    }

    swf->swp_vp = NULL;
    swf->swp_free_hint = 0;

    swf->swp_flags = SWAP_REUSE;

    vm_num_swap_files--;

done:
    thread_wakeup((event_t) &swf->swp_flags);
    lck_mtx_unlock(&vm_swap_data_lock);

    kmem_free(compressor_map, (vm_offset_t) addr, C_SEG_BUFSIZE);
}
uint64_t
vm_swap_get_total_space(void)
{
    uint64_t total_space = 0;

    total_space = (uint64_t)vm_swapfile_total_segs_alloced * COMPRESSED_SWAP_CHUNK_SIZE;

    return total_space;
}

uint64_t
vm_swap_get_used_space(void)
{
    uint64_t used_space = 0;

    used_space = (uint64_t)vm_swapfile_total_segs_used * COMPRESSED_SWAP_CHUNK_SIZE;

    return used_space;
}

uint64_t
vm_swap_get_free_space(void)
{
    return vm_swap_get_total_space() - vm_swap_get_used_space();
}
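
/*
 * vm_swap_low_on_space() reports swap pressure when fewer than 1/8 of
 * VM_SWAPFILE_HIWATER_SEGS segments remain free and the most recent attempt
 * to create a swapfile failed more recently than one succeeded.
 */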
int
vm_swap_low_on_space(void)
{
    if (vm_num_swap_files == 0 && vm_swapfile_can_be_created == FALSE) {
        return 0;
    }
    if (((vm_swapfile_total_segs_alloced - vm_swapfile_total_segs_used) < ((unsigned int)VM_SWAPFILE_HIWATER_SEGS) / 8)) {
        if (vm_num_swap_files == 0 && !SWAPPER_NEEDS_TO_UNTHROTTLE()) {
            return 0;
        }
        if (vm_swapfile_last_failed_to_create_ts >= vm_swapfile_last_successful_create_ts) {
            return 1;
        }
    }
    return 0;
}
boolean_t
vm_swap_files_pinned(void)
{
    boolean_t result;

    if (vm_swappin_enabled == FALSE) {
        return TRUE;
    }
    result = (vm_num_pinned_swap_files == vm_num_swap_files);

    return result;
}
#if CONFIG_FREEZE
boolean_t
vm_swap_max_budget(uint64_t *freeze_daily_budget)
{
    boolean_t use_device_value = FALSE;
    struct swapfile *swf = NULL;

    if (vm_num_swap_files) {
        lck_mtx_lock(&vm_swap_data_lock);

        swf = (struct swapfile *) queue_first(&swf_global_queue);

        while (queue_end(&swf_global_queue, (queue_entry_t)swf) == FALSE) {
            if (swf->swp_flags == SWAP_READY) {
                assert(swf->swp_vp);

                if (vm_swap_vol_get_budget(swf->swp_vp, freeze_daily_budget) == 0) {
                    use_device_value = TRUE;
                }
                break;
            }
            swf = (struct swapfile *) queue_next(&swf->swp_queue);
        }
        lck_mtx_unlock(&vm_swap_data_lock);
    } else {
        /*
         * This block is used for the initial budget value before any swap files
         * are created. We create a temp swap file to get the budget.
         */
        struct vnode *temp_vp = NULL;

        vm_swapfile_open(swapfilename, &temp_vp);

        if (temp_vp) {
            if (vm_swap_vol_get_budget(temp_vp, freeze_daily_budget) == 0) {
                use_device_value = TRUE;
            }
            vm_swapfile_close((uint64_t)&swapfilename, temp_vp);
        } else {
            *freeze_daily_budget = 0;
        }
    }
    return use_device_value;
}
#endif /* CONFIG_FREEZE */