]> git.saurik.com Git - apple/xnu.git/blame - bsd/vm/vnode_pager.c
xnu-1699.22.81.tar.gz
[apple/xnu.git] / bsd / vm / vnode_pager.c
CommitLineData
/*
 * Copyright (c) 2000-2006 Apple Computer, Inc. All rights reserved.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
 *
 * This file contains Original Code and/or Modifications of Original Code
 * as defined in and that are subject to the Apple Public Source License
 * Version 2.0 (the 'License'). You may not use this file except in
 * compliance with the License. The rights granted to you under the License
 * may not be used to create, or enable the creation or redistribution of,
 * unlawful or unlicensed copies of an Apple operating system, or to
 * circumvent, violate, or enable the circumvention or violation of, any
 * terms of an Apple operating system software license agreement.
 *
 * Please obtain a copy of the License at
 * http://www.opensource.apple.com/apsl/ and read it before using this file.
 *
 * The Original Code and all software distributed under the License are
 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
 * Please see the License for the specific language governing rights and
 * limitations under the License.
 *
 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
 */
/*
 * Mach Operating System
 * Copyright (c) 1987 Carnegie-Mellon University
 * All rights reserved. The CMU software License Agreement specifies
 * the terms and conditions for use and redistribution.
 */
/*
 * File: vnode_pager.c
 *
 * "Swap" pager that pages to/from vnodes. Also
 * handles demand paging from files.
 *
 */
41
42#include <mach/boolean.h>
43#include <sys/param.h>
44#include <sys/systm.h>
91447636 45#include <sys/user.h>
1c79356b 46#include <sys/proc.h>
91447636 47#include <sys/kauth.h>
1c79356b
A
48#include <sys/buf.h>
49#include <sys/uio.h>
91447636 50#include <sys/vnode_internal.h>
1c79356b 51#include <sys/namei.h>
91447636
A
52#include <sys/mount_internal.h> /* needs internal due to fhandle_t */
53#include <sys/ubc_internal.h>
1c79356b 54#include <sys/lock.h>
6d2010ae 55#include <sys/disk.h> /* For DKIOC calls */
1c79356b
A
56
57#include <mach/mach_types.h>
58#include <mach/memory_object_types.h>
b0d623f7
A
59#include <mach/memory_object_control.h>
60#include <mach/vm_map.h>
61#include <mach/mach_vm.h>
62#include <mach/upl.h>
2d21ac55 63#include <mach/sdt.h>
1c79356b
A
64
65#include <vm/vm_map.h>
66#include <vm/vm_kern.h>
1c79356b
A
67#include <kern/zalloc.h>
68#include <kern/kalloc.h>
69#include <libkern/libkern.h>
70
71#include <vm/vnode_pager.h>
72#include <vm/vm_pageout.h>
73
74#include <kern/assert.h>
9bccf70c 75#include <sys/kdebug.h>
91447636
A
76#include <machine/spl.h>
77
78#include <nfs/rpcv2.h>
79#include <nfs/nfsproto.h>
80#include <nfs/nfs.h>
81
82#include <vm/vm_protos.h>
1c79356b 83
b0d623f7 84
6d2010ae
A
85void
86vnode_pager_throttle()
87{
88 struct uthread *ut;
89
90 ut = get_bsdthread_info(current_thread());
91
92 if (ut->uu_lowpri_window)
93 throttle_lowpri_io(TRUE);
94}
95
96
97boolean_t
98vnode_pager_isSSD(vnode_t vp)
99{
100 if (vp->v_mount->mnt_kern_flag & MNTK_SSD)
101 return (TRUE);
102 return (FALSE);
103}
104
105
b0d623f7
A
106uint32_t
107vnode_pager_isinuse(struct vnode *vp)
108{
109 if (vp->v_usecount > vp->v_kusecount)
110 return (1);
111 return (0);
112}
113
/*
 * vnode_pager_return_hard_throttle_limit:
 *	Forwards its arguments unchanged to cluster_hard_throttle_limit()
 *	and returns that function's result.
 */
uint32_t
vnode_pager_return_hard_throttle_limit(struct vnode *vp, uint32_t *limit, uint32_t hard_throttle)
{
	uint32_t	throttled;

	throttled = cluster_hard_throttle_limit(vp, limit, hard_throttle);

	return throttled;
}
1c79356b 119
0b4e3aa0
A
120vm_object_offset_t
121vnode_pager_get_filesize(struct vnode *vp)
122{
0b4e3aa0
A
123
124 return (vm_object_offset_t) ubc_getsize(vp);
0b4e3aa0
A
125}
126
0c530ab8
A
127kern_return_t
128vnode_pager_get_pathname(
129 struct vnode *vp,
130 char *pathname,
131 vm_size_t *length_p)
132{
133 int error, len;
134
135 len = (int) *length_p;
136 error = vn_getpath(vp, pathname, &len);
137 if (error != 0) {
138 return KERN_FAILURE;
139 }
140 *length_p = (vm_size_t) len;
141 return KERN_SUCCESS;
142}
143
144kern_return_t
145vnode_pager_get_filename(
146 struct vnode *vp,
2d21ac55 147 const char **filename)
0c530ab8
A
148{
149 *filename = vp->v_name;
150 return KERN_SUCCESS;
151}
152
2d21ac55
A
153kern_return_t
154vnode_pager_get_cs_blobs(
155 struct vnode *vp,
156 void **blobs)
157{
158 *blobs = ubc_get_cs_blobs(vp);
159 return KERN_SUCCESS;
160}
161
6d2010ae
A
162/*
163 * vnode_trim:
164 * Used to call the DKIOCUNMAP ioctl on the underlying disk device for the specified vnode.
165 * Trims the region at offset bytes into the file, for length bytes.
166 *
167 * Care must be taken to ensure that the vnode is sufficiently reference counted at the time this
168 * function is called; no iocounts or usecounts are taken on the vnode.
169 * This function is non-idempotent in error cases; We cannot un-discard the blocks if only some of them
170 * are successfully discarded.
171 */
172u_int32_t vnode_trim (
173 struct vnode *vp,
174 off_t offset,
175 size_t length)
176{
177 daddr64_t io_blockno; /* Block number corresponding to the start of the extent */
178 size_t io_bytecount; /* Number of bytes in current extent for the specified range */
179 size_t trimmed = 0;
180 off_t current_offset = offset;
181 size_t remaining_length = length;
182 int error = 0;
183 u_int32_t blocksize = 0;
184 struct vnode *devvp;
185 dk_extent_t extent;
186 dk_unmap_t unmap;
187
188
189 /* Get the underlying device vnode */
190 devvp = vp->v_mount->mnt_devvp;
191
192 /* Figure out the underlying device block size */
193 error = VNOP_IOCTL(devvp, DKIOCGETBLOCKSIZE, (caddr_t)&blocksize, 0, vfs_context_kernel());
194 if (error) {
195 goto trim_exit;
196 }
197
198 /*
199 * We may not get the entire range from offset -> offset+length in a single
200 * extent from the blockmap call. Keep looping/going until we are sure we've hit
201 * the whole range or if we encounter an error.
202 */
203 while (trimmed < length) {
204 /*
205 * VNOP_BLOCKMAP will tell us the logical to physical block number mapping for the
206 * specified offset. It returns blocks in contiguous chunks, so if the logical range is
207 * broken into multiple extents, it must be called multiple times, increasing the offset
208 * in each call to ensure that the entire range is covered.
209 */
210 error = VNOP_BLOCKMAP (vp, current_offset, remaining_length,
211 &io_blockno, &io_bytecount, NULL, VNODE_READ, NULL);
212
213 if (error) {
214 goto trim_exit;
215 }
216 /*
217 * We have a contiguous run. Prepare & issue the ioctl for the device.
218 * the DKIOCUNMAP ioctl takes offset in bytes from the start of the device.
219 */
220 memset (&extent, 0, sizeof(dk_extent_t));
221 memset (&unmap, 0, sizeof(dk_unmap_t));
222 extent.offset = (uint64_t) io_blockno * (u_int64_t) blocksize;
223 extent.length = io_bytecount;
224 unmap.extents = &extent;
225 unmap.extentsCount = 1;
226 error = VNOP_IOCTL(devvp, DKIOCUNMAP, (caddr_t)&unmap, 0, vfs_context_kernel());
227
228 if (error) {
229 goto trim_exit;
230 }
231 remaining_length = remaining_length - io_bytecount;
232 trimmed = trimmed + io_bytecount;
233 current_offset = current_offset + io_bytecount;
234 }
235trim_exit:
236
237 return error;
238
239}
240
1c79356b
A
241pager_return_t
242vnode_pageout(struct vnode *vp,
243 upl_t upl,
b0d623f7 244 upl_offset_t upl_offset,
1c79356b 245 vm_object_offset_t f_offset,
b0d623f7 246 upl_size_t size,
1c79356b
A
247 int flags,
248 int *errorp)
249{
91447636 250 int result = PAGER_SUCCESS;
1c79356b 251 int error = 0;
91447636
A
252 int error_ret = 0;
253 daddr64_t blkno;
254 int isize;
1c79356b 255 int pg_index;
91447636 256 int base_index;
b0d623f7 257 upl_offset_t offset;
1c79356b 258 upl_page_info_t *pl;
2d21ac55 259 vfs_context_t ctx = vfs_context_current(); /* pager context */
1c79356b 260
1c79356b
A
261 isize = (int)size;
262
9bccf70c 263 if (isize <= 0) {
91447636
A
264 result = PAGER_ERROR;
265 error_ret = EINVAL;
9bccf70c
A
266 goto out;
267 }
1c79356b 268
2d21ac55 269 if (UBCINFOEXISTS(vp) == 0) {
91447636
A
270 result = PAGER_ERROR;
271 error_ret = EINVAL;
9bccf70c 272
fa4905b1 273 if (upl && !(flags & UPL_NOCOMMIT))
9bccf70c 274 ubc_upl_abort_range(upl, upl_offset, size, UPL_ABORT_FREE_ON_EMPTY);
1c79356b
A
275 goto out;
276 }
91447636 277 if ( !(flags & UPL_VNODE_PAGER)) {
1c79356b 278 /*
91447636
A
279 * This is a pageout from the default pager,
280 * just go ahead and call vnop_pageout since
281 * it has already sorted out the dirty ranges
1c79356b 282 */
9bccf70c
A
283 KERNEL_DEBUG_CONSTANT((MACHDBG_CODE(DBG_MACH_VM, 1)) | DBG_FUNC_START,
284 size, 1, 0, 0, 0);
285
91447636 286 if ( (error_ret = VNOP_PAGEOUT(vp, upl, upl_offset, (off_t)f_offset,
2d21ac55 287 (size_t)size, flags, ctx)) )
91447636 288 result = PAGER_ERROR;
9bccf70c
A
289
290 KERNEL_DEBUG_CONSTANT((MACHDBG_CODE(DBG_MACH_VM, 1)) | DBG_FUNC_END,
291 size, 1, 0, 0, 0);
292
1c79356b
A
293 goto out;
294 }
b0d623f7
A
295 if (upl == NULL) {
296 int request_flags;
297
298 if (vp->v_mount->mnt_vtable->vfc_vfsflags & VFC_VFSVNOP_PAGEOUTV2) {
299 /*
300 * filesystem has requested the new form of VNOP_PAGEOUT for file
301 * backed objects... we will not grab the UPL befofe calling VNOP_PAGEOUT...
302 * it is the fileystem's responsibility to grab the range we're denoting
303 * via 'f_offset' and 'size' into a UPL... this allows the filesystem to first
304 * take any locks it needs, before effectively locking the pages into a UPL...
305 */
306 KERNEL_DEBUG_CONSTANT((MACHDBG_CODE(DBG_MACH_VM, 1)) | DBG_FUNC_START,
307 size, (int)f_offset, 0, 0, 0);
308
309 if ( (error_ret = VNOP_PAGEOUT(vp, NULL, upl_offset, (off_t)f_offset,
310 size, flags, ctx)) ) {
311 result = PAGER_ERROR;
312 }
313 KERNEL_DEBUG_CONSTANT((MACHDBG_CODE(DBG_MACH_VM, 1)) | DBG_FUNC_END,
314 size, 0, 0, 0, 0);
315
316 goto out;
317 }
318 if (flags & UPL_MSYNC)
319 request_flags = UPL_UBC_MSYNC | UPL_RET_ONLY_DIRTY;
320 else
321 request_flags = UPL_UBC_PAGEOUT | UPL_RET_ONLY_DIRTY;
322
6d2010ae 323 if (ubc_create_upl(vp, f_offset, size, &upl, &pl, request_flags) != KERN_SUCCESS) {
b0d623f7
A
324 result = PAGER_ERROR;
325 error_ret = EINVAL;
326 goto out;
327 }
328 upl_offset = 0;
329 } else
330 pl = ubc_upl_pageinfo(upl);
331
9bccf70c 332 /*
91447636
A
333 * we come here for pageouts to 'real' files and
334 * for msyncs... the upl may not contain any
335 * dirty pages.. it's our responsibility to sort
336 * through it and find the 'runs' of dirty pages
337 * to call VNOP_PAGEOUT on...
9bccf70c 338 */
fa4905b1 339 if (ubc_getsize(vp) == 0) {
91447636
A
340 /*
341 * if the file has been effectively deleted, then
342 * we need to go through the UPL and invalidate any
343 * buffer headers we might have that reference any
344 * of it's pages
345 */
346 for (offset = upl_offset; isize; isize -= PAGE_SIZE, offset += PAGE_SIZE) {
347#if NFSCLIENT
348 if (vp->v_tag == VT_NFS)
349 /* check with nfs if page is OK to drop */
350 error = nfs_buf_page_inval(vp, (off_t)f_offset);
351 else
352#endif
353 {
354 blkno = ubc_offtoblk(vp, (off_t)f_offset);
355 error = buf_invalblkno(vp, blkno, 0);
356 }
357 if (error) {
358 if ( !(flags & UPL_NOCOMMIT))
359 ubc_upl_abort_range(upl, offset, PAGE_SIZE, UPL_ABORT_FREE_ON_EMPTY);
360 if (error_ret == 0)
361 error_ret = error;
362 result = PAGER_ERROR;
363
364 } else if ( !(flags & UPL_NOCOMMIT)) {
365 ubc_upl_commit_range(upl, offset, PAGE_SIZE, UPL_COMMIT_FREE_ON_EMPTY);
fa4905b1 366 }
91447636 367 f_offset += PAGE_SIZE;
1c79356b 368 }
1c79356b
A
369 goto out;
370 }
91447636
A
371 /*
372 * Ignore any non-present pages at the end of the
373 * UPL so that we aren't looking at a upl that
374 * may already have been freed by the preceeding
375 * aborts/completions.
376 */
377 base_index = upl_offset / PAGE_SIZE;
378
379 for (pg_index = (upl_offset + isize) / PAGE_SIZE; pg_index > base_index;) {
380 if (upl_page_present(pl, --pg_index))
381 break;
382 if (pg_index == base_index) {
383 /*
384 * no pages were returned, so release
385 * our hold on the upl and leave
386 */
387 if ( !(flags & UPL_NOCOMMIT))
388 ubc_upl_abort_range(upl, upl_offset, isize, UPL_ABORT_FREE_ON_EMPTY);
389
390 goto out;
391 }
392 }
2d21ac55 393 isize = ((pg_index + 1) - base_index) * PAGE_SIZE;
91447636
A
394
395 offset = upl_offset;
396 pg_index = base_index;
1c79356b
A
397
398 while (isize) {
399 int xsize;
400 int num_of_pages;
401
91447636
A
402 if ( !upl_page_present(pl, pg_index)) {
403 /*
404 * we asked for RET_ONLY_DIRTY, so it's possible
405 * to get back empty slots in the UPL
406 * just skip over them
407 */
2d21ac55
A
408 f_offset += PAGE_SIZE;
409 offset += PAGE_SIZE;
410 isize -= PAGE_SIZE;
1c79356b
A
411 pg_index++;
412
413 continue;
414 }
415 if ( !upl_dirty_page(pl, pg_index)) {
416 /*
417 * if the page is not dirty and reached here it is
418 * marked precious or it is due to invalidation in
419 * memory_object_lock request as part of truncation
420 * We also get here from vm_object_terminate()
421 * So all you need to do in these
422 * cases is to invalidate incore buffer if it is there
91447636 423 * Note we must not sleep here if the buffer is busy - that is
fa4905b1 424 * a lock inversion which causes deadlock.
1c79356b 425 */
91447636
A
426#if NFSCLIENT
427 if (vp->v_tag == VT_NFS)
55e303ae 428 /* check with nfs if page is OK to drop */
2d21ac55 429 error = nfs_buf_page_inval(vp, (off_t)f_offset);
91447636
A
430 else
431#endif
432 {
2d21ac55 433 blkno = ubc_offtoblk(vp, (off_t)f_offset);
91447636
A
434 error = buf_invalblkno(vp, blkno, 0);
435 }
436 if (error) {
437 if ( !(flags & UPL_NOCOMMIT))
438 ubc_upl_abort_range(upl, offset, PAGE_SIZE, UPL_ABORT_FREE_ON_EMPTY);
439 if (error_ret == 0)
440 error_ret = error;
441 result = PAGER_ERROR;
442
443 } else if ( !(flags & UPL_NOCOMMIT)) {
444 ubc_upl_commit_range(upl, offset, PAGE_SIZE, UPL_COMMIT_FREE_ON_EMPTY);
445 }
2d21ac55
A
446 f_offset += PAGE_SIZE;
447 offset += PAGE_SIZE;
448 isize -= PAGE_SIZE;
1c79356b
A
449 pg_index++;
450
451 continue;
452 }
1c79356b
A
453 num_of_pages = 1;
454 xsize = isize - PAGE_SIZE;
455
456 while (xsize) {
1c79356b
A
457 if ( !upl_dirty_page(pl, pg_index + num_of_pages))
458 break;
459 num_of_pages++;
460 xsize -= PAGE_SIZE;
461 }
462 xsize = num_of_pages * PAGE_SIZE;
463
9bccf70c 464 KERNEL_DEBUG_CONSTANT((MACHDBG_CODE(DBG_MACH_VM, 1)) | DBG_FUNC_START,
2d21ac55 465 xsize, (int)f_offset, 0, 0, 0);
9bccf70c 466
b0d623f7 467 if ( (error = VNOP_PAGEOUT(vp, upl, offset, (off_t)f_offset,
2d21ac55 468 xsize, flags, ctx)) ) {
91447636
A
469 if (error_ret == 0)
470 error_ret = error;
471 result = PAGER_ERROR;
472 }
9bccf70c
A
473 KERNEL_DEBUG_CONSTANT((MACHDBG_CODE(DBG_MACH_VM, 1)) | DBG_FUNC_END,
474 xsize, 0, 0, 0, 0);
475
2d21ac55
A
476 f_offset += xsize;
477 offset += xsize;
478 isize -= xsize;
1c79356b
A
479 pg_index += num_of_pages;
480 }
481out:
482 if (errorp)
91447636 483 *errorp = error_ret;
1c79356b 484
91447636 485 return (result);
1c79356b
A
486}
487
488
489pager_return_t
490vnode_pagein(
491 struct vnode *vp,
9bccf70c 492 upl_t upl,
b0d623f7 493 upl_offset_t upl_offset,
1c79356b 494 vm_object_offset_t f_offset,
b0d623f7 495 upl_size_t size,
1c79356b
A
496 int flags,
497 int *errorp)
498{
91447636 499 struct uthread *ut;
9bccf70c
A
500 upl_page_info_t *pl;
501 int result = PAGER_SUCCESS;
1c79356b 502 int error = 0;
9bccf70c
A
503 int pages_in_upl;
504 int start_pg;
505 int last_pg;
506 int first_pg;
507 int xsize;
2d21ac55 508 int must_commit = 1;
1c79356b 509
2d21ac55
A
510 if (flags & UPL_NOCOMMIT)
511 must_commit = 0;
1c79356b 512
2d21ac55 513 if (UBCINFOEXISTS(vp) == 0) {
1c79356b
A
514 result = PAGER_ERROR;
515 error = PAGER_ERROR;
2d21ac55
A
516
517 if (upl && must_commit)
9bccf70c 518 ubc_upl_abort_range(upl, upl_offset, size, UPL_ABORT_FREE_ON_EMPTY | UPL_ABORT_ERROR);
2d21ac55 519
1c79356b
A
520 goto out;
521 }
9bccf70c 522 if (upl == (upl_t)NULL) {
b0d623f7 523 flags &= ~UPL_NOCOMMIT;
2d21ac55 524
b0d623f7 525 if (size > (MAX_UPL_SIZE * PAGE_SIZE)) {
9bccf70c
A
526 result = PAGER_ERROR;
527 error = PAGER_ERROR;
528 goto out;
529 }
b0d623f7
A
530 if (vp->v_mount->mnt_vtable->vfc_vfsflags & VFC_VFSVNOP_PAGEINV2) {
531 /*
532 * filesystem has requested the new form of VNOP_PAGEIN for file
533 * backed objects... we will not grab the UPL befofe calling VNOP_PAGEIN...
534 * it is the fileystem's responsibility to grab the range we're denoting
535 * via 'f_offset' and 'size' into a UPL... this allows the filesystem to first
536 * take any locks it needs, before effectively locking the pages into a UPL...
537 * so we pass a NULL into the filesystem instead of a UPL pointer... the 'upl_offset'
538 * is used to identify the "must have" page in the extent... the filesystem is free
539 * to clip the extent to better fit the underlying FS blocksize if it desires as
540 * long as it continues to include the "must have" page... 'f_offset' + 'upl_offset'
541 * identifies that page
542 */
543 if ( (error = VNOP_PAGEIN(vp, NULL, upl_offset, (off_t)f_offset,
544 size, flags, vfs_context_current())) ) {
545 result = PAGER_ERROR;
546 error = PAGER_ERROR;
547 }
548 goto out;
549 }
550 ubc_create_upl(vp, f_offset, size, &upl, &pl, UPL_UBC_PAGEIN | UPL_RET_ONLY_ABSENT);
1c79356b 551
9bccf70c
A
552 if (upl == (upl_t)NULL) {
553 result = PAGER_ABSENT;
554 error = PAGER_ABSENT;
555 goto out;
1c79356b 556 }
9bccf70c 557 upl_offset = 0;
2d21ac55
A
558 first_pg = 0;
559
9bccf70c
A
560 /*
561 * if we get here, we've created the upl and
562 * are responsible for commiting/aborting it
563 * regardless of what the caller has passed in
564 */
2d21ac55 565 must_commit = 1;
1c79356b 566 } else {
9bccf70c 567 pl = ubc_upl_pageinfo(upl);
2d21ac55 568 first_pg = upl_offset / PAGE_SIZE;
9bccf70c
A
569 }
570 pages_in_upl = size / PAGE_SIZE;
2d21ac55 571 DTRACE_VM2(pgpgin, int, pages_in_upl, (uint64_t *), NULL);
9bccf70c
A
572
573 /*
574 * before we start marching forward, we must make sure we end on
575 * a present page, otherwise we will be working with a freed
576 * upl
577 */
578 for (last_pg = pages_in_upl - 1; last_pg >= first_pg; last_pg--) {
579 if (upl_page_present(pl, last_pg))
580 break;
2d21ac55
A
581 if (last_pg == first_pg) {
582 /*
583 * empty UPL, no pages are present
584 */
585 if (must_commit)
586 ubc_upl_abort_range(upl, upl_offset, size, UPL_ABORT_FREE_ON_EMPTY);
587 goto out;
588 }
9bccf70c
A
589 }
590 pages_in_upl = last_pg + 1;
2d21ac55 591 last_pg = first_pg;
9bccf70c 592
2d21ac55 593 while (last_pg < pages_in_upl) {
9bccf70c 594 /*
2d21ac55 595 * skip over missing pages...
9bccf70c 596 */
2d21ac55 597 for ( ; last_pg < pages_in_upl; last_pg++) {
9bccf70c
A
598 if (upl_page_present(pl, last_pg))
599 break;
600 }
9bccf70c 601 /*
2d21ac55 602 * skip over 'valid' pages... we don't want to issue I/O for these
9bccf70c
A
603 */
604 for (start_pg = last_pg; last_pg < pages_in_upl; last_pg++) {
2d21ac55 605 if (!upl_valid_page(pl, last_pg))
9bccf70c
A
606 break;
607 }
608 if (last_pg > start_pg) {
609 /*
610 * we've found a range of valid pages
611 * if we've got COMMIT responsibility
612 * commit this range of pages back to the
613 * cache unchanged
614 */
615 xsize = (last_pg - start_pg) * PAGE_SIZE;
1c79356b 616
2d21ac55 617 if (must_commit)
9bccf70c 618 ubc_upl_abort_range(upl, start_pg * PAGE_SIZE, xsize, UPL_ABORT_FREE_ON_EMPTY);
9bccf70c
A
619 }
620 if (last_pg == pages_in_upl)
2d21ac55
A
621 /*
622 * we're done... all pages that were present
623 * have either had I/O issued on them or
624 * were aborted unchanged...
625 */
9bccf70c
A
626 break;
627
2d21ac55 628 if (!upl_page_present(pl, last_pg)) {
9bccf70c 629 /*
2d21ac55
A
630 * we found a range of valid pages
631 * terminated by a missing page...
632 * bump index to the next page and continue on
9bccf70c 633 */
2d21ac55 634 last_pg++;
9bccf70c 635 continue;
2d21ac55 636 }
9bccf70c
A
637 /*
638 * scan from the found invalid page looking for a valid
639 * or non-present page before the end of the upl is reached, if we
640 * find one, then it will be the last page of the request to
641 * 'cluster_io'
642 */
643 for (start_pg = last_pg; last_pg < pages_in_upl; last_pg++) {
644 if (upl_valid_page(pl, last_pg) || !upl_page_present(pl, last_pg))
645 break;
646 }
647 if (last_pg > start_pg) {
648 int xoff;
9bccf70c
A
649 xsize = (last_pg - start_pg) * PAGE_SIZE;
650 xoff = start_pg * PAGE_SIZE;
651
b0d623f7 652 if ( (error = VNOP_PAGEIN(vp, upl, (upl_offset_t) xoff,
9bccf70c 653 (off_t)f_offset + xoff,
2d21ac55 654 xsize, flags, vfs_context_current())) ) {
b0d623f7
A
655 /*
656 * Usually this UPL will be aborted/committed by the lower cluster layer.
6d2010ae
A
657 *
658 * a) In the case of decmpfs, however, we may return an error (EAGAIN) to avoid
659 * a deadlock with another thread already inflating the file.
660 *
661 * b) In the case of content protection, EPERM is a valid error and we should respect it.
662 *
663 * In those cases, we must take care of our UPL at this layer itself.
b0d623f7
A
664 */
665 if (must_commit) {
666 if(error == EAGAIN) {
667 ubc_upl_abort_range(upl, (upl_offset_t) xoff, xsize, UPL_ABORT_FREE_ON_EMPTY | UPL_ABORT_RESTART);
668 }
6d2010ae
A
669#if CONFIG_PROTECT
670 if(error == EPERM) {
671 ubc_upl_abort_range(upl, (upl_offset_t) xoff, xsize, UPL_ABORT_FREE_ON_EMPTY | UPL_ABORT_ERROR);
672 }
673#endif
b0d623f7 674 }
0b4e3aa0
A
675 result = PAGER_ERROR;
676 error = PAGER_ERROR;
9bccf70c 677
0b4e3aa0 678 }
1c79356b 679 }
9bccf70c 680 }
1c79356b
A
681out:
682 if (errorp)
fa4905b1 683 *errorp = result;
1c79356b 684
91447636
A
685 ut = get_bsdthread_info(current_thread());
686
593a1d5f 687 if (ut->uu_lowpri_window) {
91447636
A
688 /*
689 * task is marked as a low priority I/O type
593a1d5f 690 * and the I/O we issued while in this page fault
91447636
A
691 * collided with normal I/O operations... we'll
692 * delay in order to mitigate the impact of this
693 * task on the normal operation of the system
694 */
593a1d5f 695 throttle_lowpri_io(TRUE);
91447636 696 }
1c79356b
A
697 return (error);
698}
699
700void
91447636 701vnode_pager_shutdown(void)
1c79356b
A
702{
703 int i;
91447636 704 vnode_t vp;
1c79356b
A
705
706 for(i = 0; i < MAX_BACKING_STORE; i++) {
91447636 707 vp = (vnode_t)(bs_port_table[i]).vp;
1c79356b
A
708 if (vp) {
709 (bs_port_table[i]).vp = 0;
1c79356b 710
91447636
A
711 /* get rid of macx_swapon() reference */
712 vnode_rele(vp);
1c79356b
A
713 }
714 }
715}
716
0b4e3aa0
A
717
718void *
1c79356b
A
719upl_get_internal_page_list(upl_t upl)
720{
0b4e3aa0 721 return(UPL_GET_INTERNAL_PAGE_LIST(upl));
1c79356b
A
722
723}