]>
git.saurik.com Git - apple/xnu.git/blob - bsd/sys/buf.h
43af7fb1a44dd2e086ed8e42f770e95dd652a749
2 * Copyright (c) 2000-2005 Apple Computer, Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
30 * Copyright (c) 1982, 1986, 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 * (c) UNIX System Laboratories, Inc.
33 * All or some portions of this file are derived from material licensed
34 * to the University of California by American Telephone and Telegraph
35 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
36 * the permission of UNIX System Laboratories, Inc.
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in the
45 * documentation and/or other materials provided with the distribution.
46 * 3. All advertising materials mentioning features or use of this software
47 * must display the following acknowledgement:
48 * This product includes software developed by the University of
49 * California, Berkeley and its contributors.
50 * 4. Neither the name of the University nor the names of its contributors
51 * may be used to endorse or promote products derived from this software
52 * without specific prior written permission.
54 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
55 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
56 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
57 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
58 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
59 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
60 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
61 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
62 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
63 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
66 * @(#)buf.h 8.9 (Berkeley) 3/30/95
72 #include <sys/cdefs.h>
73 #include <sys/kernel_types.h>
74 #include <sys/ucred.h>
75 #include <mach/memory_object_types.h>
78 #define B_WRITE 0x00000000 /* Write buffer (pseudo flag). */
79 #define B_READ 0x00000001 /* Read buffer. */
80 #define B_ASYNC 0x00000002 /* Start I/O, do not wait. */
81 #define B_NOCACHE 0x00000004 /* Do not cache block after use. */
82 #define B_DELWRI 0x00000008 /* Delay I/O until buffer reused. */
83 #define B_LOCKED 0x00000010 /* Locked in core (not reusable). */
84 #define B_PHYS 0x00000020 /* I/O to user memory. */
85 #define B_CLUSTER 0x00000040 /* UPL based I/O generated by cluster layer */
86 #define B_PAGEIO 0x00000080 /* Page in/out */
87 #define B_META 0x00000100 /* buffer contains meta-data. */
88 #define B_RAW 0x00000200 /* Set by physio for raw transfers. */
89 #define B_FUA 0x00000400 /* Write-through disk cache(if supported) */
90 #define B_PASSIVE 0x00000800 /* PASSIVE I/Os are ignored by THROTTLE I/O */
91 #define B_IOSTREAMING 0x00001000 /* sequential access pattern detected */
92 #define B_THROTTLED_IO 0x00002000 /* low priority I/O */
93 #define B_ENCRYPTED_IO 0x00004000 /* Encrypted I/O */
94 #define B_STATICCONTENT 0x00008000 /* Buffer is likely to remain unaltered */
97 * make sure to check when adding flags that
98 * that the new flags don't overlap the definitions
105 @function buf_markaged
106 @abstract Mark a buffer as "aged," i.e. as a good candidate to be discarded and reused after buf_brelse().
107 @param bp Buffer to mark.
109 void buf_markaged(buf_t
);
112 @function buf_markinvalid
113 @abstract Mark a buffer as not having valid data and being ready for immediate reuse after buf_brelse().
114 @param bp Buffer to mark.
116 void buf_markinvalid(buf_t
);
119 @function buf_markdelayed
120 @abstract Mark a buffer as a delayed write: mark it dirty without actually scheduling I/O.
121 @discussion Data will be flushed to disk at some later time, not with brelse(). A sync()/fsync()
122 or pressure necessitating reuse of the buffer will cause it to be written back to disk.
123 @param bp Buffer to mark.
125 void buf_markdelayed(buf_t
);
127 void buf_markclean(buf_t
);
130 @function buf_markeintr
131 @abstract Mark a buffer as having been interrupted during I/O.
132 @discussion Waiters for I/O to complete (buf_biowait()) will return with EINTR when woken up.
133 buf_markeintr does not itself do a wakeup.
134 @param bp Buffer to mark.
136 void buf_markeintr(buf_t
);
139 @function buf_markfua
140 @abstract Mark a buffer for write through disk cache, if disk supports it.
141 @param bp Buffer to mark.
143 void buf_markfua(buf_t
);
147 @abstract Check if a buffer is marked for write through disk caches.
148 @param bp Buffer to test.
149 @return Nonzero if buffer is marked for write-through, 0 if not.
155 @abstract Check if a buffer contains valid data.
156 @param bp Buffer to test.
157 @return Nonzero if buffer has valid data, 0 if not.
159 int buf_valid(buf_t
);
162 @function buf_fromcache
163 @abstract Check if a buffer's data was found in core.
164 @discussion Will return truth after a buf_getblk that finds a valid buffer in the cache or the relevant
165 data in core (but not in a buffer).
166 @param bp Buffer to test.
167 @return Nonzero if we got this buffer's data without doing I/O, 0 if not.
169 int buf_fromcache(buf_t
);
173 @abstract Get the upl (Universal Page List) associated with a buffer.
174 @discussion Buffers allocated with buf_alloc() are not returned with a upl, and
175 traditional buffers only have a upl while an I/O is in progress.
176 @param bp Buffer whose upl to grab.
177 @return Buffer's upl if it has one, else NULL.
179 void * buf_upl(buf_t
);
182 @function buf_uploffset
183 @abstract Get the offset into a UPL at which this buffer begins.
184 @discussion This function should only be called on iobufs, i.e. buffers allocated with buf_alloc().
185 @param bp Buffer whose uploffset to grab.
186 @return Buffer's uploffset--does not check whether that value makes sense for this buffer.
188 uint32_t buf_uploffset(buf_t
);
192 @abstract Get the credential associated with a buffer for reading.
193 @discussion No reference is taken; if the credential is to be held on to persistently, an additional
194 reference must be taken with kauth_cred_ref.
195 @param bp Buffer whose credential to grab.
196 @return Credential if it exists, else NULL.
198 kauth_cred_t
buf_rcred(buf_t
);
202 @abstract Get the credential associated with a buffer for writing.
203 @discussion No reference is taken; if the credential is to be held on to persistently, an additional
204 reference must be taken with kauth_cred_ref.
205 @param bp Buffer whose credential to grab.
206 @return Credential if it exists, else NULL.
208 kauth_cred_t
buf_wcred(buf_t
);
212 @abstract Get the process associated with this buffer.
213 @discussion buf_proc() will generally return NULL; a process is currently only associated with
214 a buffer in the event of a physio() call.
215 @param bp Buffer whose associated process to find.
216 @return Associated process, possibly NULL.
218 proc_t
buf_proc(buf_t
);
221 @function buf_dirtyoff
222 @abstract Get the starting offset of the dirty region associated with a buffer.
223 @discussion The dirty offset is zero unless someone explicitly calls buf_setdirtyoff() (which the kernel does not).
224 @param bp Buffer whose dirty offset to get.
225 @return Dirty offset (0 if not explicitly changed).
227 uint32_t buf_dirtyoff(buf_t
);
230 @function buf_dirtyend
231 @abstract Get the ending offset of the dirty region associated with a buffer.
232 @discussion If the buffer's data was found incore and dirty, the dirty end is the size of the block; otherwise, unless
233 someone outside of xnu explicitly changes it by calling buf_setdirtyend(), it will be zero.
234 @param bp Buffer whose dirty end to get.
235 @return 0 if buffer is found clean; size of buffer if found dirty. Can be set to any value by callers of buf_setdirtyend().
237 uint32_t buf_dirtyend(buf_t
);
240 @function buf_setdirtyoff
241 @abstract Set the starting offset of the dirty region associated with a buffer.
242 @discussion This value is zero unless someone set it explicitly.
243 @param bp Buffer whose dirty end to set.
246 void buf_setdirtyoff(buf_t
, uint32_t);
249 @function buf_setdirtyend
250 @abstract Set the ending offset of the dirty region associated with a buffer.
251 @discussion If the buffer's data was found incore and dirty, the dirty end is the size of the block; otherwise, unless
252 someone outside of xnu explicitly changes it by calling buf_setdirtyend(), it will be zero.
253 @param bp Buffer whose dirty end to set.
256 void buf_setdirtyend(buf_t
, uint32_t);
260 @abstract Get the error value associated with a buffer.
261 @discussion Errors are set with buf_seterror().
262 @param bp Buffer whose error value to retrieve.
263 @return Error value, directly.
265 errno_t
buf_error(buf_t
);
268 @function buf_seterror
269 @abstract Set an error value on a buffer.
270 @param bp Buffer whose error value to set.
273 void buf_seterror(buf_t
, errno_t
);
276 @function buf_setflags
277 @abstract Set flags on a buffer.
278 @discussion: buffer_flags |= flags
279 @param bp Buffer whose flags to set.
280 @param flags Flags to add to buffer's mask. B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA
283 void buf_setflags(buf_t
, int32_t);
286 @function buf_clearflags
287 @abstract Clear flags on a buffer.
288 @discussion: buffer_flags &= ~flags
289 @param bp Buffer whose flags to clear.
290 @param flags Flags to remove from buffer's mask. B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA
293 void buf_clearflags(buf_t
, int32_t);
297 @abstract Get flags set on a buffer.
298 @discussion Valid flags are B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA.
299 @param bp Buffer whose flags to grab.
302 int32_t buf_flags(buf_t
);
306 @abstract Reset I/O flag state on a buffer.
307 @discussion Clears current flags on a buffer (internal and external) and allows some new flags to be set.
308 Used perhaps to prepare an iobuf for reuse.
309 @param bp Buffer whose flags to grab.
310 @param flags Flags to set on buffer: B_READ, B_WRITE, B_ASYNC, B_NOCACHE.
313 void buf_reset(buf_t
, int32_t);
317 @abstract Get virtual mappings for buffer data.
318 @discussion For buffers created through buf_getblk() (i.e. traditional buffer cache usage),
319 buf_map() just returns the address at which data was mapped by but_getblk(). For a B_CLUSTER buffer, i.e. an iobuf
320 whose upl state is managed manually, there are two possibilities. If the buffer was created
321 with an underlying "real" buffer through cluster_bp(), the mapping of the "real" buffer is returned.
322 Otherwise, the buffer was created with buf_alloc() and buf_setupl() was subsequently called; buf_map()
323 will call ubc_upl_map() to get a mapping for the buffer's upl and return the start of that mapping
324 plus the buffer's upl offset (set in buf_setupl()). In the last case, buf_unmap() must later be called
325 to tear down the mapping. NOTE: buf_map() does not set the buffer data pointer; this must be done with buf_setdataptr().
326 @param bp Buffer whose mapping to find or create.
327 @param io_addr Destination for mapping address.
328 @return 0 for success, ENOMEM if unable to map the buffer.
330 errno_t
buf_map(buf_t
, caddr_t
*);
334 @abstract Release mappings for buffer data.
335 @discussion For buffers created through buf_getblk() (i.e. traditional buffer cache usage),
336 buf_unmap() does nothing; buf_brelse() will take care of unmapping. For a B_CLUSTER buffer, i.e. an iobuf
337 whose upl state is managed manually, there are two possibilities. If the buffer was created
338 with an underlying "real" buffer through cluster_bp(), buf_unmap() does nothing; buf_brelse() on the
339 underlying buffer will tear down the mapping. Otherwise, the buffer was created with buf_alloc() and
340 buf_setupl() was subsequently called; buf_map() created the mapping. In this case, buf_unmap() will
342 @param bp Buffer whose mapping to find or create.
343 @param io_addr Destination for mapping address.
344 @return 0 for success, EINVAL if unable to unmap buffer.
346 errno_t
buf_unmap(buf_t
);
349 @function buf_setdrvdata
350 @abstract Set driver-specific data on a buffer.
351 @param bp Buffer whose driver-data to set.
352 @param drvdata Opaque driver data.
355 void buf_setdrvdata(buf_t
, void *);
358 @function buf_setdrvdata
359 @abstract Get driver-specific data from a buffer.
360 @param bp Buffer whose driver data to get.
361 @return Opaque driver data.
363 void * buf_drvdata(buf_t
);
366 @function buf_setfsprivate
367 @abstract Set filesystem-specific data on a buffer.
368 @param bp Buffer whose filesystem data to set.
369 @param fsprivate Opaque filesystem data.
372 void buf_setfsprivate(buf_t
, void *);
375 @function buf_fsprivate
376 @abstract Get filesystem-specific data from a buffer.
377 @param bp Buffer whose filesystem data to get.
378 @return Opaque filesystem data.
380 void * buf_fsprivate(buf_t
);
384 @abstract Get physical block number associated with a buffer, in the sense of VNOP_BLOCKMAP.
385 @discussion When a buffer's physical block number is the same is its logical block number, then the physical
386 block number is considered uninitialized. A physical block number of -1 indicates that there is no valid
387 physical mapping (e.g. the logical block is invalid or corresponds to a sparse region in a file). Physical
388 block number is normally set by the cluster layer or by buf_getblk().
389 @param bp Buffer whose physical block number to get.
390 @return Block number.
392 daddr64_t
buf_blkno(buf_t
);
396 @abstract Get logical block number associated with a buffer.
397 @discussion Logical block number is set on traditionally-used buffers by an argument passed to buf_getblk(),
398 for example by buf_bread().
399 @param bp Buffer whose logical block number to get.
400 @return Block number.
402 daddr64_t
buf_lblkno(buf_t
);
405 @function buf_setblkno
406 @abstract Set physical block number associated with a buffer.
407 @discussion Physical block number is generally set by the cluster layer or by buf_getblk().
408 @param bp Buffer whose physical block number to set.
409 @param blkno Block number to set.
412 void buf_setblkno(buf_t
, daddr64_t
);
415 @function buf_setlblkno
416 @abstract Set logical block number associated with a buffer.
417 @discussion Logical block number is set on traditionally-used buffers by an argument passed to buf_getblk(),
418 for example by buf_bread().
419 @param bp Buffer whose logical block number to set.
420 @param lblkno Block number to set.
423 void buf_setlblkno(buf_t
, daddr64_t
);
427 @abstract Get count of valid bytes in a buffer. This may be less than the space allocated to the buffer.
428 @param bp Buffer whose byte count to get.
431 uint32_t buf_count(buf_t
);
435 @abstract Get size of data region allocated to a buffer.
436 @discussion May be larger than amount of valid data in buffer.
437 @param bp Buffer whose size to get.
440 uint32_t buf_size(buf_t
);
444 @abstract Get a count of bytes which were not consumed by an I/O on a buffer.
445 @discussion Set when an I/O operations completes.
446 @param bp Buffer whose outstanding count to get.
447 @return Count of unwritten/unread bytes.
449 uint32_t buf_resid(buf_t
);
452 @function buf_setcount
453 @abstract Set count of valid bytes in a buffer. This may be less than the space allocated to the buffer.
454 @param bp Buffer whose byte count to set.
455 @param bcount Count to set.
458 void buf_setcount(buf_t
, uint32_t);
461 @function buf_setsize
462 @abstract Set size of data region allocated to a buffer.
463 @discussion May be larger than amount of valid data in buffer. Should be used by
464 code which is manually providing storage for an iobuf, one allocated with buf_alloc().
465 @param bp Buffer whose size to set.
468 void buf_setsize(buf_t
, uint32_t);
471 @function buf_setresid
472 @abstract Set a count of bytes outstanding for I/O in a buffer.
473 @discussion Set when an I/O operations completes. Examples: called by IOStorageFamily when I/O
474 completes, often called on an "original" buffer when using a manipulated buffer to perform I/O
475 on behalf of the first.
476 @param bp Buffer whose outstanding count to set.
477 @return Count of unwritten/unread bytes.
479 void buf_setresid(buf_t
, uint32_t);
482 @function buf_setdataptr
483 @abstract Set the address at which a buffer's data will be stored.
484 @discussion In traditional buffer use, the data pointer will be set automatically. This routine is
485 useful with iobufs (allocated with buf_alloc()).
486 @param bp Buffer whose data pointer to set.
487 @param data Pointer to data region.
490 void buf_setdataptr(buf_t
, uintptr_t);
493 @function buf_dataptr
494 @abstract Get the address at which a buffer's data is stored; for iobufs, this must
495 be set with buf_setdataptr(). See buf_map().
496 @param bp Buffer whose data pointer to retrieve.
497 @return Data pointer; NULL if unset.
499 uintptr_t buf_dataptr(buf_t
);
503 @abstract Get the vnode associated with a buffer.
504 @discussion Every buffer is associated with a file. Because there is an I/O in flight,
505 there is an iocount on this vnode; it is returned WITHOUT an extra iocount, and vnode_put()
507 @param bp Buffer whose vnode to retrieve.
508 @return Buffer's vnode.
510 vnode_t
buf_vnode(buf_t
);
513 @function buf_setvnode
514 @abstract Set the vnode associated with a buffer.
515 @discussion This call need not be used on traditional buffers; it is for use with iobufs.
516 @param bp Buffer whose vnode to set.
517 @param vp The vnode to attach to the buffer.
520 void buf_setvnode(buf_t
, vnode_t
);
524 @abstract Get the device ID associated with a buffer.
525 @discussion In traditional buffer use, this value is NODEV until buf_strategy() is called unless
526 buf_getblk() was passed a device vnode. It is set on an iobuf if buf_alloc() is passed a device
527 vnode or if buf_setdevice() is called.
528 @param bp Buffer whose device ID to retrieve.
531 dev_t
buf_device(buf_t
);
534 @function buf_setdevice
535 @abstract Set the device associated with a buffer.
536 @discussion A buffer's device is set in buf_strategy() (or in buf_getblk() if the file is a device).
537 It is also set on an iobuf if buf_alloc() is passed a device vnode.
538 @param bp Buffer whose device ID to set.
539 @param vp Device to set on the buffer.
540 @return 0 for success, EINVAL if vp is not a device file.
542 errno_t
buf_setdevice(buf_t
, vnode_t
);
545 @function buf_strategy
546 @abstract Pass an I/O request for a buffer down to the device layer.
547 @discussion This is one of the most important routines in the buffer cache layer. For buffers obtained
548 through buf_getblk, it handles finding physical block numbers for the I/O (with VNOP_BLKTOOFF and
549 VNOP_BLOCKMAP), packaging the I/O into page-sized chunks, and initiating I/O on the disk by calling
550 the device's strategy routine. If a buffer's UPL has been set manually with buf_setupl(), it assumes
551 that the request is already correctly configured with a block number and a size divisible by page size
552 and will just call directly to the device.
553 @param devvp Device on which to perform I/O
554 @param ap vnop_strategy_args structure (most importantly, a buffer).
555 @return 0 for success, or errors from filesystem or device layers.
557 errno_t
buf_strategy(vnode_t
, void *);
560 * Flags for buf_invalblkno()
562 #define BUF_WAIT 0x01
565 @function buf_invalblkno
566 @abstract Invalidate a filesystem logical block in a file.
567 @discussion buf_invalblkno() tries to make the data for a given block in a file
568 invalid; if the buffer for that block is found in core and is not busy, we mark it
569 invalid and call buf_brelse() (see "flags" param for what happens if the buffer is busy).
570 buf_brelse(), noticing that it is invalid, will
571 will return the buffer to the empty-buffer list and tell the VM subsystem to abandon
572 the relevant pages. Data will not be written to backing store--it will be cast aside.
573 Note that this function will only work if the block in question has been
574 obtained with a buf_getblk(). If data has been read into core without using
575 traditional buffer cache routines, buf_invalblkno() will not be able to invalidate it--this
576 includes the use of iobufs.
577 @param bp Buffer whose block to invalidate.
578 @param lblkno Logical block number.
579 @param flags BUF_WAIT: wait for busy buffers to become unbusy and invalidate them then. Otherwise,
580 just return EBUSY for busy blocks.
581 @return 0 for success, EINVAL if vp is not a device file.
583 errno_t
buf_invalblkno(vnode_t
, daddr64_t
, int);
586 @function buf_callback
587 @abstract Get the function set to be called when I/O on a buffer completes.
588 @discussion A function returned by buf_callback was originally set with buf_setcallback().
589 @param bp Buffer whose callback to get.
590 @return 0 for success, or errors from filesystem or device layers.
592 void * buf_callback(buf_t
);
595 @function buf_setcallback
596 @abstract Set a function to be called once when I/O on a buffer completes.
597 @discussion A one-shot callout set with buf_setcallback() will be called from buf_biodone()
598 when I/O completes. It will be passed the "transaction" argument as well as the buffer.
599 buf_setcallback() also marks the buffer as B_ASYNC.
600 @param bp Buffer whose callback to set.
601 @param callback function to use as callback.
602 @param transaction Additional argument to callback function.
603 @return 0; always succeeds.
605 errno_t
buf_setcallback(buf_t
, void (*)(buf_t
, void *), void *);
609 @abstract Set the UPL (Universal Page List), and offset therein, on a buffer.
610 @discussion buf_setupl() should only be called on buffers allocated with buf_alloc().
611 A subsequent call to buf_map() will map the UPL and give back the address at which data
612 begins. After buf_setupl() is called, a buffer is marked B_CLUSTER; when this is the case,
613 buf_strategy() assumes that a buffer is correctly configured to be passed to the device
614 layer without modification. Passing a NULL upl will clear the upl and the B_CLUSTER flag on the
616 @param bp Buffer whose upl to set.
617 @param upl UPL to set in the buffer.
618 @parma offset Offset within upl at which relevant data begin.
619 @return 0 for success, EINVAL if the buffer was not allocated with buf_alloc().
621 errno_t
buf_setupl(buf_t
, upl_t
, uint32_t);
625 @abstract Clone a buffer with a restricted range and an optional callback.
626 @discussion Generates a buffer which is identical to its "bp" argument except that
627 it spans a subset of the data of the original. The buffer to be cloned should
628 have been allocated with buf_alloc(). Checks its arguments to make sure
629 that the data subset is coherent. Optionally, adds a callback function and argument to it
630 to be called when I/O completes (as with buf_setcallback(), but B_ASYNC is not set). If the original buffer had
631 a upl set through buf_setupl(), this upl is copied to the new buffer; otherwise, the original's
632 data pointer is used raw. The buffer must be released with buf_free().
633 @param bp Buffer to clone.
634 @param io_offset Offset, relative to start of data in original buffer, at which new buffer's data will begin.
635 @param io_size Size of buffer region in new buffer, in the sense of buf_count().
636 @param iodone Callback to be called from buf_biodone() when I/O completes, in the sense of buf_setcallback().
637 @param arg Argument to pass to iodone() callback.
638 @return NULL if io_offset/io_size combination is invalid for the buffer to be cloned; otherwise, the new buffer.
640 buf_t
buf_clone(buf_t
, int, int, void (*)(buf_t
, void *), void *);
644 @function buf_create_shadow
645 @abstract Create a shadow buffer with optional private storage and an optional callback.
646 @param bp Buffer to shadow.
647 @param force_copy If TRUE, do not link the shadaow to 'bp' and if 'external_storage' == NULL,
648 force a copy of the data associated with 'bp'.
649 @param external_storage If non-NULL, associate it with the new buffer as its storage instead of the
650 storage currently associated with 'bp'.
651 @param iodone Callback to be called from buf_biodone() when I/O completes, in the sense of buf_setcallback().
652 @param arg Argument to pass to iodone() callback.
653 @return NULL if the buffer to be shadowed is not B_META or a primary buffer (i.e. not a shadow buffer); otherwise, the new buffer.
656 buf_t
buf_create_shadow(buf_t bp
, boolean_t force_copy
, uintptr_t external_storage
, void (*iodone
)(buf_t
, void *), void *arg
);
661 @abstract returns true if 'bp' is a shadow of another buffer.
662 @param bp Buffer to query.
663 @return 1 if 'bp' is a shadow, 0 otherwise.
665 int buf_shadow(buf_t bp
);
670 @abstract Allocate an uninitialized buffer.
671 @discussion A buffer returned by buf_alloc() is marked as busy and as an iobuf; it has no storage set up and must be
672 set up using buf_setdataptr() or buf_setupl()/buf_map().
673 @param vp vnode to associate with the buffer: optionally NULL. If vp is a device file, then
674 the buffer's associated device will be set. If vp is NULL, it can be set later with buf_setvnode().
677 buf_t
buf_alloc(vnode_t
);
681 @abstract Free a buffer that was allocated with buf_alloc().
682 @discussion The storage (UPL, data pointer) associated with an iobuf must be freed manually.
683 @param bp The buffer to free.
686 void buf_free(buf_t
);
689 * flags for buf_invalidateblks
691 #define BUF_WRITE_DATA 0x0001 /* write data blocks first */
692 #define BUF_SKIP_META 0x0002 /* skip over metadata blocks */
693 #define BUF_INVALIDATE_LOCKED 0x0004 /* force B_LOCKED blocks to be invalidated */
696 @function buf_invalidateblks
697 @abstract Invalidate all the blocks associated with a vnode.
698 @discussion This function does for all blocks associated with a vnode what buf_invalblkno does for one block.
699 Again, it will only be able to invalidate data which were populated with traditional buffer cache routines,
700 i.e. by buf_getblk() and callers thereof. Unlike buf_invalblkno(), it can be made to write dirty data to disk
701 rather than casting it aside.
702 @param bp The buffer whose data to invalidate.
703 @param flags BUF_WRITE_DATA: write dirty data to disk with VNOP_BWRITE() before kicking buffer cache entries out.
704 BUF_SKIP_META: do not invalidate metadata blocks.
705 @param slpflag Flags to pass to "msleep" while waiting to acquire busy buffers.
706 @param slptimeo Timeout in "hz" (1/100 second) to wait for a buffer to become unbusy before waking from sleep
707 and re-starting the scan.
708 @return 0 for success, error values from msleep().
710 int buf_invalidateblks(vnode_t
, int, int, int);
713 * flags for buf_flushdirtyblks and buf_iterate
715 #define BUF_SKIP_NONLOCKED 0x01
716 #define BUF_SKIP_LOCKED 0x02
717 #define BUF_SCAN_CLEAN 0x04 /* scan the clean buffers */
718 #define BUF_SCAN_DIRTY 0x08 /* scan the dirty buffers */
719 #define BUF_NOTIFY_BUSY 0x10 /* notify the caller about the busy pages during the scan */
722 #define BUF_RETURNED 0
723 #define BUF_RETURNED_DONE 1
724 #define BUF_CLAIMED 2
725 #define BUF_CLAIMED_DONE 3
727 @function buf_flushdirtyblks
728 @abstract Write dirty file blocks to disk.
729 @param vp The vnode whose blocks to flush.
730 @param wait Wait for writes to complete before returning.
731 @param flags Can pass zero, meaning "flush all dirty buffers."
732 BUF_SKIP_NONLOCKED: Skip buffers which are not busy when we encounter them.
733 BUF_SKIP_LOCKED: Skip buffers which are busy when we encounter them.
734 @param msg String to pass to msleep().
737 void buf_flushdirtyblks(vnode_t
, int, int, const char *);
740 @function buf_iterate
741 @abstract Perform some operation on all buffers associated with a vnode.
742 @param vp The vnode whose buffers to scan.
743 @param callout Function to call on each buffer. Should return one of:
744 BUF_RETURNED: buf_iterate() should call buf_brelse() on the buffer.
745 BUF_RETURNED_DONE: buf_iterate() should call buf_brelse() on the buffer and then stop iterating.
746 BUF_CLAIMED: buf_iterate() should continue iterating (and not call buf_brelse()).
747 BUF_CLAIMED_DONE: buf_iterate() should stop iterating (and not call buf_brelse()).
749 BUF_SKIP_NONLOCKED: Skip buffers which are not busy when we encounter them. BUF_SKIP_LOCKED: Skip buffers which are busy when we encounter them.
750 BUF_SCAN_CLEAN: Call out on clean buffers.
751 BUF_SCAN_DIRTY: Call out on dirty buffers.
752 BUF_NOTIFY_BUSY: If a buffer cannot be acquired, pass a NULL buffer to callout; otherwise,
753 that buffer will be silently skipped.
754 @param arg Argument to pass to callout in addition to buffer.
757 void buf_iterate(vnode_t
, int (*)(buf_t
, void *), int, void *);
761 @abstract Zero out the storage associated with a buffer.
762 @discussion Calls buf_map() to get the buffer's data address; for a B_CLUSTER
763 buffer (one which has had buf_setupl() called on it), it tries to map the buffer's
764 UPL into memory; should only be called once during the life cycle of an iobuf (one allocated
766 @param bp The buffer to zero out.
769 void buf_clear(buf_t
);
772 @function buf_bawrite
773 @abstract Start an asychronous write on a buffer.
774 @discussion Calls VNOP_BWRITE to start the process of propagating an asynchronous write down to the device layer.
775 Callers can wait for writes to complete at their discretion using buf_biowait(). When this function is called,
776 data should already have been written to the buffer's data region.
777 @param bp The buffer on which to initiate I/O.
778 @param throttle If "throttle" is nonzero and more than VNODE_ASYNC_THROTTLE writes are in progress on this file,
779 buf_bawrite() will block until the write count drops below VNODE_ASYNC_THROTTLE. If "throttle" is zero and the write
780 count is high, it will fail with EWOULDBLOCK; the caller can decide whether to make a blocking call or pursue
782 @return EWOULDBLOCK if write count is high and "throttle" is zero; otherwise, errors from VNOP_BWRITE.
784 errno_t
buf_bawrite(buf_t
);
787 @function buf_bdwrite
788 @abstract Mark a buffer for delayed write.
789 @discussion Marks a buffer as waiting for delayed write and the current I/O as complete; data will be written to backing store
790 before the buffer is reused, but it will not be queued for I/O immediately. Note that for buffers allocated
791 with buf_alloc(), there are no such guarantees; you must take care of your own flushing to disk. If
792 the number of delayed writes pending on the system is greater than an internal limit and the caller has not
793 requested otherwise [see return_error] , buf_bdwrite() will unilaterally launch an asynchronous I/O with buf_bawrite() to keep the pile of
794 delayed writes from getting too large.
795 @param bp The buffer to mark for delayed write.
796 @param return_error If the number of pending delayed writes systemwide is larger than an internal limit,
797 return EAGAIN rather than doing an asynchronous write.
798 @return EAGAIN for return_error != 0 case, 0 for succeess, errors from buf_bawrite.
800 errno_t
buf_bdwrite(buf_t
);
804 @abstract Write a buffer's data to backing store.
805 @discussion Once the data in a buffer has been modified, buf_bwrite() starts sending it to disk by calling
806 VNOP_STRATEGY. Unless B_ASYNC has been set on the buffer (by buf_setflags() or otherwise), data will have
807 been written to disk when buf_bwrite() returns. See Bach (p 56).
808 @param bp The buffer to write to disk.
809 @return 0 for success; errors from buf_biowait().
811 errno_t
buf_bwrite(buf_t
);
814 @function buf_biodone
815 @abstract Mark an I/O as completed.
816 @discussion buf_biodone() should be called by whosoever decides that an I/O on a buffer is complete; for example,
817 IOStorageFamily. It clears the dirty flag on a buffer and signals on the vnode that a write has completed
818 with vnode_writedone(). If a callout or filter has been set on the buffer, that function is called. In the case
819 of a callout, that function is expected to take care of cleaning up and freeing the buffer.
820 Otherwise, if the buffer is marked B_ASYNC (e.g. it was passed to buf_bawrite()), then buf_biodone()
821 considers itself justified in calling buf_brelse() to return it to free lists--no one is waiting for it. Finally,
822 waiters on the bp (e.g. in buf_biowait()) are woken up.
823 @param bp The buffer to mark as done with I/O.
826 void buf_biodone(buf_t
);
829 @function buf_biowait
830 @abstract Wait for I/O on a buffer to complete.
831 @discussion Waits for I/O on a buffer to finish, as marked by a buf_biodone() call.
832 @param bp The buffer to wait on.
833 @return 0 for a successful wait; nonzero the buffer has been marked as EINTR or had an error set on it.
835 errno_t
buf_biowait(buf_t
);
839 @abstract Release any claim to a buffer, sending it back to free lists.
840 @discussion buf_brelse() cleans up buffer state and releases a buffer to the free lists. If the buffer
841 is not marked invalid and its pages are dirty (e.g. a delayed write was made), its data will be commited
842 to backing store. If it is marked invalid, its data will be discarded completely.
843 A valid, cacheable buffer will be put on a list and kept in the buffer hash so it
844 can be found again; otherwise, it will be dissociated from its vnode and treated as empty. Which list a valid
845 buffer is placed on depends on the use of buf_markaged(), whether it is metadata, and the B_LOCKED flag. A
846 B_LOCKED buffer will not be available for reuse by other files, though its data may be paged out.
847 Note that buf_brelse() is intended for use with traditionally allocated buffers.
848 @param bp The buffer to release.
851 void buf_brelse(buf_t
);
855 @abstract Synchronously read a block of a file.
856 @discussion buf_bread() is the traditional way to read a single logical block of a file through the buffer cache.
857 It tries to find the buffer and corresponding page(s) in core, calls VNOP_STRATEGY if necessary to bring the data
858 into memory, and waits for I/O to complete. It should not be used to read blocks of greater than 4K (one VM page)
859 in size; use cluster routines for large reads. Indeed, the cluster layer is a more efficient choice for reading DATA
860 unless you need some finely-tuned semantics that it cannot provide.
861 @param vp The file from which to read.
862 @param blkno The logical (filesystem) block number to read.
863 @param size Size of block; do not use for sizes > 4K.
864 @param cred Credential to store and use for reading from disk if data are not already in core.
865 @param bpp Destination pointer for buffer.
866 @return 0 for success, or an error from buf_biowait().
868 errno_t
buf_bread(vnode_t
, daddr64_t
, int, kauth_cred_t
, buf_t
*);
872 @abstract Read a block from a file with read-ahead.
873 @discussion buf_breadn() reads one block synchronously in the style of buf_bread() and fires
874 off a specified set of asynchronous reads to improve the likelihood of future cache hits.
875 It should not be used to read blocks of greater than 4K (one VM page) in size; use cluster
876 routines for large reads. Indeed, the cluster layer is a more efficient choice for reading DATA
877 unless you need some finely-tuned semantics that it cannot provide.
878 @param vp The file from which to read.
879 @param blkno The logical (filesystem) block number to read synchronously.
880 @param size Size of block; do not use for sizes > 4K.
881 @param rablks Array of logical block numbers for asynchronous read-aheads.
882 @param rasizes Array of block sizes for asynchronous read-aheads, each index corresponding to same index in "rablks."
883 @param nrablks Number of entries in read-ahead arrays.
884 @param cred Credential to store and use for reading from disk if data are not already in core.
885 @param bpp Destination pointer for buffer.
886 @return 0 for success, or an error from buf_biowait().
888 errno_t
buf_breadn(vnode_t
, daddr64_t
, int, daddr64_t
*, int *, int, kauth_cred_t
, buf_t
*);
891 @function buf_meta_bread
892 @abstract Synchronously read a metadata block of a file.
893 @discussion buf_meta_bread() is the traditional way to read a single logical block of a file through the buffer cache.
894 It tries to find the buffer and corresponding page(s) in core, calls VNOP_STRATEGY if necessary to bring the data
895 into memory, and waits for I/O to complete. It should not be used to read blocks of greater than 4K (one VM page)
896 in size; use cluster routines for large reads. Reading meta-data through the traditional buffer cache, unlike
897 reading data, is efficient and encouraged, especially if the blocks being read are significantly smaller than page size.
898 @param vp The file from which to read.
899 @param blkno The logical (filesystem) block number to read.
900 @param size Size of block; do not use for sizes > 4K.
901 @param cred Credential to store and use for reading from disk if data are not already in core.
902 @param bpp Destination pointer for buffer.
903 @return 0 for success, or an error from buf_biowait().
905 errno_t
buf_meta_bread(vnode_t
, daddr64_t
, int, kauth_cred_t
, buf_t
*);
908 @function buf_meta_breadn
909 @abstract Read a metadata block from a file with read-ahead.
910 @discussion buf_meta_breadn() reads one block synchronously in the style of buf_meta_bread() and fires
911 off a specified set of asynchronous reads to improve the likelihood of future cache hits.
912 It should not be used to read blocks of greater than 4K (one VM page) in size; use cluster
913 routines for large reads.
914 @param vp The file from which to read.
915 @param blkno The logical (filesystem) block number to read synchronously.
916 @param size Size of block; do not use for sizes > 4K.
917 @param rablks Array of logical block numbers for asynchronous read-aheads.
918 @param rasizes Array of block sizes for asynchronous read-aheads, each index corresponding to same index in "rablks."
919 @param nrablks Number of entries in read-ahead arrays.
920 @param cred Credential to store and use for reading from disk if data are not already in core.
921 @param bpp Destination pointer for buffer.
922 @return 0 for success, or an error from buf_biowait().
924 errno_t
buf_meta_breadn(vnode_t
, daddr64_t
, int, daddr64_t
*, int *, int, kauth_cred_t
, buf_t
*);
928 @abstract Adjust a buffer's count to be no more than maximum physical I/O transfer size for the host architecture.
929 @discussion physio() takes as a parameter a function to bound transfer sizes for each VNOP_STRATEGY() call. minphys()
930 is a default implementation. It calls buf_setcount() to make the buffer's count the min() of its current count
931 and the max I/O size for the host architecture.
932 @param bp The buffer whose byte count to modify.
933 @return New byte count.
935 u_int
minphys(buf_t bp
);
939 @abstract Perform I/O on a device to/from target memory described by a uio.
940 @discussion physio() allows I/O directly from a device to user-space memory. It waits
941 for all I/O to complete before returning.
942 @param f_strategy Strategy routine to call to initiate I/O.
943 @param bp Buffer to configure and pass to strategy routine; can be NULL.
944 @param dev Device on which to perform I/O.
945 @param flags B_READ or B_WRITE.
946 @param f_minphys Function which calls buf_setcount() to set a byte count which is suitably
947 small for the device in question. Returns byte count that has been set (or unchanged) on the buffer.
948 @param uio UIO describing the I/O operation.
949 @param blocksize Logical block size for this vnode.
950 @return 0 for success; EFAULT for an invalid uio; errors from buf_biowait().
952 int physio(void (*)(buf_t
), buf_t
, dev_t
, int , u_int (*)(buf_t
), struct uio
*, int );
956 * Flags for operation type in getblk()
958 #define BLK_READ 0x01 /* buffer for read */
959 #define BLK_WRITE 0x02 /* buffer for write */
960 #define BLK_META 0x10 /* buffer for metadata */
962 * modifier for above flags... if set, getblk will only return
963 * a bp that is already valid... i.e. found in the cache
965 #define BLK_ONLYVALID 0x80000000
969 @abstract Traditional buffer cache routine to get a buffer corresponding to a logical block in a file.
970 @discussion buf_getblk() gets a buffer, not necessarily containing valid data, representing a block in a file.
971 A metadata buffer will be returned with its own zone-allocated storage, managed by the traditional buffer-cache
972 layer, whereas data buffers will be returned hooked into backing by the UBC (which in fact controls the caching of data).
973 buf_getblk() first looks for the buffer header in cache; if the buffer is in-core but busy, buf_getblk() will wait for it to become
974 unbusy, depending on the slpflag and slptimeo parameters. If the buffer is found unbusy and is a metadata buffer,
975 it must already contain valid data and will be returned directly; data buffers will have a UPL configured to
976 prepare for interaction with the underlying UBC. If the buffer is found in core, it will be marked as such
977 and buf_fromcache() will return truth. A buffer is allocated and initialized (but not filled with data)
978 if none is found in core. buf_bread(), buf_breadn(), buf_meta_bread(), and buf_meta_breadn() all
979 return buffers obtained with buf_getblk().
980 @param vp File for which to get block.
981 @param blkno Logical block number.
982 @param size Size of block.
983 @param slpflag Flag to pass to msleep() while waiting for buffer to become unbusy.
984 @param slptimeo Time, in milliseconds, to wait for buffer to become unbusy. 0 means to wait indefinitely.
985 @param operation BLK_READ: want a read buffer. BLK_WRITE: want a write buffer. BLK_META: want a metadata buffer. BLK_ONLYVALID:
986 only return buffers which are found in core (do not allocate anew), and do not change buffer size. The last remark means
987 that if a given logical block is found in core with a different size than what is requested, the buffer size will not be modified.
988 @return Buffer found in core or newly allocated, either containing valid data or ready for I/O.
990 buf_t
buf_getblk(vnode_t
, daddr64_t
, int, int, int, int);
993 @function buf_geteblk
994 @abstract Get a metadata buffer which is marked invalid and not associated with any vnode.
995 @discussion A buffer is returned with zone-allocated storage of the specified size, marked B_META and invalid.
996 It has no vnode and is not visible in the buffer hash.
997 @param size Size of buffer.
998 @return Always returns a new buffer.
1000 buf_t
buf_geteblk(int);
1003 @function buf_clear_redundancy_flags
1004 @abstract Clear flags on a buffer.
1005 @discussion: buffer_redundancy_flags &= ~flags
1006 @param bp Buffer whose flags to clear.
1007 @param flags Flags to remove from buffer's mask
1010 void buf_clear_redundancy_flags(buf_t
, uint32_t);
1013 @function buf_redundancyflags
1014 @abstract Get redundancy flags set on a buffer.
1015 @param bp Buffer whose redundancy flags to grab.
1018 uint32_t buf_redundancy_flags(buf_t
);
1021 @function buf_setredundancyflags
1022 @abstract Set redundancy flags on a buffer.
1023 @discussion: buffer_redundancy_flags |= flags
1024 @param bp Buffer whose flags to set.
1025 @param flags Flags to add to buffer's redundancy flags
1028 void buf_set_redundancy_flags(buf_t
, uint32_t);
1032 @abstract Gets the attributes for this buf.
1033 @param bp Buffer whose attributes to get.
1036 bufattr_t
buf_attr(buf_t
);
1039 @function buf_markstatic
1040 @abstract Mark a buffer as being likely to contain static data.
1041 @param bp Buffer to mark.
1044 void buf_markstatic(buf_t
);
1047 @function buf_static
1048 @abstract Check if a buffer contains static data.
1049 @param bp Buffer to test.
1050 @return Nonzero if buffer has static data, 0 otherwise.
1052 int buf_static(buf_t
);
1054 #ifdef KERNEL_PRIVATE
1055 void buf_setfilter(buf_t
, void (*)(buf_t
, void *), void *, void (**)(buf_t
, void *), void **);
1057 bufattr_t
bufattr_alloc(void);
1059 void bufattr_free(bufattr_t bap
);
1062 @function bufattr_cpaddr
1063 @abstract Get the address of cp_entry on a buffer.
1064 @param bap Buffer Attribute whose cp_entry to get.
1067 void *bufattr_cpaddr(bufattr_t
);
1070 @function bufattr_cpoff
1071 @abstract Gets the file offset on the buffer.
1072 @param bap Buffer Attribute whose file offset value is used
1075 uint64_t bufattr_cpoff(bufattr_t
);
1079 @function bufattr_setcpaddr
1080 @abstract Set the address of cp_entry on a buffer attribute.
1081 @param bap Buffer Attribute whose cp entry value has to be set
1084 void bufattr_setcpaddr(bufattr_t
, void *);
1087 @function bufattr_setcpoff
1088 @abstract Set the file offset for a content protected I/O on
1090 @param bap Buffer Attribute whose cp file offset has to be set
1093 void bufattr_setcpoff(bufattr_t
, uint64_t);
1096 @function bufattr_rawencrypted
1097 @abstract Check if a buffer contains raw encrypted data.
1098 @param bap Buffer attribute to test.
1099 @return Nonzero if buffer has raw encrypted data, 0 otherwise.
1101 int bufattr_rawencrypted(bufattr_t bap
);
1104 @function bufattr_throttled
1105 @abstract Check if a buffer is throttled.
1106 @param bap Buffer attribute to test.
1107 @return Nonzero if the buffer is throttled, 0 otherwise.
1109 int bufattr_throttled(bufattr_t bap
);
1112 @function bufattr_nocache
1113 @abstract Check if a buffer has nocache attribute.
1114 @param bap Buffer attribute to test.
1115 @return Nonzero if the buffer is not cached, 0 otherwise.
1117 int bufattr_nocache(bufattr_t bap
);
1120 @function bufattr_meta
1121 @abstract Check if a buffer has meta attribute.
1122 @param bap Buffer attribute to test.
1123 @return Nonzero if the buffer has meta attribute, 0 otherwise.
1126 int bufattr_meta(bufattr_t bap
);
1129 @function bufattr_delayidlesleep
1130 @abstract Check if a buffer is marked to delay idle sleep on disk IO.
1131 @param bap Buffer attribute to test.
1132 @return Nonzero if the buffer is marked to delay idle sleep on disk IO, 0 otherwise.
1134 int bufattr_delayidlesleep(bufattr_t bap
);
1136 #endif /* KERNEL_PRIVATE */
1141 /* Macros to clear/set/test flags. */
1142 #define SET(t, f) (t) |= (f)
1143 #define CLR(t, f) (t) &= ~(f)
1144 #define ISSET(t, f) ((t) & (f))
1147 #endif /* !_SYS_BUF_H_ */