]>
git.saurik.com Git - apple/xnu.git/blob - bsd/sys/buf.h
08216cac0e1e898b9eb60eb073a8d4222019eeed
2 * Copyright (c) 2000-2005 Apple Computer, Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
30 * Copyright (c) 1982, 1986, 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 * (c) UNIX System Laboratories, Inc.
33 * All or some portions of this file are derived from material licensed
34 * to the University of California by American Telephone and Telegraph
35 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
36 * the permission of UNIX System Laboratories, Inc.
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in the
45 * documentation and/or other materials provided with the distribution.
46 * 3. All advertising materials mentioning features or use of this software
47 * must display the following acknowledgement:
48 * This product includes software developed by the University of
49 * California, Berkeley and its contributors.
50 * 4. Neither the name of the University nor the names of its contributors
51 * may be used to endorse or promote products derived from this software
52 * without specific prior written permission.
54 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
55 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
56 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
57 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
58 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
59 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
60 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
61 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
62 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
63 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
66 * @(#)buf.h 8.9 (Berkeley) 3/30/95
72 #include <sys/cdefs.h>
73 #include <sys/kernel_types.h>
74 #include <sys/ucred.h>
75 #include <mach/memory_object_types.h>
78 #define B_WRITE 0x00000000 /* Write buffer (pseudo flag). */
79 #define B_READ 0x00000001 /* Read buffer. */
80 #define B_ASYNC 0x00000002 /* Start I/O, do not wait. */
81 #define B_NOCACHE 0x00000004 /* Do not cache block after use. */
82 #define B_DELWRI 0x00000008 /* Delay I/O until buffer reused. */
83 #define B_LOCKED 0x00000010 /* Locked in core (not reusable). */
84 #define B_PHYS 0x00000020 /* I/O to user memory. */
85 #define B_CLUSTER 0x00000040 /* UPL based I/O generated by cluster layer */
86 #define B_PAGEIO 0x00000080 /* Page in/out */
87 #define B_META 0x00000100 /* buffer contains meta-data. */
88 #define B_RAW 0x00000200 /* Set by physio for raw transfers. */
89 #define B_FUA 0x00000400 /* Write-through disk cache(if supported) */
90 #define B_PASSIVE 0x00000800 /* PASSIVE I/Os are ignored by THROTTLE I/O */
91 #define B_IOSTREAMING 0x00001000 /* sequential access pattern detected */
92 #define B_THROTTLED_IO 0x00002000 /* low priority I/O */
93 #define B_ENCRYPTED_IO 0x00004000 /* Encrypted I/O */
95 * make sure to check when adding flags that
96 * that the new flags don't overlap the definitions
103 @function buf_markaged
104 @abstract Mark a buffer as "aged," i.e. as a good candidate to be discarded and reused after buf_brelse().
105 @param bp Buffer to mark.
107 void buf_markaged(buf_t
);
110 @function buf_markinvalid
111 @abstract Mark a buffer as not having valid data and being ready for immediate reuse after buf_brelse().
112 @param bp Buffer to mark.
114 void buf_markinvalid(buf_t
);
117 @function buf_markdelayed
118 @abstract Mark a buffer as a delayed write: mark it dirty without actually scheduling I/O.
119 @discussion Data will be flushed to disk at some later time, not with brelse(). A sync()/fsync()
120 or pressure necessitating reuse of the buffer will cause it to be written back to disk.
121 @param bp Buffer to mark.
123 void buf_markdelayed(buf_t
);
125 void buf_markclean(buf_t
);
128 @function buf_markeintr
129 @abstract Mark a buffer as having been interrupted during I/O.
130 @discussion Waiters for I/O to complete (buf_biowait()) will return with EINTR when woken up.
131 buf_markeintr does not itself do a wakeup.
132 @param bp Buffer to mark.
134 void buf_markeintr(buf_t
);
137 @function buf_markfua
138 @abstract Mark a buffer for write through disk cache, if disk supports it.
139 @param bp Buffer to mark.
141 void buf_markfua(buf_t
);
145 @abstract Check if a buffer is marked for write through disk caches.
146 @param bp Buffer to test.
147 @return Nonzero if buffer is marked for write-through, 0 if not.
153 @abstract Check if a buffer contains valid data.
154 @param bp Buffer to test.
155 @return Nonzero if buffer has valid data, 0 if not.
157 int buf_valid(buf_t
);
160 @function buf_fromcache
161 @abstract Check if a buffer's data was found in core.
162 @discussion Will return truth after a buf_getblk that finds a valid buffer in the cache or the relevant
163 data in core (but not in a buffer).
164 @param bp Buffer to test.
165 @return Nonzero if we got this buffer's data without doing I/O, 0 if not.
167 int buf_fromcache(buf_t
);
171 @abstract Get the upl (Universal Page List) associated with a buffer.
172 @discussion Buffers allocated with buf_alloc() are not returned with a upl, and
173 traditional buffers only have a upl while an I/O is in progress.
174 @param bp Buffer whose upl to grab.
175 @return Buffer's upl if it has one, else NULL.
177 void * buf_upl(buf_t
);
180 @function buf_uploffset
181 @abstract Get the offset into a UPL at which this buffer begins.
182 @discussion This function should only be called on iobufs, i.e. buffers allocated with buf_alloc().
183 @param bp Buffer whose uploffset to grab.
184 @return Buffer's uploffset--does not check whether that value makes sense for this buffer.
186 uint32_t buf_uploffset(buf_t
);
190 @abstract Get the credential associated with a buffer for reading.
191 @discussion No reference is taken; if the credential is to be held on to persistently, an additional
192 reference must be taken with kauth_cred_ref.
193 @param bp Buffer whose credential to grab.
194 @return Credential if it exists, else NULL.
196 kauth_cred_t
buf_rcred(buf_t
);
200 @abstract Get the credential associated with a buffer for writing.
201 @discussion No reference is taken; if the credential is to be held on to persistently, an additional
202 reference must be taken with kauth_cred_ref.
203 @param bp Buffer whose credential to grab.
204 @return Credential if it exists, else NULL.
206 kauth_cred_t
buf_wcred(buf_t
);
210 @abstract Get the process associated with this buffer.
211 @discussion buf_proc() will generally return NULL; a process is currently only associated with
212 a buffer in the event of a physio() call.
213 @param bp Buffer whose associated process to find.
214 @return Associated process, possibly NULL.
216 proc_t
buf_proc(buf_t
);
219 @function buf_dirtyoff
220 @abstract Get the starting offset of the dirty region associated with a buffer.
221 @discussion The dirty offset is zero unless someone explicitly calls buf_setdirtyoff() (which the kernel does not).
222 @param bp Buffer whose dirty offset to get.
223 @return Dirty offset (0 if not explicitly changed).
225 uint32_t buf_dirtyoff(buf_t
);
228 @function buf_dirtyend
229 @abstract Get the ending offset of the dirty region associated with a buffer.
230 @discussion If the buffer's data was found incore and dirty, the dirty end is the size of the block; otherwise, unless
231 someone outside of xnu explicitly changes it by calling buf_setdirtyend(), it will be zero.
232 @param bp Buffer whose dirty end to get.
233 @return 0 if buffer is found clean; size of buffer if found dirty. Can be set to any value by callers of buf_setdirtyend().
235 uint32_t buf_dirtyend(buf_t
);
238 @function buf_setdirtyoff
239 @abstract Set the starting offset of the dirty region associated with a buffer.
240 @discussion This value is zero unless someone set it explicitly.
241 @param bp Buffer whose dirty end to set.
244 void buf_setdirtyoff(buf_t
, uint32_t);
247 @function buf_setdirtyend
248 @abstract Set the ending offset of the dirty region associated with a buffer.
249 @discussion If the buffer's data was found incore and dirty, the dirty end is the size of the block; otherwise, unless
250 someone outside of xnu explicitly changes it by calling buf_setdirtyend(), it will be zero.
251 @param bp Buffer whose dirty end to set.
254 void buf_setdirtyend(buf_t
, uint32_t);
258 @abstract Get the error value associated with a buffer.
259 @discussion Errors are set with buf_seterror().
260 @param bp Buffer whose error value to retrieve.
261 @return Error value, directly.
263 errno_t
buf_error(buf_t
);
266 @function buf_seterror
267 @abstract Set an error value on a buffer.
268 @param bp Buffer whose error value to set.
271 void buf_seterror(buf_t
, errno_t
);
274 @function buf_setflags
275 @abstract Set flags on a buffer.
276 @discussion: buffer_flags |= flags
277 @param bp Buffer whose flags to set.
278 @param flags Flags to add to buffer's mask. B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA
281 void buf_setflags(buf_t
, int32_t);
284 @function buf_clearflags
285 @abstract Clear flags on a buffer.
286 @discussion: buffer_flags &= ~flags
287 @param bp Buffer whose flags to clear.
288 @param flags Flags to remove from buffer's mask. B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA
291 void buf_clearflags(buf_t
, int32_t);
295 @abstract Get flags set on a buffer.
296 @discussion Valid flags are B_LOCKED/B_NOCACHE/B_ASYNC/B_READ/B_WRITE/B_PAGEIO/B_FUA.
297 @param bp Buffer whose flags to grab.
300 int32_t buf_flags(buf_t
);
304 @abstract Reset I/O flag state on a buffer.
305 @discussion Clears current flags on a buffer (internal and external) and allows some new flags to be set.
306 Used perhaps to prepare an iobuf for reuse.
307 @param bp Buffer whose flags to grab.
308 @param flags Flags to set on buffer: B_READ, B_WRITE, B_ASYNC, B_NOCACHE.
311 void buf_reset(buf_t
, int32_t);
315 @abstract Get virtual mappings for buffer data.
316 @discussion For buffers created through buf_getblk() (i.e. traditional buffer cache usage),
317 buf_map() just returns the address at which data was mapped by but_getblk(). For a B_CLUSTER buffer, i.e. an iobuf
318 whose upl state is managed manually, there are two possibilities. If the buffer was created
319 with an underlying "real" buffer through cluster_bp(), the mapping of the "real" buffer is returned.
320 Otherwise, the buffer was created with buf_alloc() and buf_setupl() was subsequently called; buf_map()
321 will call ubc_upl_map() to get a mapping for the buffer's upl and return the start of that mapping
322 plus the buffer's upl offset (set in buf_setupl()). In the last case, buf_unmap() must later be called
323 to tear down the mapping. NOTE: buf_map() does not set the buffer data pointer; this must be done with buf_setdataptr().
324 @param bp Buffer whose mapping to find or create.
325 @param io_addr Destination for mapping address.
326 @return 0 for success, ENOMEM if unable to map the buffer.
328 errno_t
buf_map(buf_t
, caddr_t
*);
332 @abstract Release mappings for buffer data.
333 @discussion For buffers created through buf_getblk() (i.e. traditional buffer cache usage),
334 buf_unmap() does nothing; buf_brelse() will take care of unmapping. For a B_CLUSTER buffer, i.e. an iobuf
335 whose upl state is managed manually, there are two possibilities. If the buffer was created
336 with an underlying "real" buffer through cluster_bp(), buf_unmap() does nothing; buf_brelse() on the
337 underlying buffer will tear down the mapping. Otherwise, the buffer was created with buf_alloc() and
338 buf_setupl() was subsequently called; buf_map() created the mapping. In this case, buf_unmap() will
340 @param bp Buffer whose mapping to find or create.
341 @param io_addr Destination for mapping address.
342 @return 0 for success, EINVAL if unable to unmap buffer.
344 errno_t
buf_unmap(buf_t
);
347 @function buf_setdrvdata
348 @abstract Set driver-specific data on a buffer.
349 @param bp Buffer whose driver-data to set.
350 @param drvdata Opaque driver data.
353 void buf_setdrvdata(buf_t
, void *);
356 @function buf_setdrvdata
357 @abstract Get driver-specific data from a buffer.
358 @param bp Buffer whose driver data to get.
359 @return Opaque driver data.
361 void * buf_drvdata(buf_t
);
364 @function buf_setfsprivate
365 @abstract Set filesystem-specific data on a buffer.
366 @param bp Buffer whose filesystem data to set.
367 @param fsprivate Opaque filesystem data.
370 void buf_setfsprivate(buf_t
, void *);
373 @function buf_fsprivate
374 @abstract Get filesystem-specific data from a buffer.
375 @param bp Buffer whose filesystem data to get.
376 @return Opaque filesystem data.
378 void * buf_fsprivate(buf_t
);
382 @abstract Get physical block number associated with a buffer, in the sense of VNOP_BLOCKMAP.
383 @discussion When a buffer's physical block number is the same is its logical block number, then the physical
384 block number is considered uninitialized. A physical block number of -1 indicates that there is no valid
385 physical mapping (e.g. the logical block is invalid or corresponds to a sparse region in a file). Physical
386 block number is normally set by the cluster layer or by buf_getblk().
387 @param bp Buffer whose physical block number to get.
388 @return Block number.
390 daddr64_t
buf_blkno(buf_t
);
394 @abstract Get logical block number associated with a buffer.
395 @discussion Logical block number is set on traditionally-used buffers by an argument passed to buf_getblk(),
396 for example by buf_bread().
397 @param bp Buffer whose logical block number to get.
398 @return Block number.
400 daddr64_t
buf_lblkno(buf_t
);
403 @function buf_setblkno
404 @abstract Set physical block number associated with a buffer.
405 @discussion Physical block number is generally set by the cluster layer or by buf_getblk().
406 @param bp Buffer whose physical block number to set.
407 @param blkno Block number to set.
410 void buf_setblkno(buf_t
, daddr64_t
);
413 @function buf_setlblkno
414 @abstract Set logical block number associated with a buffer.
415 @discussion Logical block number is set on traditionally-used buffers by an argument passed to buf_getblk(),
416 for example by buf_bread().
417 @param bp Buffer whose logical block number to set.
418 @param lblkno Block number to set.
421 void buf_setlblkno(buf_t
, daddr64_t
);
425 @abstract Get count of valid bytes in a buffer. This may be less than the space allocated to the buffer.
426 @param bp Buffer whose byte count to get.
429 uint32_t buf_count(buf_t
);
433 @abstract Get size of data region allocated to a buffer.
434 @discussion May be larger than amount of valid data in buffer.
435 @param bp Buffer whose size to get.
438 uint32_t buf_size(buf_t
);
442 @abstract Get a count of bytes which were not consumed by an I/O on a buffer.
443 @discussion Set when an I/O operations completes.
444 @param bp Buffer whose outstanding count to get.
445 @return Count of unwritten/unread bytes.
447 uint32_t buf_resid(buf_t
);
450 @function buf_setcount
451 @abstract Set count of valid bytes in a buffer. This may be less than the space allocated to the buffer.
452 @param bp Buffer whose byte count to set.
453 @param bcount Count to set.
456 void buf_setcount(buf_t
, uint32_t);
459 @function buf_setsize
460 @abstract Set size of data region allocated to a buffer.
461 @discussion May be larger than amount of valid data in buffer. Should be used by
462 code which is manually providing storage for an iobuf, one allocated with buf_alloc().
463 @param bp Buffer whose size to set.
466 void buf_setsize(buf_t
, uint32_t);
469 @function buf_setresid
470 @abstract Set a count of bytes outstanding for I/O in a buffer.
471 @discussion Set when an I/O operations completes. Examples: called by IOStorageFamily when I/O
472 completes, often called on an "original" buffer when using a manipulated buffer to perform I/O
473 on behalf of the first.
474 @param bp Buffer whose outstanding count to set.
475 @return Count of unwritten/unread bytes.
477 void buf_setresid(buf_t
, uint32_t);
480 @function buf_setdataptr
481 @abstract Set the address at which a buffer's data will be stored.
482 @discussion In traditional buffer use, the data pointer will be set automatically. This routine is
483 useful with iobufs (allocated with buf_alloc()).
484 @param bp Buffer whose data pointer to set.
485 @param data Pointer to data region.
488 void buf_setdataptr(buf_t
, uintptr_t);
491 @function buf_dataptr
492 @abstract Get the address at which a buffer's data is stored; for iobufs, this must
493 be set with buf_setdataptr(). See buf_map().
494 @param bp Buffer whose data pointer to retrieve.
495 @return Data pointer; NULL if unset.
497 uintptr_t buf_dataptr(buf_t
);
501 @abstract Get the vnode associated with a buffer.
502 @discussion Every buffer is associated with a file. Because there is an I/O in flight,
503 there is an iocount on this vnode; it is returned WITHOUT an extra iocount, and vnode_put()
505 @param bp Buffer whose vnode to retrieve.
506 @return Buffer's vnode.
508 vnode_t
buf_vnode(buf_t
);
511 @function buf_setvnode
512 @abstract Set the vnode associated with a buffer.
513 @discussion This call need not be used on traditional buffers; it is for use with iobufs.
514 @param bp Buffer whose vnode to set.
515 @param vp The vnode to attach to the buffer.
518 void buf_setvnode(buf_t
, vnode_t
);
522 @abstract Get the device ID associated with a buffer.
523 @discussion In traditional buffer use, this value is NODEV until buf_strategy() is called unless
524 buf_getblk() was passed a device vnode. It is set on an iobuf if buf_alloc() is passed a device
525 vnode or if buf_setdevice() is called.
526 @param bp Buffer whose device ID to retrieve.
529 dev_t
buf_device(buf_t
);
532 @function buf_setdevice
533 @abstract Set the device associated with a buffer.
534 @discussion A buffer's device is set in buf_strategy() (or in buf_getblk() if the file is a device).
535 It is also set on an iobuf if buf_alloc() is passed a device vnode.
536 @param bp Buffer whose device ID to set.
537 @param vp Device to set on the buffer.
538 @return 0 for success, EINVAL if vp is not a device file.
540 errno_t
buf_setdevice(buf_t
, vnode_t
);
543 @function buf_strategy
544 @abstract Pass an I/O request for a buffer down to the device layer.
545 @discussion This is one of the most important routines in the buffer cache layer. For buffers obtained
546 through buf_getblk, it handles finding physical block numbers for the I/O (with VNOP_BLKTOOFF and
547 VNOP_BLOCKMAP), packaging the I/O into page-sized chunks, and initiating I/O on the disk by calling
548 the device's strategy routine. If a buffer's UPL has been set manually with buf_setupl(), it assumes
549 that the request is already correctly configured with a block number and a size divisible by page size
550 and will just call directly to the device.
551 @param devvp Device on which to perform I/O
552 @param ap vnop_strategy_args structure (most importantly, a buffer).
553 @return 0 for success, or errors from filesystem or device layers.
555 errno_t
buf_strategy(vnode_t
, void *);
558 * Flags for buf_invalblkno()
560 #define BUF_WAIT 0x01
563 @function buf_invalblkno
564 @abstract Invalidate a filesystem logical block in a file.
565 @discussion buf_invalblkno() tries to make the data for a given block in a file
566 invalid; if the buffer for that block is found in core and is not busy, we mark it
567 invalid and call buf_brelse() (see "flags" param for what happens if the buffer is busy).
568 buf_brelse(), noticing that it is invalid, will
569 will return the buffer to the empty-buffer list and tell the VM subsystem to abandon
570 the relevant pages. Data will not be written to backing store--it will be cast aside.
571 Note that this function will only work if the block in question has been
572 obtained with a buf_getblk(). If data has been read into core without using
573 traditional buffer cache routines, buf_invalblkno() will not be able to invalidate it--this
574 includes the use of iobufs.
575 @param bp Buffer whose block to invalidate.
576 @param lblkno Logical block number.
577 @param flags BUF_WAIT: wait for busy buffers to become unbusy and invalidate them then. Otherwise,
578 just return EBUSY for busy blocks.
579 @return 0 for success, EINVAL if vp is not a device file.
581 errno_t
buf_invalblkno(vnode_t
, daddr64_t
, int);
584 @function buf_callback
585 @abstract Get the function set to be called when I/O on a buffer completes.
586 @discussion A function returned by buf_callback was originally set with buf_setcallback().
587 @param bp Buffer whose callback to get.
588 @return 0 for success, or errors from filesystem or device layers.
590 void * buf_callback(buf_t
);
593 @function buf_setcallback
594 @abstract Set a function to be called once when I/O on a buffer completes.
595 @discussion A one-shot callout set with buf_setcallback() will be called from buf_biodone()
596 when I/O completes. It will be passed the "transaction" argument as well as the buffer.
597 buf_setcallback() also marks the buffer as B_ASYNC.
598 @param bp Buffer whose callback to set.
599 @param callback function to use as callback.
600 @param transaction Additional argument to callback function.
601 @return 0; always succeeds.
603 errno_t
buf_setcallback(buf_t
, void (*)(buf_t
, void *), void *);
607 @abstract Set the UPL (Universal Page List), and offset therein, on a buffer.
608 @discussion buf_setupl() should only be called on buffers allocated with buf_alloc().
609 A subsequent call to buf_map() will map the UPL and give back the address at which data
610 begins. After buf_setupl() is called, a buffer is marked B_CLUSTER; when this is the case,
611 buf_strategy() assumes that a buffer is correctly configured to be passed to the device
612 layer without modification. Passing a NULL upl will clear the upl and the B_CLUSTER flag on the
614 @param bp Buffer whose upl to set.
615 @param upl UPL to set in the buffer.
616 @parma offset Offset within upl at which relevant data begin.
617 @return 0 for success, EINVAL if the buffer was not allocated with buf_alloc().
619 errno_t
buf_setupl(buf_t
, upl_t
, uint32_t);
623 @abstract Clone a buffer with a restricted range and an optional callback.
624 @discussion Generates a buffer which is identical to its "bp" argument except that
625 it spans a subset of the data of the original. The buffer to be cloned should
626 have been allocated with buf_alloc(). Checks its arguments to make sure
627 that the data subset is coherent. Optionally, adds a callback function and argument to it
628 to be called when I/O completes (as with buf_setcallback(), but B_ASYNC is not set). If the original buffer had
629 a upl set through buf_setupl(), this upl is copied to the new buffer; otherwise, the original's
630 data pointer is used raw. The buffer must be released with buf_free().
631 @param bp Buffer to clone.
632 @param io_offset Offset, relative to start of data in original buffer, at which new buffer's data will begin.
633 @param io_size Size of buffer region in new buffer, in the sense of buf_count().
634 @param iodone Callback to be called from buf_biodone() when I/O completes, in the sense of buf_setcallback().
635 @param arg Argument to pass to iodone() callback.
636 @return NULL if io_offset/io_size combination is invalid for the buffer to be cloned; otherwise, the new buffer.
638 buf_t
buf_clone(buf_t
, int, int, void (*)(buf_t
, void *), void *);
642 @function buf_create_shadow
643 @abstract Create a shadow buffer with optional private storage and an optional callback.
644 @param bp Buffer to shadow.
645 @param force_copy If TRUE, do not link the shadaow to 'bp' and if 'external_storage' == NULL,
646 force a copy of the data associated with 'bp'.
647 @param external_storage If non-NULL, associate it with the new buffer as its storage instead of the
648 storage currently associated with 'bp'.
649 @param iodone Callback to be called from buf_biodone() when I/O completes, in the sense of buf_setcallback().
650 @param arg Argument to pass to iodone() callback.
651 @return NULL if the buffer to be shadowed is not B_META or a primary buffer (i.e. not a shadow buffer); otherwise, the new buffer.
654 buf_t
buf_create_shadow(buf_t bp
, boolean_t force_copy
, uintptr_t external_storage
, void (*iodone
)(buf_t
, void *), void *arg
);
659 @abstract returns true if 'bp' is a shadow of another buffer.
660 @param bp Buffer to query.
661 @return 1 if 'bp' is a shadow, 0 otherwise.
663 int buf_shadow(buf_t bp
);
668 @abstract Allocate an uninitialized buffer.
669 @discussion A buffer returned by buf_alloc() is marked as busy and as an iobuf; it has no storage set up and must be
670 set up using buf_setdataptr() or buf_setupl()/buf_map().
671 @param vp vnode to associate with the buffer: optionally NULL. If vp is a device file, then
672 the buffer's associated device will be set. If vp is NULL, it can be set later with buf_setvnode().
675 buf_t
buf_alloc(vnode_t
);
679 @abstract Free a buffer that was allocated with buf_alloc().
680 @discussion The storage (UPL, data pointer) associated with an iobuf must be freed manually.
681 @param bp The buffer to free.
684 void buf_free(buf_t
);
687 * flags for buf_invalidateblks
689 #define BUF_WRITE_DATA 0x0001 /* write data blocks first */
690 #define BUF_SKIP_META 0x0002 /* skip over metadata blocks */
691 #define BUF_INVALIDATE_LOCKED 0x0004 /* force B_LOCKED blocks to be invalidated */
694 @function buf_invalidateblks
695 @abstract Invalidate all the blocks associated with a vnode.
696 @discussion This function does for all blocks associated with a vnode what buf_invalblkno does for one block.
697 Again, it will only be able to invalidate data which were populated with traditional buffer cache routines,
698 i.e. by buf_getblk() and callers thereof. Unlike buf_invalblkno(), it can be made to write dirty data to disk
699 rather than casting it aside.
700 @param bp The buffer whose data to invalidate.
701 @param flags BUF_WRITE_DATA: write dirty data to disk with VNOP_BWRITE() before kicking buffer cache entries out.
702 BUF_SKIP_META: do not invalidate metadata blocks.
703 @param slpflag Flags to pass to "msleep" while waiting to acquire busy buffers.
704 @param slptimeo Timeout in "hz" (1/100 second) to wait for a buffer to become unbusy before waking from sleep
705 and re-starting the scan.
706 @return 0 for success, error values from msleep().
708 int buf_invalidateblks(vnode_t
, int, int, int);
711 * flags for buf_flushdirtyblks and buf_iterate
713 #define BUF_SKIP_NONLOCKED 0x01
714 #define BUF_SKIP_LOCKED 0x02
715 #define BUF_SCAN_CLEAN 0x04 /* scan the clean buffers */
716 #define BUF_SCAN_DIRTY 0x08 /* scan the dirty buffers */
717 #define BUF_NOTIFY_BUSY 0x10 /* notify the caller about the busy pages during the scan */
720 #define BUF_RETURNED 0
721 #define BUF_RETURNED_DONE 1
722 #define BUF_CLAIMED 2
723 #define BUF_CLAIMED_DONE 3
725 @function buf_flushdirtyblks
726 @abstract Write dirty file blocks to disk.
727 @param vp The vnode whose blocks to flush.
728 @param wait Wait for writes to complete before returning.
729 @param flags Can pass zero, meaning "flush all dirty buffers."
730 BUF_SKIP_NONLOCKED: Skip buffers which are not busy when we encounter them.
731 BUF_SKIP_LOCKED: Skip buffers which are busy when we encounter them.
732 @param msg String to pass to msleep().
735 void buf_flushdirtyblks(vnode_t
, int, int, const char *);
738 @function buf_iterate
739 @abstract Perform some operation on all buffers associated with a vnode.
740 @param vp The vnode whose buffers to scan.
741 @param callout Function to call on each buffer. Should return one of:
742 BUF_RETURNED: buf_iterate() should call buf_brelse() on the buffer.
743 BUF_RETURNED_DONE: buf_iterate() should call buf_brelse() on the buffer and then stop iterating.
744 BUF_CLAIMED: buf_iterate() should continue iterating (and not call buf_brelse()).
745 BUF_CLAIMED_DONE: buf_iterate() should stop iterating (and not call buf_brelse()).
747 BUF_SKIP_NONLOCKED: Skip buffers which are not busy when we encounter them. BUF_SKIP_LOCKED: Skip buffers which are busy when we encounter them.
748 BUF_SCAN_CLEAN: Call out on clean buffers.
749 BUF_SCAN_DIRTY: Call out on dirty buffers.
750 BUF_NOTIFY_BUSY: If a buffer cannot be acquired, pass a NULL buffer to callout; otherwise,
751 that buffer will be silently skipped.
752 @param arg Argument to pass to callout in addition to buffer.
755 void buf_iterate(vnode_t
, int (*)(buf_t
, void *), int, void *);
759 @abstract Zero out the storage associated with a buffer.
760 @discussion Calls buf_map() to get the buffer's data address; for a B_CLUSTER
761 buffer (one which has had buf_setupl() called on it), it tries to map the buffer's
762 UPL into memory; should only be called once during the life cycle of an iobuf (one allocated
764 @param bp The buffer to zero out.
767 void buf_clear(buf_t
);
770 @function buf_bawrite
771 @abstract Start an asychronous write on a buffer.
772 @discussion Calls VNOP_BWRITE to start the process of propagating an asynchronous write down to the device layer.
773 Callers can wait for writes to complete at their discretion using buf_biowait(). When this function is called,
774 data should already have been written to the buffer's data region.
775 @param bp The buffer on which to initiate I/O.
776 @param throttle If "throttle" is nonzero and more than VNODE_ASYNC_THROTTLE writes are in progress on this file,
777 buf_bawrite() will block until the write count drops below VNODE_ASYNC_THROTTLE. If "throttle" is zero and the write
778 count is high, it will fail with EWOULDBLOCK; the caller can decide whether to make a blocking call or pursue
780 @return EWOULDBLOCK if write count is high and "throttle" is zero; otherwise, errors from VNOP_BWRITE.
782 errno_t
buf_bawrite(buf_t
);
785 @function buf_bdwrite
786 @abstract Mark a buffer for delayed write.
787 @discussion Marks a buffer as waiting for delayed write and the current I/O as complete; data will be written to backing store
788 before the buffer is reused, but it will not be queued for I/O immediately. Note that for buffers allocated
789 with buf_alloc(), there are no such guarantees; you must take care of your own flushing to disk. If
790 the number of delayed writes pending on the system is greater than an internal limit and the caller has not
791 requested otherwise [see return_error] , buf_bdwrite() will unilaterally launch an asynchronous I/O with buf_bawrite() to keep the pile of
792 delayed writes from getting too large.
793 @param bp The buffer to mark for delayed write.
794 @param return_error If the number of pending delayed writes systemwide is larger than an internal limit,
795 return EAGAIN rather than doing an asynchronous write.
796 @return EAGAIN for return_error != 0 case, 0 for succeess, errors from buf_bawrite.
798 errno_t
buf_bdwrite(buf_t
);
802 @abstract Write a buffer's data to backing store.
803 @discussion Once the data in a buffer has been modified, buf_bwrite() starts sending it to disk by calling
804 VNOP_STRATEGY. Unless B_ASYNC has been set on the buffer (by buf_setflags() or otherwise), data will have
805 been written to disk when buf_bwrite() returns. See Bach (p 56).
806 @param bp The buffer to write to disk.
807 @return 0 for success; errors from buf_biowait().
809 errno_t
buf_bwrite(buf_t
);
812 @function buf_biodone
813 @abstract Mark an I/O as completed.
814 @discussion buf_biodone() should be called by whosoever decides that an I/O on a buffer is complete; for example,
815 IOStorageFamily. It clears the dirty flag on a buffer and signals on the vnode that a write has completed
816 with vnode_writedone(). If a callout or filter has been set on the buffer, that function is called. In the case
817 of a callout, that function is expected to take care of cleaning up and freeing the buffer.
818 Otherwise, if the buffer is marked B_ASYNC (e.g. it was passed to buf_bawrite()), then buf_biodone()
819 considers itself justified in calling buf_brelse() to return it to free lists--no one is waiting for it. Finally,
820 waiters on the bp (e.g. in buf_biowait()) are woken up.
821 @param bp The buffer to mark as done with I/O.
824 void buf_biodone(buf_t
);
827 @function buf_biowait
828 @abstract Wait for I/O on a buffer to complete.
829 @discussion Waits for I/O on a buffer to finish, as marked by a buf_biodone() call.
830 @param bp The buffer to wait on.
831 @return 0 for a successful wait; nonzero the buffer has been marked as EINTR or had an error set on it.
833 errno_t
buf_biowait(buf_t
);
837 @abstract Release any claim to a buffer, sending it back to free lists.
838 @discussion buf_brelse() cleans up buffer state and releases a buffer to the free lists. If the buffer
839 is not marked invalid and its pages are dirty (e.g. a delayed write was made), its data will be commited
840 to backing store. If it is marked invalid, its data will be discarded completely.
841 A valid, cacheable buffer will be put on a list and kept in the buffer hash so it
842 can be found again; otherwise, it will be dissociated from its vnode and treated as empty. Which list a valid
843 buffer is placed on depends on the use of buf_markaged(), whether it is metadata, and the B_LOCKED flag. A
844 B_LOCKED buffer will not be available for reuse by other files, though its data may be paged out.
845 Note that buf_brelse() is intended for use with traditionally allocated buffers.
846 @param bp The buffer to release.
849 void buf_brelse(buf_t
);
853 @abstract Synchronously read a block of a file.
854 @discussion buf_bread() is the traditional way to read a single logical block of a file through the buffer cache.
855 It tries to find the buffer and corresponding page(s) in core, calls VNOP_STRATEGY if necessary to bring the data
856 into memory, and waits for I/O to complete. It should not be used to read blocks of greater than 4K (one VM page)
857 in size; use cluster routines for large reads. Indeed, the cluster layer is a more efficient choice for reading DATA
858 unless you need some finely-tuned semantics that it cannot provide.
859 @param vp The file from which to read.
860 @param blkno The logical (filesystem) block number to read.
861 @param size Size of block; do not use for sizes > 4K.
862 @param cred Credential to store and use for reading from disk if data are not already in core.
863 @param bpp Destination pointer for buffer.
864 @return 0 for success, or an error from buf_biowait().
866 errno_t
buf_bread(vnode_t
, daddr64_t
, int, kauth_cred_t
, buf_t
*);
870 @abstract Read a block from a file with read-ahead.
871 @discussion buf_breadn() reads one block synchronously in the style of buf_bread() and fires
872 off a specified set of asynchronous reads to improve the likelihood of future cache hits.
873 It should not be used to read blocks of greater than 4K (one VM page) in size; use cluster
874 routines for large reads. Indeed, the cluster layer is a more efficient choice for reading DATA
875 unless you need some finely-tuned semantics that it cannot provide.
876 @param vp The file from which to read.
877 @param blkno The logical (filesystem) block number to read synchronously.
878 @param size Size of block; do not use for sizes > 4K.
879 @param rablks Array of logical block numbers for asynchronous read-aheads.
880 @param rasizes Array of block sizes for asynchronous read-aheads, each index corresponding to same index in "rablks."
881 @param nrablks Number of entries in read-ahead arrays.
882 @param cred Credential to store and use for reading from disk if data are not already in core.
883 @param bpp Destination pointer for buffer.
884 @return 0 for success, or an error from buf_biowait().
886 errno_t
buf_breadn(vnode_t
, daddr64_t
, int, daddr64_t
*, int *, int, kauth_cred_t
, buf_t
*);
889 @function buf_meta_bread
890 @abstract Synchronously read a metadata block of a file.
891 @discussion buf_meta_bread() is the traditional way to read a single logical block of a file through the buffer cache.
892 It tries to find the buffer and corresponding page(s) in core, calls VNOP_STRATEGY if necessary to bring the data
893 into memory, and waits for I/O to complete. It should not be used to read blocks of greater than 4K (one VM page)
894 in size; use cluster routines for large reads. Reading meta-data through the traditional buffer cache, unlike
895 reading data, is efficient and encouraged, especially if the blocks being read are significantly smaller than page size.
896 @param vp The file from which to read.
897 @param blkno The logical (filesystem) block number to read.
898 @param size Size of block; do not use for sizes > 4K.
899 @param cred Credential to store and use for reading from disk if data are not already in core.
900 @param bpp Destination pointer for buffer.
901 @return 0 for success, or an error from buf_biowait().
903 errno_t
buf_meta_bread(vnode_t
, daddr64_t
, int, kauth_cred_t
, buf_t
*);
906 @function buf_meta_breadn
907 @abstract Read a metadata block from a file with read-ahead.
908 @discussion buf_meta_breadn() reads one block synchronously in the style of buf_meta_bread() and fires
909 off a specified set of asynchronous reads to improve the likelihood of future cache hits.
910 It should not be used to read blocks of greater than 4K (one VM page) in size; use cluster
911 routines for large reads.
912 @param vp The file from which to read.
913 @param blkno The logical (filesystem) block number to read synchronously.
914 @param size Size of block; do not use for sizes > 4K.
915 @param rablks Array of logical block numbers for asynchronous read-aheads.
916 @param rasizes Array of block sizes for asynchronous read-aheads, each index corresponding to same index in "rablks."
917 @param nrablks Number of entries in read-ahead arrays.
918 @param cred Credential to store and use for reading from disk if data are not already in core.
919 @param bpp Destination pointer for buffer.
920 @return 0 for success, or an error from buf_biowait().
922 errno_t
buf_meta_breadn(vnode_t
, daddr64_t
, int, daddr64_t
*, int *, int, kauth_cred_t
, buf_t
*);
926 @abstract Adjust a buffer's count to be no more than maximum physical I/O transfer size for the host architecture.
927 @discussion physio() takes as a parameter a function to bound transfer sizes for each VNOP_STRATEGY() call. minphys()
928 is a default implementation. It calls buf_setcount() to make the buffer's count the min() of its current count
929 and the max I/O size for the host architecture.
930 @param bp The buffer whose byte count to modify.
931 @return New byte count.
933 u_int
minphys(buf_t bp
);
937 @abstract Perform I/O on a device to/from target memory described by a uio.
938 @discussion physio() allows I/O directly from a device to user-space memory. It waits
939 for all I/O to complete before returning.
940 @param f_strategy Strategy routine to call to initiate I/O.
941 @param bp Buffer to configure and pass to strategy routine; can be NULL.
942 @param dev Device on which to perform I/O.
943 @param flags B_READ or B_WRITE.
944 @param f_minphys Function which calls buf_setcount() to set a byte count which is suitably
945 small for the device in question. Returns byte count that has been set (or unchanged) on the buffer.
946 @param uio UIO describing the I/O operation.
947 @param blocksize Logical block size for this vnode.
948 @return 0 for success; EFAULT for an invalid uio; errors from buf_biowait().
950 int physio(void (*)(buf_t
), buf_t
, dev_t
, int , u_int (*)(buf_t
), struct uio
*, int );
954 * Flags for operation type in getblk()
956 #define BLK_READ 0x01 /* buffer for read */
957 #define BLK_WRITE 0x02 /* buffer for write */
958 #define BLK_META 0x10 /* buffer for metadata */
960 * modifier for above flags... if set, getblk will only return
961 * a bp that is already valid... i.e. found in the cache
963 #define BLK_ONLYVALID 0x80000000
967 @abstract Traditional buffer cache routine to get a buffer corresponding to a logical block in a file.
968 @discussion buf_getblk() gets a buffer, not necessarily containing valid data, representing a block in a file.
969 A metadata buffer will be returned with its own zone-allocated storage, managed by the traditional buffer-cache
970 layer, whereas data buffers will be returned hooked into backing by the UBC (which in fact controls the caching of data).
971 buf_getblk() first looks for the buffer header in cache; if the buffer is in-core but busy, buf_getblk() will wait for it to become
972 unbusy, depending on the slpflag and slptimeo parameters. If the buffer is found unbusy and is a metadata buffer,
973 it must already contain valid data and will be returned directly; data buffers will have a UPL configured to
974 prepare for interaction with the underlying UBC. If the buffer is found in core, it will be marked as such
975 and buf_fromcache() will return truth. A buffer is allocated and initialized (but not filled with data)
976 if none is found in core. buf_bread(), buf_breadn(), buf_meta_bread(), and buf_meta_breadn() all
977 return buffers obtained with buf_getblk().
978 @param vp File for which to get block.
979 @param blkno Logical block number.
980 @param size Size of block.
981 @param slpflag Flag to pass to msleep() while waiting for buffer to become unbusy.
982 @param slptimeo Time, in milliseconds, to wait for buffer to become unbusy. 0 means to wait indefinitely.
983 @param operation BLK_READ: want a read buffer. BLK_WRITE: want a write buffer. BLK_META: want a metadata buffer. BLK_ONLYVALID:
984 only return buffers which are found in core (do not allocate anew), and do not change buffer size. The last remark means
985 that if a given logical block is found in core with a different size than what is requested, the buffer size will not be modified.
986 @return Buffer found in core or newly allocated, either containing valid data or ready for I/O.
988 buf_t
buf_getblk(vnode_t
, daddr64_t
, int, int, int, int);
991 @function buf_geteblk
992 @abstract Get a metadata buffer which is marked invalid and not associated with any vnode.
993 @discussion A buffer is returned with zone-allocated storage of the specified size, marked B_META and invalid.
994 It has no vnode and is not visible in the buffer hash.
995 @param size Size of buffer.
996 @return Always returns a new buffer.
998 buf_t
buf_geteblk(int);
1001 @function buf_clear_redundancy_flags
1002 @abstract Clear flags on a buffer.
1003 @discussion: buffer_redundancy_flags &= ~flags
1004 @param bp Buffer whose flags to clear.
1005 @param flags Flags to remove from buffer's mask
1008 void buf_clear_redundancy_flags(buf_t
, uint32_t);
1011 @function buf_redundancyflags
1012 @abstract Get redundancy flags set on a buffer.
1013 @param bp Buffer whose redundancy flags to grab.
1016 uint32_t buf_redundancy_flags(buf_t
);
1019 @function buf_setredundancyflags
1020 @abstract Set redundancy flags on a buffer.
1021 @discussion: buffer_redundancy_flags |= flags
1022 @param bp Buffer whose flags to set.
1023 @param flags Flags to add to buffer's redundancy flags
1026 void buf_set_redundancy_flags(buf_t
, uint32_t);
1030 @abstract Gets the attributes for this buf.
1031 @param bp Buffer whose attributes to get.
1034 bufattr_t
buf_attr(buf_t
);
1036 #ifdef KERNEL_PRIVATE
1037 void buf_setfilter(buf_t
, void (*)(buf_t
, void *), void *, void (**)(buf_t
, void *), void **);
1041 @function buf_getcpaddr
1042 @abstract Set the address of cp_entry on a buffer.
1043 @param bp Buffer whose cp entry value has to be set
1046 void buf_setcpaddr(buf_t
, void *);
1049 @function buf_getcpaddr
1050 @abstract Get the address of cp_entry on a buffer.
1051 @param bp Buffer whose error value to set.
1054 void *buf_getcpaddr(buf_t
);
1057 @function buf_throttled
1058 @abstract Check if a buffer is throttled.
1059 @param bap Buffer attribute to test.
1060 @return Nonzero if the buffer is throttled, 0 otherwise.
1062 int bufattr_throttled(bufattr_t bap
);
1063 #endif /* KERNEL_PRIVATE */
1069 /* Macros to clear/set/test flags. */
1070 #define SET(t, f) (t) |= (f)
1071 #define CLR(t, f) (t) &= ~(f)
1072 #define ISSET(t, f) ((t) & (f))
1075 #endif /* !_SYS_BUF_H_ */