]> git.saurik.com Git - apple/xnu.git/blame - bsd/sys/buf_internal.h
xnu-3248.60.10.tar.gz
[apple/xnu.git] / bsd / sys / buf_internal.h
CommitLineData
91447636 1/*
fe8ab488 2 * Copyright (c) 2000-2014 Apple Inc. All rights reserved.
5d5c5d0d 3 *
2d21ac55 4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
91447636 5 *
2d21ac55
A
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
8f6c56a5 14 *
2d21ac55
A
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
8f6c56a5
A
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
2d21ac55
A
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
8f6c56a5 25 *
2d21ac55 26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
91447636
A
27 */
28/* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29/*
30 * Copyright (c) 1982, 1986, 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 * (c) UNIX System Laboratories, Inc.
33 * All or some portions of this file are derived from material licensed
34 * to the University of California by American Telephone and Telegraph
35 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
36 * the permission of UNIX System Laboratories, Inc.
37 *
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
40 * are met:
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in the
45 * documentation and/or other materials provided with the distribution.
46 * 3. All advertising materials mentioning features or use of this software
47 * must display the following acknowledgement:
48 * This product includes software developed by the University of
49 * California, Berkeley and its contributors.
50 * 4. Neither the name of the University nor the names of its contributors
51 * may be used to endorse or promote products derived from this software
52 * without specific prior written permission.
53 *
54 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
55 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
56 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
57 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
58 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
59 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
60 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
61 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
62 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
63 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
64 * SUCH DAMAGE.
65 *
66 * @(#)buf.h 8.9 (Berkeley) 3/30/95
67 */
68
69#ifndef _SYS_BUF_INTERNAL_H_
70#define _SYS_BUF_INTERNAL_H_
71
72#include <sys/appleapiopts.h>
73
74#ifdef KERNEL
75#include <sys/queue.h>
76#include <sys/errno.h>
77#include <sys/vm.h>
78#include <sys/cdefs.h>
79#include <sys/buf.h>
80#include <sys/lock.h>
81
3e170ce0
A
82#if CONFIG_PROTECT
83#include <sys/cprotect.h>
84#endif
85
91447636
A
86#define NOLIST ((struct buf *)0x87654321) /* fixed, non-NULL magic pointer value; presumably a "not on any list" sentinel -- TODO confirm against its users. Never dereference. */
87
7ddcb079
A
88/*
89 * Attributes of an I/O to be used by lower layers
90 */
91struct bufattr {
316670eb 92#if CONFIG_PROTECT
3e170ce0
A
93 struct cpx *ba_cpx; /* only present when CONFIG_PROTECT is enabled; struct cpx is presumably declared in <sys/cprotect.h> -- confirm */
94 uint64_t ba_cp_file_off; /* only present when CONFIG_PROTECT is enabled; presumably the file offset recorded via buf_setcpoff() -- confirm */
316670eb 95#endif
7ddcb079
A
96 uint64_t ba_flags; /* BA_* flags, including the I/O tier field (BA_IO_TIER_MASK). Some are only in-use on embedded devices */
97};
98
91447636
A
99/*
100 * The buffer header describes an I/O operation in the kernel.
101 */
102struct buf {
103 LIST_ENTRY(buf) b_hash; /* Hash chain. */
104 LIST_ENTRY(buf) b_vnbufs; /* Buffer's associated vnode. */
105 TAILQ_ENTRY(buf) b_freelist; /* Free list position if not active. Its tqe_prev/tqe_next slots are reused through the b_orig/b_trans_head and b_shadow/b_trans_next aliases. */
106 int b_timestamp; /* timestamp for queuing operation */
b0d623f7
A
107 int b_whichq; /* the free list the buffer belongs to (presumably a BQ_* index -- confirm) */
108 volatile uint32_t b_flags; /* B_* flags: external ones come from buf.h, internal ones are defined in this header. */
109 volatile uint32_t b_lflags; /* BL_* flags (BL_BUSY | BL_WANTED ...) protected by buf_mtx */
91447636 110 int b_error; /* errno value. */
b0d623f7
A
111 int b_bufsize; /* Allocated buffer size. Reused through the b_uploffset alias. */
112 int b_bcount; /* Valid bytes in buffer. */
113 int b_resid; /* Remaining I/O. */
91447636 114 dev_t b_dev; /* Device associated with buffer. */
b0d623f7 115 uintptr_t b_datap; /* Memory, superblocks, indirect etc. */
91447636
A
116 daddr64_t b_lblkno; /* Logical block number. */
117 daddr64_t b_blkno; /* Underlying physical block number. */
118 void (*b_iodone)(buf_t, void *); /* Function to call upon completion. */
2d21ac55
A
119 vnode_t b_vp; /* File vnode for data, device vnode for metadata. */
120 kauth_cred_t b_rcred; /* Read credentials reference. Reused through the b_iostate alias. */
121 kauth_cred_t b_wcred; /* Write credentials reference. Reused through the b_cliodone alias. */
91447636
A
122 void * b_upl; /* Pointer to UPL */
123 buf_t b_real_bp; /* used to track bp generated through cluster_bp */
124 TAILQ_ENTRY(buf) b_act; /* Device driver queue when active */
125 void * b_drvdata; /* Device driver private use */
b0d623f7 126 void * b_fsprivate; /* filesystem private use */
91447636
A
127 void * b_transaction; /* journal private use */
128 int b_dirtyoff; /* Offset in buffer of dirty region. */
129 int b_dirtyend; /* Offset of end of dirty region. */
130 int b_validoff; /* Offset in buffer of valid region. Reused through the b_shadow_ref alias. */
131 int b_validend; /* Offset of end of valid region. Reused through the b_data_ref alias when BUF_MAKE_PRIVATE is defined. */
6d2010ae
A
132
133 /* store extra information related to redundancy of data, such as
134 * which redundancy copy to use, etc
135 */
136 uint32_t b_redundancy_flags;
137
91447636 138 proc_t b_proc; /* Associated proc; NULL if kernel. */
6d2010ae
A
139#ifdef BUF_MAKE_PRIVATE
140 buf_t b_data_store; /* only present when BUF_MAKE_PRIVATE is defined */
141#endif
7ddcb079 142 struct bufattr b_attr; /* attributes of this I/O for use by lower layers (embedded by value, see struct bufattr) */
91447636
A
143#ifdef JOE_DEBUG
144 void * b_owner; /* the fields from here to the #endif exist only in JOE_DEBUG builds */
145 int b_tag;
146 void * b_lastbrelse;
b0d623f7
A
147 void * b_stackbrelse[6];
148 void * b_stackgetblk[6];
91447636
A
149#endif
150};
151
39236c6e 152extern vm_offset_t buf_kernel_addrperm;
91447636
A
153
154/*
 * cluster_io definitions for use with io bufs.
 *
 * Each name below is an alias: it expands to an existing struct buf field,
 * so that field's storage is reused under a different name.
 * Note that b_orig and b_trans_head expand to the same slot
 * (b_freelist.tqe_prev), as do b_shadow and b_trans_next
 * (b_freelist.tqe_next); a given buf can therefore only use one
 * alias of each pair at a time.
 */
155#define b_uploffset b_bufsize
6d2010ae
A
156#define b_orig b_freelist.tqe_prev
157#define b_shadow b_freelist.tqe_next
158#define b_shadow_ref b_validoff
159#ifdef BUF_MAKE_PRIVATE
160#define b_data_ref b_validend
161#endif
91447636
A
162#define b_trans_head b_freelist.tqe_prev
163#define b_trans_next b_freelist.tqe_next
164#define b_iostate b_rcred /* reuses the kauth_cred_t b_rcred slot */
2d21ac55 165#define b_cliodone b_wcred /* reuses the kauth_cred_t b_wcred slot */
91447636
A
166
167/*
316670eb 168 * These flags are kept in b_lflags...
91447636
A
169 * buf_mtxp must be held before examining/updating
170 */
171#define BL_BUSY 0x00000001 /* I/O in progress. */
172#define BL_WANTED 0x00000002 /* Process wants this buffer. */
173#define BL_IOBUF 0x00000004 /* buffer allocated via 'buf_alloc' -- NOTE(review): this header declares alloc_io_buf(), not buf_alloc; confirm which allocator is meant */
b0d623f7 174#define BL_WANTDEALLOC 0x00000010 /* buffer should be put on empty list when clean (0x00000008 is not assigned in this list) */
6d2010ae
A
175#define BL_SHADOW 0x00000020
176#define BL_EXTERNAL 0x00000040
177#define BL_WAITSHADOW 0x00000080
178#define BL_IOBUF_ALLOC 0x00000100
316670eb 179#define BL_WANTED_REF 0x00000200
b0d623f7
A
180
181/*
182 * Parameters for buffer cache garbage collection
183 */
184#define BUF_STALE_THRESHHOLD 30 /* Collect if untouched in the last 30 seconds */
316670eb 185#define BUF_MAX_GC_BATCH_SIZE 64 /* Under a single grab of the lock */
91447636
A
186
187/*
188 * mask used by buf_flags... these are the readable external flags
189 */
2d21ac55 190#define BUF_X_RDFLAGS (B_PHYS | B_RAW | B_LOCKED | B_ASYNC | B_READ | B_WRITE | B_PAGEIO |\
39236c6e 191 B_META | B_CLUSTER | B_DELWRI | B_FUA | B_PASSIVE | B_IOSTREAMING |\
316670eb 192 B_ENCRYPTED_IO | B_STATICCONTENT)
91447636
A
193/*
194 * mask used by buf_clearflags/buf_setflags... these are the writable external flags
195 */
2d21ac55 196#define BUF_X_WRFLAGS (B_PHYS | B_RAW | B_LOCKED | B_ASYNC | B_READ | B_WRITE | B_PAGEIO |\
b0d623f7 197 B_NOCACHE | B_FUA | B_PASSIVE | B_IOSTREAMING)
91447636 198
39236c6e
A
199#if 0
200/* b_flags defined in buf.h */
201#define B_WRITE 0x00000000 /* Write buffer (pseudo flag). */
202#define B_READ 0x00000001 /* Read buffer. */
203#define B_ASYNC 0x00000002 /* Start I/O, do not wait. */
204#define B_NOCACHE 0x00000004 /* Do not cache block after use. */
205#define B_DELWRI 0x00000008 /* Delay I/O until buffer reused. */
206#define B_LOCKED 0x00000010 /* Locked in core (not reusable). */
207#define B_PHYS 0x00000020 /* I/O to user memory. */
208#define B_CLUSTER 0x00000040 /* UPL based I/O generated by cluster layer */
209#define B_PAGEIO 0x00000080 /* Page in/out */
210#define B_META 0x00000100 /* buffer contains meta-data. */
211#define B_RAW 0x00000200 /* Set by physio for raw transfers. */
212#define B_FUA 0x00000400 /* Write-through disk cache(if supported) */
213#define B_PASSIVE 0x00000800 /* PASSIVE I/Os are ignored by THROTTLE I/O */
214#define B_IOSTREAMING 0x00001000 /* sequential access pattern detected */
215#define B_ENCRYPTED_IO 0x00004000 /* Encrypted I/O */
216#define B_STATICCONTENT 0x00008000 /* Buffer is likely to remain unaltered */
217#endif
218
91447636
A
219/*
220 * These flags are kept in b_flags... access is lockless
221 * External flags are defined in buf.h and cannot overlap
222 * the internal flags
223 *
224 * these flags are internal... their definition may change
225 */
226#define B_CACHE 0x00010000 /* getblk found us in the cache. */
227#define B_DONE 0x00020000 /* I/O completed. */
228#define B_INVAL 0x00040000 /* Does not contain valid info. */
229#define B_ERROR 0x00080000 /* I/O error occurred. */
230#define B_EINTR 0x00100000 /* I/O was interrupted */
231#define B_AGE 0x00200000 /* Move to age queue when I/O done. */
232#define B_FILTER 0x00400000 /* call b_iodone from biodone as an in-line filter */
233#define B_CALL 0x00800000 /* Call b_iodone from biodone, assumes b_iodone consumes bp */
2d21ac55 234#define B_EOT 0x01000000 /* last buffer in a transaction list created by cluster_io */
91447636
A
235#define B_WASDIRTY 0x02000000 /* page was found dirty in the VM cache */
236#define B_HDRALLOC 0x04000000 /* zone allocated buffer header */
237#define B_ZALLOC 0x08000000 /* b_datap is zalloc()ed */
238/*
239 * private flags used by the journal layer
240 */
241#define B_NORELSE 0x10000000 /* don't brelse() in bwrite() */
242/*
243 * private flags used by the cluster layer
244 */
6d2010ae 245#define B_TWANTED 0x20000000 /* buf_t that is part of a cluster level transaction is wanted */
91447636 246#define B_COMMIT_UPL 0x40000000 /* commit/abort the UPL on I/O success/failure */
060df5ea 247#define B_TDONE 0x80000000 /* buf_t that is part of a cluster level transaction has completed */
91447636 248
91447636
A
249/* Flags to low-level allocation routines. */
250#define B_CLRBUF 0x01 /* Request allocated buffer be cleared. */
251#define B_SYNC 0x02 /* Do all allocations synchronously. */
252#define B_NOBUFF 0x04 /* Do not allocate struct buf */
253
7ddcb079
A
254/*
255 * ba_flags (Buffer Attribute flags)
256 * Some of these may be in-use only on embedded devices.
257 */
316670eb
A
258#define BA_RAW_ENCRYPTED_IO 0x00000001
259#define BA_THROTTLED_IO 0x00000002
260#define BA_DELAYIDLESLEEP 0x00000004 /* Process is marked to delay idle sleep on disk IO */
261#define BA_NOCACHE 0x00000008
262#define BA_META 0x00000010
39236c6e
A
263#define BA_GREEDY_MODE 0x00000020 /* High speed writes that consume more storage */
264#define BA_QUICK_COMPLETE 0x00000040 /* Request quick completion at expense of storage efficiency */
fe8ab488
A
265#define BA_PASSIVE 0x00000080
266
267/*
268 * Note: IO_TIERs consume 0x0100, 0x0200, 0x0400, 0x0800
269 * These are now in-use by the I/O tiering system.
270 */
#define BA_IO_TIER_MASK		0x00000f00	/* bits 8..11 of ba_flags hold the I/O tier */
#define BA_IO_TIER_SHIFT	8

#define BA_ISOCHRONOUS		0x00001000	/* device specific isochronous throughput to media */

/*
 * Read the I/O tier stored in (bap)->ba_flags.
 *
 * bap: pointer to an object with a ba_flags member (a struct bufattr).
 * Evaluates to the 4-bit tier value (0..15).
 *
 * The argument is parenthesized so that any pointer expression is accepted,
 * e.g. GET_BUFATTR_IO_TIER(&bp->b_attr); without the parentheses '->' would
 * bind to the tail of the argument expression instead of to the whole of it.
 */
#define GET_BUFATTR_IO_TIER(bap)	(((bap)->ba_flags & BA_IO_TIER_MASK) >> BA_IO_TIER_SHIFT)

/*
 * Store 'tier' into the I/O tier field of (bap)->ba_flags, leaving every
 * other flag bit untouched.  Bits of 'tier' that do not fit in the 4-bit
 * field are discarded by the mask.  'bap' is evaluated twice, so it must
 * not have side effects.
 */
#define SET_BUFATTR_IO_TIER(bap, tier)						\
do {										\
	(bap)->ba_flags &= (~BA_IO_TIER_MASK);					\
	(bap)->ba_flags |= (((tier) << BA_IO_TIER_SHIFT) & BA_IO_TIER_MASK);	\
} while(0)
91447636 283
2d21ac55
A
284extern int niobuf_headers; /* The number of IO buffer headers for cluster IO */
285extern int nbuf_headers; /* The number of buffer headers */
0c530ab8
A
286extern int max_nbuf_headers; /* The max number of buffer headers */
287extern int nbuf_hashelements; /* The number of elements in bufhash */
2d21ac55 288extern struct buf *buf_headers; /* The buffer headers. */
91447636
A
289
290
291/*
292 * Definitions for the buffer free lists.
293 */
294#define BQUEUES 6 /* number of free buffer queues */
295
296#define BQ_LOCKED 0 /* super-blocks &c */
297#define BQ_LRU 1 /* lru, useful buffers */
298#define BQ_AGE 2 /* rubbish */
299#define BQ_EMPTY 3 /* buffer headers with no memory */
300#define BQ_META 4 /* buffer containing metadata */
301#define BQ_LAUNDRY 5 /* buffers that need cleaning */
302
303
304__BEGIN_DECLS
305
6d2010ae
A
306buf_t buf_create_shadow_priv(buf_t bp, boolean_t force_copy, uintptr_t external_storage, void (*iodone)(buf_t, void *), void *arg);
307
91447636
A
308buf_t alloc_io_buf(vnode_t, int);
309void free_io_buf(buf_t);
310
311int allocbuf(struct buf *, int);
39236c6e 312void bufinit(void);
91447636 313
91447636
A
314/*
315 * Flags for buf_acquire
316 */
317#define BAC_NOWAIT 0x01 /* Don't wait if buffer is busy */
318#define BAC_REMOVE 0x02 /* Remove from free list once buffer is acquired */
319#define BAC_SKIP_NONLOCKED 0x04 /* Don't return LOCKED buffers -- NOTE(review): the name says the opposite (skip buffers that are NOT locked, i.e. only return LOCKED ones); this comment and the next look swapped, confirm against buf_acquire() */
320#define BAC_SKIP_LOCKED 0x08 /* Only return LOCKED buffers -- NOTE(review): the name says the opposite (skip LOCKED buffers); confirm against buf_acquire() */
321
2d21ac55
A
322void buf_list_lock(void);
323void buf_list_unlock(void);
324
39236c6e 325void cluster_init(void);
91447636
A
326void buf_drop(buf_t);
327errno_t buf_acquire(buf_t, int, int, int);
328
329int count_busy_buffers(void);
330int count_lock_queue(void);
331
316670eb
A
332int buf_flushdirtyblks_skipinfo (vnode_t, int, int, const char *);
333void buf_wait_for_shadow_io (vnode_t, daddr64_t);
334
6d2010ae
A
335#ifdef BUF_MAKE_PRIVATE
336errno_t buf_make_private(buf_t bp);
337#endif
91447636 338
#if CONFIG_PROTECT
/*
 * Content-protection helper taking a buf_t and a 64-bit offset; presumably
 * records the offset in the buffer's ba_cp_file_off -- confirm against the
 * definition.
 *
 * Guarded with '#if' (not '#ifdef') so that it matches the guard on the
 * ba_cpx/ba_cp_file_off fields of struct bufattr and on the
 * <sys/cprotect.h> include: with CONFIG_PROTECT defined as 0, '#ifdef'
 * would still expose this prototype while the fields are compiled out.
 */
void buf_setcpoff (buf_t, uint64_t);
#endif
342
91447636
A
343__END_DECLS
344
345
346/*
347 * Stats on usefulness of the buffer cache
348 */
349struct bufstats {
350 long bufs_incore; /* found incore */
351 long bufs_busyincore; /* found incore. was busy */
352 long bufs_vmhits; /* not incore. found in VM */
353 long bufs_miss; /* not incore. not in VM */
354 long bufs_sleeps; /* buffer starvation */
355 long bufs_eblk; /* Calls to geteblk */
356 long bufs_iobufmax; /* Max. number of IO buffers used */
357 long bufs_iobufinuse; /* number of IO buffers in use */
358 long bufs_iobufsleeps; /* IO buffer starvation */
359};
360
361#endif /* KERNEL */
362#endif /* !_SYS_BUF_INTERNAL_H_ */