2 * Copyright (c) 2000-2011 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 #include <sys/param.h>
30 #include <sys/systm.h>
32 #include <sys/buf_internal.h>
33 #include <sys/kernel.h>
34 #include <sys/malloc.h>
35 #include <sys/mount.h>
36 #include <sys/vnode.h>
40 #include "hfs_cnode.h"
42 #include "hfs_endian.h"
43 #include "hfs_btreeio.h"
45 #include "hfscommon/headers/FileMgrInternal.h"
46 #include "hfscommon/headers/BTreesPrivate.h"
48 #define FORCESYNCBTREEWRITES 0
50 /* From bsd/vfs/vfs_bio.c */
51 extern int bdwrite_internal(struct buf
*, int);
53 static int ClearBTNodes(struct vnode
*vp
, long blksize
, off_t offset
, off_t amount
);
54 static int btree_journal_modify_block_end(struct hfsmount
*hfsmp
, struct buf
*bp
);
56 void btree_swap_node(struct buf
*bp
, __unused
void *arg
);
59 * Return btree node size for given vnode.
62 * For btree vnode, returns btree node size.
63 * For non-btree vnodes, returns 0.
65 u_int16_t
get_btree_nodesize(struct vnode
*vp
)
67 BTreeControlBlockPtr btree
;
68 u_int16_t node_size
= 0;
70 if (vnode_issystem(vp
)) {
71 btree
= (BTreeControlBlockPtr
) VTOF(vp
)->fcbBTCBPtr
;
73 node_size
= btree
->nodeSize
;
80 OSStatus
SetBTreeBlockSize(FileReference vp
, ByteCount blockSize
, __unused ItemCount minBlockCount
)
82 BTreeControlBlockPtr bTreePtr
;
84 DBG_ASSERT(vp
!= NULL
);
85 DBG_ASSERT(blockSize
>= kMinNodeSize
);
86 if (blockSize
> MAXBSIZE
)
87 return (fsBTBadNodeSize
);
89 bTreePtr
= (BTreeControlBlockPtr
)VTOF(vp
)->fcbBTCBPtr
;
90 bTreePtr
->nodeSize
= blockSize
;
96 OSStatus
GetBTreeBlock(FileReference vp
, u_int32_t blockNum
, GetBlockOptions options
, BlockDescriptor
*block
)
98 OSStatus retval
= E_NONE
;
99 struct buf
*bp
= NULL
;
100 u_int8_t allow_empty_node
;
102 /* If the btree block is being read using hint, it is
103 * fine for the swap code to find zeroed out nodes.
105 if (options
& kGetBlockHint
) {
106 allow_empty_node
= true;
108 allow_empty_node
= false;
111 if (options
& kGetEmptyBlock
) {
115 offset
= (daddr64_t
)blockNum
* (daddr64_t
)block
->blockSize
;
116 bp
= buf_getblk(vp
, (daddr64_t
)blockNum
, block
->blockSize
, 0, 0, BLK_META
);
118 VNOP_BLOCKMAP(vp
, offset
, block
->blockSize
, &blkno
, NULL
, NULL
, 0, NULL
) == 0) {
119 buf_setblkno(bp
, blkno
);
122 retval
= buf_meta_bread(vp
, (daddr64_t
)blockNum
, block
->blockSize
, NOCRED
, &bp
);
125 retval
= -1; //XXX need better error
127 if (retval
== E_NONE
) {
128 block
->blockHeader
= bp
;
129 block
->buffer
= (char *)buf_dataptr(bp
);
130 block
->blockNum
= buf_lblkno(bp
);
131 block
->blockReadFromDisk
= (buf_fromcache(bp
) == 0); /* not found in cache ==> came from disk */
134 block
->isModified
= 0;
136 /* Check and endian swap B-Tree node (only if it's a valid block) */
137 if (!(options
& kGetEmptyBlock
)) {
138 /* This happens when we first open the b-tree, we might not have all the node data on hand */
139 if ((((BTNodeDescriptor
*)block
->buffer
)->kind
== kBTHeaderNode
) &&
140 (((BTHeaderRec
*)((char *)block
->buffer
+ 14))->nodeSize
!= buf_count(bp
)) &&
141 (SWAP_BE16 (((BTHeaderRec
*)((char *)block
->buffer
+ 14))->nodeSize
) != buf_count(bp
))) {
144 * Don't swap the node descriptor, record offsets, or other records.
145 * This record will be invalidated and re-read with the correct node
146 * size once the B-tree control block is set up with the node size
147 * from the header record.
149 retval
= hfs_swap_BTNode (block
, vp
, kSwapBTNodeHeaderRecordOnly
, allow_empty_node
);
151 } else if (block
->blockReadFromDisk
) {
153 * The node was just read from disk, so always swap/check it.
154 * This is necessary on big endian since the test below won't trigger.
156 retval
= hfs_swap_BTNode (block
, vp
, kSwapBTNodeBigToHost
, allow_empty_node
);
157 } else if (*((u_int16_t
*)((char *)block
->buffer
+ (block
->blockSize
- sizeof (u_int16_t
)))) == 0x0e00) {
159 * The node was left in the cache in non-native order, so swap it.
160 * This only happens on little endian, after the node is written
163 retval
= hfs_swap_BTNode (block
, vp
, kSwapBTNodeBigToHost
, allow_empty_node
);
167 * If we got an error, then the node is only partially swapped.
168 * We mark the buffer invalid so that the next attempt to get the
169 * node will read it and attempt to swap again, and will notice
170 * the error again. If we didn't do this, the next attempt to get
171 * the node might use the partially swapped node as-is.
181 block
->blockHeader
= NULL
;
182 block
->buffer
= NULL
;
189 void ModifyBlockStart(FileReference vp
, BlockDescPtr blockPtr
)
191 struct hfsmount
*hfsmp
= VTOHFS(vp
);
192 struct buf
*bp
= NULL
;
194 if (hfsmp
->jnl
== NULL
) {
198 bp
= (struct buf
*) blockPtr
->blockHeader
;
200 panic("hfs: ModifyBlockStart: null bp for blockdescptr %p?!?\n", blockPtr
);
204 journal_modify_block_start(hfsmp
->jnl
, bp
);
205 blockPtr
->isModified
= 1;
209 btree_swap_node(struct buf
*bp
, __unused
void *arg
)
211 // struct hfsmount *hfsmp = (struct hfsmount *)arg;
213 struct vnode
*vp
= buf_vnode(bp
);
214 BlockDescriptor block
;
216 /* Prepare the block pointer */
217 block
.blockHeader
= bp
;
218 block
.buffer
= (char *)buf_dataptr(bp
);
219 block
.blockNum
= buf_lblkno(bp
);
220 /* not found in cache ==> came from disk */
221 block
.blockReadFromDisk
= (buf_fromcache(bp
) == 0);
222 block
.blockSize
= buf_count(bp
);
224 /* Swap the data now that this node is ready to go to disk.
225 * We allow swapping of zeroed out nodes here because we might
226 * be writing node whose last record just got deleted.
228 retval
= hfs_swap_BTNode (&block
, vp
, kSwapBTNodeHostToBig
, true);
230 panic("hfs: btree_swap_node: about to write corrupt node!\n");
235 btree_journal_modify_block_end(struct hfsmount
*hfsmp
, struct buf
*bp
)
237 return journal_modify_block_end(hfsmp
->jnl
, bp
, btree_swap_node
, hfsmp
);
241 OSStatus
ReleaseBTreeBlock(FileReference vp
, BlockDescPtr blockPtr
, ReleaseBlockOptions options
)
243 struct hfsmount
*hfsmp
= VTOHFS(vp
);
244 OSStatus retval
= E_NONE
;
245 struct buf
*bp
= NULL
;
247 bp
= (struct buf
*) blockPtr
->blockHeader
;
254 if (options
& kTrashBlock
) {
257 if (hfsmp
->jnl
&& (buf_flags(bp
) & B_LOCKED
)) {
258 journal_kill_block(hfsmp
->jnl
, bp
);
260 buf_brelse(bp
); /* note: B-tree code will clear blockPtr->blockHeader and blockPtr->buffer */
263 /* Don't let anyone else try to use this bp, it's been consumed */
264 blockPtr
->blockHeader
= NULL
;
267 if (options
& kForceWriteBlock
) {
269 if (blockPtr
->isModified
== 0) {
270 panic("hfs: releaseblock: modified is 0 but forcewrite set! bp %p\n", bp
);
273 retval
= btree_journal_modify_block_end(hfsmp
, bp
);
274 blockPtr
->isModified
= 0;
276 retval
= VNOP_BWRITE(bp
);
279 /* Don't let anyone else try to use this bp, it's been consumed */
280 blockPtr
->blockHeader
= NULL
;
282 } else if (options
& kMarkBlockDirty
) {
285 if ((options
& kLockTransaction
) && hfsmp
->jnl
== NULL
) {
288 * Set the B_LOCKED flag and unlock the buffer, causing buf_brelse to move
289 * the buffer onto the LOCKED free list. This is necessary, otherwise
290 * getnewbuf() would try to reclaim the buffers using buf_bawrite, which
291 * isn't going to work.
294 /* Don't hog all the buffers... */
295 if (count_lock_queue() > kMaxLockedMetaBuffers
) {
296 hfs_btsync(vp
, HFS_SYNCTRANS
);
297 /* Rollback sync time to cause a sync on lock release... */
298 (void) BTSetLastSync(VTOF(vp
), tv
.tv_sec
- (kMaxSecsForFsync
+ 1));
300 buf_setflags(bp
, B_LOCKED
);
304 * Delay-write this block.
305 * If the maximum delayed buffers has been exceeded then
306 * free up some buffers and fall back to an asynchronous write.
309 if (blockPtr
->isModified
== 0) {
310 panic("hfs: releaseblock: modified is 0 but markdirty set! bp %p\n", bp
);
312 retval
= btree_journal_modify_block_end(hfsmp
, bp
);
313 blockPtr
->isModified
= 0;
314 } else if (bdwrite_internal(bp
, 1) != 0) {
316 /* Rollback sync time to cause a sync on lock release... */
317 (void) BTSetLastSync(VTOF(vp
), tv
.tv_sec
- (kMaxSecsForFsync
+ 1));
319 buf_clearflags(bp
, B_LOCKED
);
323 /* Don't let anyone else try to use this bp, it's been consumed */
324 blockPtr
->blockHeader
= NULL
;
327 // check if we had previously called journal_modify_block_start()
328 // on this block and if so, abort it (which will call buf_brelse()).
329 if (hfsmp
->jnl
&& blockPtr
->isModified
) {
330 // XXXdbg - I don't want to call modify_block_abort()
331 // because I think it may be screwing up the
332 // journal and blowing away a block that has
335 // journal_modify_block_abort(hfsmp->jnl, bp);
336 //panic("hfs: releaseblock called for 0x%x but mod_block_start previously called.\n", bp);
337 btree_journal_modify_block_end(hfsmp
, bp
);
338 blockPtr
->isModified
= 0;
340 buf_brelse(bp
); /* note: B-tree code will clear blockPtr->blockHeader and blockPtr->buffer */
343 /* Don't let anyone else try to use this bp, it's been consumed */
344 blockPtr
->blockHeader
= NULL
;
353 OSStatus
ExtendBTreeFile(FileReference vp
, FSSize minEOF
, FSSize maxEOF
)
355 #pragma unused (maxEOF)
357 OSStatus retval
= 0, ret
= 0;
358 int64_t actualBytesAdded
, origSize
;
359 u_int64_t bytesToAdd
;
360 u_int32_t startAllocation
;
361 u_int32_t fileblocks
;
365 struct proc
*p
= NULL
;
369 filePtr
= GetFileControlBlock(vp
);
371 if ( (off_t
)minEOF
> filePtr
->fcbEOF
)
373 bytesToAdd
= minEOF
- filePtr
->fcbEOF
;
375 if (bytesToAdd
< filePtr
->ff_clumpsize
)
376 bytesToAdd
= filePtr
->ff_clumpsize
; //XXX why not always be a mutiple of clump size?
386 * The Extents B-tree can't have overflow extents. ExtendFileC will
387 * return an error if an attempt is made to extend the Extents B-tree
388 * when the resident extents are exhausted.
391 /* Protect allocation bitmap and extents overflow file. */
392 lockflags
= SFL_BITMAP
;
393 if (VTOC(vp
)->c_fileid
!= kHFSExtentsFileID
)
394 lockflags
|= SFL_EXTENTS
;
395 lockflags
= hfs_systemfile_lock(vcb
, lockflags
, HFS_EXCLUSIVE_LOCK
);
397 (void) BTGetInformation(filePtr
, 0, &btInfo
);
401 * The b-tree code expects nodes to be contiguous. So when
402 * the allocation block size is less than the b-tree node
403 * size, we need to force disk allocations to be contiguous.
405 if (vcb
->blockSize
>= btInfo
.nodeSize
) {
408 /* Ensure that all b-tree nodes are contiguous on disk */
409 extendFlags
= kEFContigMask
;
413 origSize
= filePtr
->fcbEOF
;
414 fileblocks
= filePtr
->ff_blocks
;
415 startAllocation
= vcb
->nextAllocation
;
417 // loop trying to get a contiguous chunk that's an integer multiple
418 // of the btree node size. if we can't get a contiguous chunk that
419 // is at least the node size then we break out of the loop and let
420 // the error propagate back up.
421 while((off_t
)bytesToAdd
>= btInfo
.nodeSize
) {
423 retval
= ExtendFileC(vcb
, filePtr
, bytesToAdd
, 0,
424 kEFContigMask
| kEFMetadataMask
| kEFNoClumpMask
,
425 (int64_t *)&actualBytesAdded
);
426 if (retval
== dskFulErr
&& actualBytesAdded
== 0) {
428 if (bytesToAdd
< btInfo
.nodeSize
) {
430 } else if ((bytesToAdd
% btInfo
.nodeSize
) != 0) {
431 // make sure it's an integer multiple of the nodeSize
432 bytesToAdd
-= (bytesToAdd
% btInfo
.nodeSize
);
435 } while (retval
== dskFulErr
&& actualBytesAdded
== 0);
437 if (retval
== dskFulErr
&& actualBytesAdded
== 0 && bytesToAdd
<= btInfo
.nodeSize
) {
441 filePtr
->fcbEOF
= (u_int64_t
)filePtr
->ff_blocks
* (u_int64_t
)vcb
->blockSize
;
442 bytesToAdd
= minEOF
- filePtr
->fcbEOF
;
446 * If a new extent was added then move the roving allocator
447 * reference forward by the current b-tree file size so
448 * there's plenty of room to grow.
451 ((VCBTOHFS(vcb
)->hfs_flags
& HFS_METADATA_ZONE
) == 0) &&
452 (vcb
->nextAllocation
> startAllocation
) &&
453 ((vcb
->nextAllocation
+ fileblocks
) < vcb
->allocLimit
)) {
454 HFS_UPDATE_NEXT_ALLOCATION(vcb
, vcb
->nextAllocation
+ fileblocks
);
457 filePtr
->fcbEOF
= (u_int64_t
)filePtr
->ff_blocks
* (u_int64_t
)vcb
->blockSize
;
459 // XXXdbg ExtendFileC() could have returned an error even though
460 // it grew the file to be big enough for our needs. If this is
461 // the case, we don't care about retval so we blow it away.
463 if (filePtr
->fcbEOF
>= (off_t
)minEOF
&& retval
!= 0) {
467 // XXXdbg if the file grew but isn't large enough or isn't an
468 // even multiple of the nodeSize then trim things back. if
469 // the file isn't large enough we trim back to the original
470 // size. otherwise we trim back to be an even multiple of the
473 if ((filePtr
->fcbEOF
< (off_t
)minEOF
) || ((filePtr
->fcbEOF
- origSize
) % btInfo
.nodeSize
) != 0) {
475 if (filePtr
->fcbEOF
< (off_t
)minEOF
) {
478 if (filePtr
->fcbEOF
< origSize
) {
479 panic("hfs: btree file eof %lld less than orig size %lld!\n",
480 filePtr
->fcbEOF
, origSize
);
483 trim
= filePtr
->fcbEOF
- origSize
;
485 trim
= ((filePtr
->fcbEOF
- origSize
) % btInfo
.nodeSize
);
488 ret
= TruncateFileC(vcb
, filePtr
, filePtr
->fcbEOF
- trim
, 0, 0, FTOC(filePtr
)->c_fileid
, 0);
489 filePtr
->fcbEOF
= (u_int64_t
)filePtr
->ff_blocks
* (u_int64_t
)vcb
->blockSize
;
491 // XXXdbg - panic if the file didn't get trimmed back properly
492 if ((filePtr
->fcbEOF
% btInfo
.nodeSize
) != 0) {
493 panic("hfs: truncate file didn't! fcbEOF %lld nsize %d fcb %p\n",
494 filePtr
->fcbEOF
, btInfo
.nodeSize
, filePtr
);
498 // XXXdbg - this probably doesn't need to be a panic()
499 panic("hfs: error truncating btree files (sz 0x%llx, trim %lld, ret %ld)\n",
500 filePtr
->fcbEOF
, trim
, (long)ret
);
505 if(VTOC(vp
)->c_fileid
!= kHFSExtentsFileID
) {
507 * Get any extents overflow b-tree changes to disk ASAP!
509 (void) BTFlushPath(VTOF(vcb
->extentsRefNum
));
510 (void) hfs_fsync(vcb
->extentsRefNum
, MNT_WAIT
, 0, p
);
512 hfs_systemfile_unlock(vcb
, lockflags
);
515 if ((filePtr
->fcbEOF
% btInfo
.nodeSize
) != 0) {
516 panic("hfs: extendbtree: fcb %p has eof 0x%llx not a multiple of 0x%x (trim %llx)\n",
517 filePtr
, filePtr
->fcbEOF
, btInfo
.nodeSize
, trim
);
521 * Update the Alternate MDB or Alternate VolumeHeader
523 if ((VTOC(vp
)->c_fileid
== kHFSExtentsFileID
) ||
524 (VTOC(vp
)->c_fileid
== kHFSCatalogFileID
) ||
525 (VTOC(vp
)->c_fileid
== kHFSAttributesFileID
)
527 VTOC(vp
)->c_flag
|= C_MODIFIED
;
529 ret
= hfs_flushvolumeheader(VCBTOHFS(vcb
), MNT_WAIT
, HFS_ALTFLUSH
);
531 VTOC(vp
)->c_touch_chgtime
= TRUE
;
532 VTOC(vp
)->c_touch_modtime
= TRUE
;
533 (void) hfs_update(vp
, TRUE
);
536 ret
= ClearBTNodes(vp
, btInfo
.nodeSize
, origSize
, (filePtr
->fcbEOF
- origSize
));
542 hfs_systemfile_unlock(vcb
, lockflags
);
549 * Clear out (zero) new b-tree nodes on disk.
552 ClearBTNodes(struct vnode
*vp
, long blksize
, off_t offset
, off_t amount
)
554 struct hfsmount
*hfsmp
= VTOHFS(vp
);
555 struct buf
*bp
= NULL
;
559 blk
= offset
/ blksize
;
560 blkcnt
= amount
/ blksize
;
563 bp
= buf_getblk(vp
, blk
, blksize
, 0, 0, BLK_META
);
569 // XXXdbg -- skipping this for now since it makes a transaction
570 // become *way* too large
571 //journal_modify_block_start(hfsmp->jnl, bp);
573 bzero((char *)buf_dataptr(bp
), blksize
);
579 // XXXdbg -- skipping this for now since it makes a transaction
580 // become *way* too large
581 //journal_modify_block_end(hfsmp->jnl, bp);
583 // XXXdbg - remove this once we decide what to do with the
584 // writes to the journal
590 /* wait/yield every 32 blocks so we don't hog all the buffers */
604 extern char hfs_attrname
[];
607 * Create an HFS+ Attribute B-tree File.
609 * No global resources should be held.
612 hfs_create_attr_btree(struct hfsmount
*hfsmp
, u_int32_t nodesize
, u_int32_t nodecnt
)
614 struct vnode
* vp
= NULLVP
;
615 struct cat_desc cndesc
;
616 struct cat_attr cnattr
;
617 struct cat_fork cfork
;
618 BlockDescriptor blkdesc
;
619 BTNodeDescriptor
*ndp
;
621 BTreeControlBlockPtr btcb
= NULL
;
622 struct buf
*bp
= NULL
;
626 u_int32_t node_num
, num_map_nodes
;
627 u_int32_t bytes_per_map_record
;
632 int newvnode_flags
= 0;
636 * Serialize creation using HFS_CREATING_BTREE flag.
638 lck_mtx_lock(&hfsmp
->hfs_mutex
);
639 if (hfsmp
->hfs_flags
& HFS_CREATING_BTREE
) {
640 /* Someone else beat us, wait for them to finish. */
641 (void) msleep(hfsmp
->hfs_attribute_cp
, &hfsmp
->hfs_mutex
,
642 PDROP
| PINOD
, "hfs_create_attr_btree", 0);
643 if (hfsmp
->hfs_attribute_vp
) {
648 hfsmp
->hfs_flags
|= HFS_CREATING_BTREE
;
649 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
651 /* Check if were out of usable disk space. */
652 if ((hfs_freeblks(hfsmp
, 1) == 0)) {
658 * Set up Attribute B-tree vnode
659 * (this must be done before we start a transaction
660 * or take any system file locks)
662 bzero(&cndesc
, sizeof(cndesc
));
663 cndesc
.cd_parentcnid
= kHFSRootParentID
;
664 cndesc
.cd_flags
|= CD_ISMETA
;
665 cndesc
.cd_nameptr
= (const u_int8_t
*)hfs_attrname
;
666 cndesc
.cd_namelen
= strlen(hfs_attrname
);
667 cndesc
.cd_cnid
= kHFSAttributesFileID
;
669 bzero(&cnattr
, sizeof(cnattr
));
670 cnattr
.ca_linkcount
= 1;
671 cnattr
.ca_mode
= S_IFREG
;
672 cnattr
.ca_fileid
= cndesc
.cd_cnid
;
674 bzero(&cfork
, sizeof(cfork
));
675 cfork
.cf_clump
= nodesize
* nodecnt
;
677 result
= hfs_getnewvnode(hfsmp
, NULL
, NULL
, &cndesc
, 0, &cnattr
,
678 &cfork
, &vp
, &newvnode_flags
);
683 * Set up Attribute B-tree control block
685 MALLOC(btcb
, BTreeControlBlock
*, sizeof(BTreeControlBlock
), M_TEMP
, M_WAITOK
);
686 bzero(btcb
, sizeof(BTreeControlBlock
));
688 btcb
->nodeSize
= nodesize
;
689 btcb
->maxKeyLength
= kHFSPlusAttrKeyMaximumLength
;
690 btcb
->btreeType
= 0xFF;
691 btcb
->attributes
= kBTVariableIndexKeysMask
| kBTBigKeysMask
;
692 btcb
->version
= kBTreeVersion
;
693 btcb
->writeCount
= 1;
694 btcb
->flags
= 0; /* kBTHeaderDirty */
695 btcb
->fileRefNum
= vp
;
696 btcb
->getBlockProc
= GetBTreeBlock
;
697 btcb
->releaseBlockProc
= ReleaseBTreeBlock
;
698 btcb
->setEndOfForkProc
= ExtendBTreeFile
;
699 btcb
->keyCompareProc
= (KeyCompareProcPtr
)hfs_attrkeycompare
;
700 VTOF(vp
)->fcbBTCBPtr
= btcb
;
703 * Allocate some space
705 if (hfs_start_transaction(hfsmp
) != 0) {
711 /* Note ExtendBTreeFile will acquire the necessary system file locks. */
712 result
= ExtendBTreeFile(vp
, nodesize
, cfork
.cf_clump
);
716 btcb
->totalNodes
= VTOF(vp
)->ff_size
/ nodesize
;
719 * Figure out how many map nodes we'll need.
721 * bytes_per_map_record = the number of bytes in the map record of a
722 * map node. Since that is the only record in the node, it is the size
723 * of the node minus the node descriptor at the start, and two record
724 * offsets at the end of the node. The "- 2" is to round the size down
725 * to a multiple of 4 bytes (since sizeof(BTNodeDescriptor) is not a
728 * The value "temp" here is the number of *bits* in the map record of
731 bytes_per_map_record
= nodesize
- sizeof(BTNodeDescriptor
) - 2*sizeof(u_int16_t
) - 2;
732 temp
= 8 * (nodesize
- sizeof(BTNodeDescriptor
)
733 - sizeof(BTHeaderRec
)
734 - kBTreeHeaderUserBytes
735 - 4 * sizeof(u_int16_t
));
736 if (btcb
->totalNodes
> temp
) {
737 num_map_nodes
= howmany(btcb
->totalNodes
- temp
, bytes_per_map_record
* 8);
743 btcb
->freeNodes
= btcb
->totalNodes
- 1 - num_map_nodes
;
746 * Initialize the b-tree header on disk
748 bp
= buf_getblk(vp
, 0, nodesize
, 0, 0, BLK_META
);
754 buffer
= (void *)buf_dataptr(bp
);
755 blkdesc
.buffer
= buffer
;
756 blkdesc
.blockHeader
= (void *)bp
;
757 blkdesc
.blockReadFromDisk
= 0;
758 blkdesc
.isModified
= 0;
760 ModifyBlockStart(vp
, &blkdesc
);
762 if (buf_size(bp
) != nodesize
)
763 panic("hfs_create_attr_btree: bad buffer size (%d)\n", buf_size(bp
));
765 bzero(buffer
, nodesize
);
766 index
= (u_int16_t
*)buffer
;
768 /* FILL IN THE NODE DESCRIPTOR: */
769 ndp
= (BTNodeDescriptor
*)buffer
;
770 if (num_map_nodes
!= 0)
772 ndp
->kind
= kBTHeaderNode
;
774 offset
= sizeof(BTNodeDescriptor
);
775 index
[(nodesize
/ 2) - 1] = offset
;
777 /* FILL IN THE HEADER RECORD: */
778 bthp
= (BTHeaderRec
*)((u_int8_t
*)buffer
+ offset
);
779 bthp
->nodeSize
= nodesize
;
780 bthp
->totalNodes
= btcb
->totalNodes
;
781 bthp
->freeNodes
= btcb
->freeNodes
;
782 bthp
->clumpSize
= cfork
.cf_clump
;
783 bthp
->btreeType
= 0xFF;
784 bthp
->attributes
= kBTVariableIndexKeysMask
| kBTBigKeysMask
;
785 bthp
->maxKeyLength
= kHFSPlusAttrKeyMaximumLength
;
786 bthp
->keyCompareType
= kHFSBinaryCompare
;
787 offset
+= sizeof(BTHeaderRec
);
788 index
[(nodesize
/ 2) - 2] = offset
;
790 /* FILL IN THE USER RECORD: */
791 offset
+= kBTreeHeaderUserBytes
;
792 index
[(nodesize
/ 2) - 3] = offset
;
794 /* Mark the header node and map nodes in use in the map record.
796 * NOTE: Assumes that the header node's map record has at least
797 * (num_map_nodes + 1) bits.
799 bitmap
= (u_int8_t
*) buffer
+ offset
;
800 temp
= num_map_nodes
+ 1; /* +1 for the header node */
805 *bitmap
= ~(0xFF >> temp
);
807 offset
+= nodesize
- sizeof(BTNodeDescriptor
) - sizeof(BTHeaderRec
)
808 - kBTreeHeaderUserBytes
- (4 * sizeof(int16_t));
809 index
[(nodesize
/ 2) - 4] = offset
;
812 result
= btree_journal_modify_block_end(hfsmp
, bp
);
814 result
= VNOP_BWRITE(bp
);
819 /* Create the map nodes: node numbers 1 .. num_map_nodes */
820 for (node_num
=1; node_num
<= num_map_nodes
; ++node_num
) {
821 bp
= buf_getblk(vp
, node_num
, nodesize
, 0, 0, BLK_META
);
826 buffer
= (void *)buf_dataptr(bp
);
827 blkdesc
.buffer
= buffer
;
828 blkdesc
.blockHeader
= (void *)bp
;
829 blkdesc
.blockReadFromDisk
= 0;
830 blkdesc
.isModified
= 0;
832 ModifyBlockStart(vp
, &blkdesc
);
834 bzero(buffer
, nodesize
);
835 index
= (u_int16_t
*)buffer
;
837 /* Fill in the node descriptor */
838 ndp
= (BTNodeDescriptor
*)buffer
;
839 if (node_num
!= num_map_nodes
)
840 ndp
->fLink
= node_num
+ 1;
841 ndp
->kind
= kBTMapNode
;
843 offset
= sizeof(BTNodeDescriptor
);
844 index
[(nodesize
/ 2) - 1] = offset
;
847 /* Fill in the map record's offset */
848 /* Note: We assume that the map record is all zeroes */
849 offset
= sizeof(BTNodeDescriptor
) + bytes_per_map_record
;
850 index
[(nodesize
/ 2) - 2] = offset
;
853 result
= btree_journal_modify_block_end(hfsmp
, bp
);
855 result
= VNOP_BWRITE(bp
);
861 /* Update vp/cp for attribute btree */
862 lck_mtx_lock(&hfsmp
->hfs_mutex
);
863 hfsmp
->hfs_attribute_cp
= VTOC(vp
);
864 hfsmp
->hfs_attribute_vp
= vp
;
865 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
867 (void) hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, HFS_ALTFLUSH
);
870 hfs_end_transaction(hfsmp
);
874 /* Initialize the vnode for virtual attribute data file */
875 result
= init_attrdata_vnode(hfsmp
);
877 printf("hfs_create_attr_btree: init_attrdata_vnode() error=%d\n", result
);
882 hfs_unlock(VTOC(vp
));
891 /* XXX need to give back blocks ? */
894 hfs_end_transaction(hfsmp
);
898 * All done, clear HFS_CREATING_BTREE, and wake up any sleepers.
900 lck_mtx_lock(&hfsmp
->hfs_mutex
);
901 hfsmp
->hfs_flags
&= ~HFS_CREATING_BTREE
;
902 wakeup((caddr_t
)hfsmp
->hfs_attribute_cp
);
903 lck_mtx_unlock(&hfsmp
->hfs_mutex
);